mindspore-1.10.0-cp39-cp39-win_amd64.whl → mindspore-2.0.0rc1-cp39-cp39-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release: this version of mindspore might be problematic.
- mindspore/.commit_id +1 -1
- mindspore/ConcurrencyCheck.dll +0 -0
- mindspore/CppBuildInsights.dll +0 -0
- mindspore/CppCoreCheck.dll +0 -0
- mindspore/EnumIndex.dll +0 -0
- mindspore/EspXEngine.dll +0 -0
- mindspore/HResultCheck.dll +0 -0
- mindspore/KernelTraceControl.dll +0 -0
- mindspore/LocalESPC.dll +0 -0
- mindspore/Microsoft.Diagnostics.Tracing.EventSource.dll +0 -0
- mindspore/Microsoft.VisualStudio.RemoteControl.dll +0 -0
- mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
- mindspore/Microsoft.VisualStudio.Utilities.Internal.dll +0 -0
- mindspore/Newtonsoft.Json.dll +0 -0
- mindspore/System.Runtime.CompilerServices.Unsafe.dll +0 -0
- mindspore/VariantClear.dll +0 -0
- mindspore/__init__.py +9 -4
- mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
- mindspore/_check_jit_forbidden_api.py +102 -0
- mindspore/_checkparam.py +1066 -1001
- mindspore/_extends/builtin_operations.py +32 -4
- mindspore/_extends/graph_kernel/model/graph_split.py +66 -222
- mindspore/_extends/parallel_compile/akg_compiler/akg_process.py +12 -9
- mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +119 -26
- mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +50 -50
- mindspore/_extends/parallel_compile/akg_compiler/util.py +9 -6
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_adapter.py +4 -25
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +9 -4
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_job_manager.py +1 -27
- mindspore/_extends/parse/__init__.py +5 -3
- mindspore/_extends/parse/namespace.py +17 -2
- mindspore/_extends/parse/parser.py +193 -34
- mindspore/_extends/parse/resources.py +7 -8
- mindspore/_extends/parse/standard_method.py +1780 -435
- mindspore/_extends/parse/trope.py +3 -1
- mindspore/amp.py +53 -58
- mindspore/atlprov.dll +0 -0
- mindspore/boost/adasum.py +3 -2
- mindspore/boost/boost.py +2 -2
- mindspore/boost/boost_cell_wrapper.py +46 -26
- mindspore/boost/dim_reduce.py +6 -5
- mindspore/boost/grad_accumulation.py +2 -1
- mindspore/boost/group_loss_scale_manager.py +1 -1
- mindspore/c1.dll +0 -0
- mindspore/c1xx.dll +0 -0
- mindspore/c2.dll +0 -0
- mindspore/cfgpersist.dll +0 -0
- mindspore/clang_rt.asan_dbg_dynamic-x86_64.dll +0 -0
- mindspore/clang_rt.asan_dynamic-x86_64.dll +0 -0
- mindspore/common/__init__.py +11 -10
- mindspore/common/_decorator.py +2 -0
- mindspore/common/_register_for_adapter.py +55 -0
- mindspore/common/_stub_tensor.py +201 -0
- mindspore/common/_utils.py +57 -0
- mindspore/common/api.py +582 -297
- mindspore/common/dtype.py +66 -18
- mindspore/common/dump.py +2 -2
- mindspore/common/initializer.py +38 -1
- mindspore/common/jit_config.py +25 -13
- mindspore/common/mutable.py +53 -24
- mindspore/common/parameter.py +60 -37
- mindspore/common/seed.py +8 -24
- mindspore/common/sparse_tensor.py +927 -0
- mindspore/common/tensor.py +1627 -3900
- mindspore/communication/__init__.py +10 -5
- mindspore/communication/_comm_helper.py +78 -214
- mindspore/communication/_hccl_management.py +2 -1
- mindspore/communication/management.py +136 -47
- mindspore/config/op_info.config +501 -1008
- mindspore/context.py +291 -56
- mindspore/d3dcompiler_47.dll +0 -0
- mindspore/dataset/__init__.py +12 -8
- mindspore/dataset/audio/__init__.py +9 -9
- mindspore/dataset/audio/transforms.py +1090 -228
- mindspore/dataset/audio/utils.py +87 -39
- mindspore/dataset/audio/validators.py +223 -1
- mindspore/dataset/callback/ds_callback.py +17 -15
- mindspore/dataset/core/config.py +246 -17
- mindspore/dataset/core/py_util_helpers.py +4 -3
- mindspore/dataset/core/validator_helpers.py +10 -10
- mindspore/{parallel/nn/layers.py → dataset/debug/__init__.py} +7 -8
- mindspore/dataset/debug/debug_hook.py +65 -0
- mindspore/dataset/debug/pre_defined_hook.py +67 -0
- mindspore/dataset/engine/__init__.py +7 -3
- mindspore/dataset/engine/cache_client.py +9 -9
- mindspore/dataset/engine/datasets.py +648 -477
- mindspore/dataset/engine/datasets_audio.py +165 -167
- mindspore/dataset/engine/datasets_standard_format.py +93 -67
- mindspore/dataset/engine/datasets_text.py +492 -342
- mindspore/dataset/engine/datasets_user_defined.py +85 -50
- mindspore/dataset/engine/datasets_vision.py +1224 -699
- mindspore/dataset/engine/graphdata.py +134 -69
- mindspore/dataset/engine/iterators.py +50 -9
- mindspore/dataset/engine/offload.py +52 -31
- mindspore/dataset/engine/samplers.py +27 -24
- mindspore/dataset/engine/serializer_deserializer.py +14 -15
- mindspore/dataset/engine/validators.py +213 -52
- mindspore/dataset/text/__init__.py +10 -8
- mindspore/dataset/text/transforms.py +152 -57
- mindspore/dataset/text/utils.py +98 -49
- mindspore/dataset/text/validators.py +25 -0
- mindspore/dataset/transforms/__init__.py +4 -2
- mindspore/dataset/transforms/c_transforms.py +11 -13
- mindspore/dataset/transforms/py_transforms.py +2 -2
- mindspore/dataset/transforms/py_transforms_util.py +10 -0
- mindspore/dataset/transforms/transforms.py +13 -15
- mindspore/dataset/transforms/validators.py +7 -7
- mindspore/dataset/utils/__init__.py +2 -1
- mindspore/dataset/utils/browse_dataset.py +13 -13
- mindspore/dataset/utils/line_reader.py +121 -0
- mindspore/dataset/vision/__init__.py +8 -7
- mindspore/dataset/vision/c_transforms.py +125 -126
- mindspore/dataset/vision/py_transforms.py +37 -37
- mindspore/dataset/vision/py_transforms_util.py +23 -20
- mindspore/dataset/vision/transforms.py +316 -315
- mindspore/dataset/vision/utils.py +313 -17
- mindspore/dataset/vision/validators.py +6 -6
- mindspore/default_config.py +0 -1
- mindspore/dpcmi.dll +0 -0
- mindspore/{compression → experimental}/__init__.py +6 -5
- mindspore/experimental/map_parameter.py +275 -0
- mindspore/include/OWNERS +0 -1
- mindspore/include/api/callback/callback.h +9 -13
- mindspore/include/api/callback/ckpt_saver.h +2 -2
- mindspore/include/api/callback/loss_monitor.h +2 -2
- mindspore/include/api/callback/lr_scheduler.h +5 -5
- mindspore/include/api/callback/time_monitor.h +2 -2
- mindspore/include/api/callback/train_accuracy.h +4 -6
- mindspore/include/api/cfg.h +19 -6
- mindspore/include/api/context.h +70 -9
- mindspore/include/api/delegate.h +8 -1
- mindspore/include/api/dual_abi_helper.h +8 -24
- mindspore/include/api/metrics/accuracy.h +2 -2
- mindspore/include/api/metrics/metrics.h +4 -3
- mindspore/include/api/model.h +9 -4
- mindspore/include/api/model_group.h +68 -0
- mindspore/include/api/model_parallel_runner.h +17 -17
- mindspore/include/api/net.h +12 -11
- mindspore/include/api/serialization.h +20 -4
- mindspore/include/api/status.h +7 -1
- mindspore/include/api/types.h +25 -21
- mindspore/include/api/visible.h +4 -0
- mindspore/include/c_api/model_c.h +5 -0
- mindspore/include/c_api/status_c.h +1 -1
- mindspore/include/dataset/config.h +1 -1
- mindspore/include/dataset/constants.h +14 -0
- mindspore/include/dataset/text.h +59 -0
- mindspore/include/dataset/vision.h +56 -117
- mindspore/include/dataset/vision_lite.h +102 -0
- mindspore/jpeg62.dll +0 -0
- mindspore/log.py +28 -28
- mindspore/mindrecord/common/exceptions.py +2 -4
- mindspore/mindrecord/filereader.py +19 -1
- mindspore/mindrecord/filewriter.py +250 -88
- mindspore/mindrecord/mindpage.py +13 -13
- mindspore/mindrecord/shardheader.py +15 -15
- mindspore/mindrecord/shardreader.py +9 -0
- mindspore/mindrecord/shardwriter.py +29 -29
- mindspore/mindrecord/tools/cifar100_to_mr.py +9 -9
- mindspore/mindrecord/tools/cifar10_to_mr.py +9 -9
- mindspore/mindrecord/tools/csv_to_mr.py +4 -4
- mindspore/mindrecord/tools/imagenet_to_mr.py +70 -65
- mindspore/mindrecord/tools/mnist_to_mr.py +41 -41
- mindspore/mindrecord/tools/tfrecord_to_mr.py +6 -6
- mindspore/{libmindspore_backend.dll → mindspore_backend.dll} +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_shared_lib.dll +0 -0
- mindspore/msobj140.dll +0 -0
- mindspore/mspdb140.dll +0 -0
- mindspore/mspdbcore.dll +0 -0
- mindspore/mspdbst.dll +0 -0
- mindspore/mspft140.dll +0 -0
- mindspore/msvcdis140.dll +0 -0
- mindspore/msvcp140_1.dll +0 -0
- mindspore/msvcp140_2.dll +0 -0
- mindspore/msvcp140_atomic_wait.dll +0 -0
- mindspore/msvcp140_codecvt_ids.dll +0 -0
- mindspore/nn/__init__.py +1 -5
- mindspore/nn/cell.py +297 -234
- mindspore/nn/dynamic_lr.py +1 -1
- mindspore/nn/grad/cell_grad.py +17 -42
- mindspore/nn/layer/__init__.py +7 -4
- mindspore/nn/layer/activation.py +131 -88
- mindspore/nn/layer/basic.py +313 -613
- mindspore/nn/layer/channel_shuffle.py +103 -0
- mindspore/nn/layer/combined.py +1 -1
- mindspore/nn/layer/container.py +52 -6
- mindspore/nn/layer/conv.py +112 -43
- mindspore/nn/layer/dense.py +10 -9
- mindspore/nn/layer/embedding.py +36 -34
- mindspore/nn/layer/image.py +123 -27
- mindspore/nn/layer/math.py +108 -107
- mindspore/nn/layer/normalization.py +212 -366
- mindspore/nn/layer/padding.py +370 -42
- mindspore/nn/layer/pooling.py +1443 -219
- mindspore/nn/layer/rnn_cells.py +11 -16
- mindspore/nn/layer/rnns.py +38 -39
- mindspore/nn/layer/thor_layer.py +24 -25
- mindspore/nn/layer/timedistributed.py +5 -5
- mindspore/nn/layer/transformer.py +701 -0
- mindspore/nn/learning_rate_schedule.py +8 -8
- mindspore/nn/loss/__init__.py +9 -6
- mindspore/nn/loss/loss.py +678 -142
- mindspore/nn/metrics.py +53 -0
- mindspore/nn/optim/_dist_optimizer_registry.py +2 -2
- mindspore/nn/optim/ada_grad.py +8 -8
- mindspore/nn/optim/adadelta.py +2 -3
- mindspore/nn/optim/adafactor.py +18 -14
- mindspore/nn/optim/adam.py +429 -87
- mindspore/nn/optim/adamax.py +5 -6
- mindspore/nn/optim/adasum.py +10 -8
- mindspore/nn/optim/asgd.py +7 -7
- mindspore/nn/optim/ftrl.py +81 -11
- mindspore/nn/optim/lamb.py +7 -8
- mindspore/nn/optim/lars.py +4 -4
- mindspore/nn/optim/lazyadam.py +82 -7
- mindspore/nn/optim/momentum.py +8 -7
- mindspore/nn/optim/optimizer.py +19 -10
- mindspore/nn/optim/proximal_ada_grad.py +6 -5
- mindspore/nn/optim/rmsprop.py +3 -3
- mindspore/nn/optim/rprop.py +20 -16
- mindspore/nn/optim/sgd.py +21 -15
- mindspore/nn/optim/thor.py +23 -21
- mindspore/nn/probability/__init__.py +0 -2
- mindspore/nn/probability/bijector/bijector.py +7 -6
- mindspore/nn/probability/bijector/invert.py +4 -2
- mindspore/nn/probability/bijector/softplus.py +2 -2
- mindspore/nn/probability/bnn_layers/dense_variational.py +1 -1
- mindspore/nn/probability/bnn_layers/layer_distribution.py +2 -2
- mindspore/nn/probability/distribution/__init__.py +6 -0
- mindspore/nn/probability/distribution/_utils/custom_ops.py +3 -2
- mindspore/nn/probability/distribution/_utils/utils.py +11 -17
- mindspore/nn/probability/distribution/bernoulli.py +6 -6
- mindspore/nn/probability/distribution/beta.py +1 -1
- mindspore/nn/probability/distribution/categorical.py +9 -9
- mindspore/nn/probability/distribution/cauchy.py +8 -8
- mindspore/nn/probability/distribution/distribution.py +12 -6
- mindspore/nn/probability/distribution/exponential.py +5 -5
- mindspore/nn/probability/distribution/gamma.py +3 -3
- mindspore/nn/probability/distribution/geometric.py +6 -5
- mindspore/nn/probability/distribution/gumbel.py +5 -5
- mindspore/nn/probability/distribution/half_normal.py +133 -0
- mindspore/nn/probability/distribution/laplace.py +128 -0
- mindspore/nn/probability/distribution/log_normal.py +0 -1
- mindspore/nn/probability/distribution/logistic.py +4 -5
- mindspore/nn/probability/distribution/normal.py +11 -15
- mindspore/nn/probability/distribution/poisson.py +6 -2
- mindspore/nn/probability/distribution/student_t.py +150 -0
- mindspore/nn/probability/distribution/transformed_distribution.py +4 -4
- mindspore/nn/probability/distribution/uniform.py +5 -5
- mindspore/nn/reinforcement/_tensors_queue.py +3 -3
- mindspore/nn/reinforcement/tensor_array.py +2 -2
- mindspore/nn/sparse/sparse.py +8 -1
- mindspore/nn/wrap/cell_wrapper.py +55 -27
- mindspore/nn/wrap/grad_reducer.py +20 -11
- mindspore/nn/wrap/loss_scale.py +47 -30
- mindspore/numpy/array_creations.py +33 -22
- mindspore/numpy/array_ops.py +46 -42
- mindspore/numpy/logic_ops.py +6 -27
- mindspore/numpy/math_ops.py +26 -19
- mindspore/numpy/utils.py +1 -8
- mindspore/numpy/utils_const.py +112 -62
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/opencv_imgproc452.dll +0 -0
- mindspore/ops/__init__.py +6 -3
- mindspore/ops/_constants.py +0 -6
- mindspore/ops/_grad/__init__.py +2 -1
- mindspore/ops/_grad/grad_array_ops.py +209 -152
- mindspore/ops/_grad/grad_base.py +55 -17
- mindspore/ops/_grad/grad_clip_ops.py +11 -3
- mindspore/ops/_grad/grad_comm_ops.py +58 -47
- mindspore/ops/_grad/grad_implementations.py +21 -61
- mindspore/ops/_grad/grad_inner_ops.py +48 -6
- mindspore/ops/_grad/grad_math_ops.py +306 -161
- mindspore/ops/_grad/grad_nn_ops.py +192 -181
- mindspore/ops/_grad/grad_other_ops.py +1 -1
- mindspore/ops/_grad/grad_quant_ops.py +5 -5
- mindspore/ops/_grad/grad_sequence_ops.py +296 -0
- mindspore/ops/_grad/grad_sparse.py +15 -9
- mindspore/ops/_grad_experimental/__init__.py +1 -0
- mindspore/ops/_grad_experimental/grad_array_ops.py +441 -55
- mindspore/ops/_grad_experimental/grad_image_ops.py +25 -7
- mindspore/ops/_grad_experimental/grad_inner_ops.py +3 -44
- mindspore/ops/_grad_experimental/grad_linalg_ops.py +16 -21
- mindspore/ops/_grad_experimental/grad_math_ops.py +979 -49
- mindspore/ops/_grad_experimental/grad_nn_ops.py +78 -8
- mindspore/ops/_grad_experimental/grad_scalar_ops.py +112 -0
- mindspore/ops/_grad_experimental/grad_sparse_ops.py +197 -13
- mindspore/ops/_op_impl/__init__.py +3 -3
- mindspore/ops/_op_impl/_custom_op/__init__.py +0 -1
- mindspore/ops/_op_impl/_custom_op/_basic.py +0 -1
- mindspore/ops/_op_impl/_custom_op/batch_matmul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold.py +4 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad_reduce.py +5 -5
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold_grad.py +3 -3
- mindspore/ops/_op_impl/_custom_op/cholesky_trsm_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/correction_mul.py +3 -3
- mindspore/ops/_op_impl/_custom_op/correction_mul_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/dsd_back_impl.py +4 -8
- mindspore/ops/_op_impl/_custom_op/dsd_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fused_abs_max1_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/img2col_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_left_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_right_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_left_cast_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_right_mul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_dds_grad_impl.py +0 -1
- mindspore/ops/_op_impl/_custom_op/matmul_dds_impl.py +0 -1
- mindspore/ops/_op_impl/_custom_op/matrix_combine_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/minmax_update_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/minmax_update_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/transpose02314_impl.py +1 -1
- mindspore/ops/_op_impl/aicpu/__init__.py +238 -3
- mindspore/ops/_op_impl/aicpu/abs.py +36 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d.py +34 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_3d.py +39 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_3d_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_2d_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_3d.py +42 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_3d_grad.py +152 -0
- mindspore/ops/_op_impl/aicpu/add.py +43 -0
- mindspore/ops/_op_impl/aicpu/addcdiv.py +0 -32
- mindspore/ops/_op_impl/aicpu/addcmul.py +0 -84
- mindspore/ops/_op_impl/aicpu/affine_grid_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/arg_max.py +75 -0
- mindspore/ops/_op_impl/aicpu/arg_min.py +75 -0
- mindspore/ops/_op_impl/aicpu/argmin_with_value.py +43 -0
- mindspore/ops/_op_impl/aicpu/batch_matmul.py +43 -0
- mindspore/ops/_op_impl/aicpu/batch_norm_grad_grad.py +49 -0
- mindspore/ops/_op_impl/aicpu/bernoulli.py +48 -0
- mindspore/ops/_op_impl/aicpu/bessel_i0.py +31 -0
- mindspore/ops/_op_impl/aicpu/bias_add.py +44 -0
- mindspore/ops/_op_impl/aicpu/bias_add_grad.py +43 -0
- mindspore/ops/_op_impl/aicpu/bincount.py +33 -0
- mindspore/{nn/probability/infer/variational/__init__.py → ops/_op_impl/aicpu/cauchy.py} +17 -10
- mindspore/ops/_op_impl/aicpu/channel_shuffle.py +40 -0
- mindspore/ops/_op_impl/aicpu/cholesky.py +1 -1
- mindspore/ops/_op_impl/{cpu/bias_add.py → aicpu/choleskygrad.py} +9 -7
- mindspore/ops/_op_impl/aicpu/combined_non_max_suppression.py +42 -0
- mindspore/ops/_op_impl/aicpu/concat_offset.py +42 -0
- mindspore/ops/_op_impl/aicpu/concat_offset_v1.py +31 -0
- mindspore/ops/_op_impl/aicpu/conj.py +11 -0
- mindspore/ops/_op_impl/aicpu/crop_and_resize_grad_image.py +38 -0
- mindspore/ops/_op_impl/aicpu/cumulative_logsumexp.py +36 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets.py +38 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets_grad.py +2 -2
- mindspore/ops/_op_impl/aicpu/dense_to_sparse_set_operation.py +48 -0
- mindspore/ops/_op_impl/aicpu/diag.py +36 -0
- mindspore/ops/_op_impl/aicpu/diag_part.py +36 -0
- mindspore/ops/_op_impl/aicpu/diagonal.py +35 -0
- mindspore/ops/_op_impl/{cpu/bias_add_grad.py → aicpu/digamma.py} +9 -7
- mindspore/ops/_op_impl/aicpu/eig.py +35 -0
- mindspore/ops/_op_impl/aicpu/fft_with_size.py +41 -0
- mindspore/ops/_op_impl/aicpu/flatten.py +1 -0
- mindspore/ops/_op_impl/aicpu/fmax.py +36 -0
- mindspore/ops/_op_impl/aicpu/fmin.py +37 -0
- mindspore/ops/_op_impl/aicpu/fractional_max_pool3d_with_fixed_ksize.py +1 -1
- mindspore/ops/_op_impl/aicpu/fse_decode.py +43 -0
- mindspore/ops/_op_impl/aicpu/glu.py +33 -0
- mindspore/ops/_op_impl/aicpu/glu_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/greater.py +41 -0
- mindspore/ops/_op_impl/aicpu/greater_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/index_put.py +50 -0
- mindspore/ops/_op_impl/{tbe/scatter_add_ds.py → aicpu/inplace_index_add.py} +17 -21
- mindspore/ops/_op_impl/aicpu/instance_norm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/instance_norm_v2_grad.py +44 -0
- mindspore/ops/_op_impl/aicpu/layer_norm_grad_grad.py +47 -0
- mindspore/ops/_op_impl/aicpu/less.py +41 -0
- mindspore/ops/_op_impl/aicpu/less_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/lgamma.py +32 -0
- mindspore/ops/_op_impl/aicpu/log_normal_reverse.py +33 -0
- mindspore/ops/_op_impl/aicpu/logit.py +33 -0
- mindspore/ops/_op_impl/aicpu/logit_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/masked_fill.py +42 -0
- mindspore/ops/_op_impl/aicpu/masked_scatter.py +39 -0
- mindspore/ops/_op_impl/aicpu/matmul.py +39 -0
- mindspore/ops/_op_impl/aicpu/matrix_logarithm.py +31 -0
- mindspore/ops/_op_impl/aicpu/matrix_power.py +32 -0
- mindspore/ops/_op_impl/aicpu/matrix_solve_ls.py +36 -0
- mindspore/ops/_op_impl/aicpu/matrix_triangular_solve.py +36 -0
- mindspore/ops/_op_impl/aicpu/mirror_pad.py +2 -0
- mindspore/ops/_op_impl/aicpu/mirror_pad_grad.py +0 -4
- mindspore/ops/_op_impl/aicpu/mul.py +3 -1
- mindspore/ops/_op_impl/aicpu/multinomial.py +14 -6
- mindspore/ops/_op_impl/aicpu/multinomial_with_replacement.py +35 -0
- mindspore/ops/_op_impl/aicpu/nan_to_num.py +34 -0
- mindspore/ops/_op_impl/aicpu/nllloss.py +38 -0
- mindspore/ops/_op_impl/aicpu/nllloss_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/ones_like.py +0 -2
- mindspore/ops/_op_impl/aicpu/polar.py +32 -0
- mindspore/ops/_op_impl/aicpu/polygamma.py +34 -0
- mindspore/ops/_op_impl/aicpu/qr.py +36 -0
- mindspore/ops/_op_impl/aicpu/quant_dtype_cast.py +40 -0
- mindspore/ops/_op_impl/aicpu/quantile.py +35 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_sparse.py +73 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_tensor.py +74 -0
- mindspore/ops/_op_impl/aicpu/random_shuffle.py +3 -0
- mindspore/ops/_op_impl/aicpu/randperm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/range.py +36 -0
- mindspore/ops/_op_impl/aicpu/reciprocal.py +34 -0
- mindspore/ops/_op_impl/aicpu/reciprocal_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/reduce_sum.py +57 -0
- mindspore/ops/_op_impl/aicpu/resize_bicubic.py +2 -8
- mindspore/ops/_op_impl/aicpu/resize_bicubic_grad.py +1 -1
- mindspore/ops/_op_impl/aicpu/resize_v2.py +68 -0
- mindspore/ops/_op_impl/aicpu/resize_v2_grad.py +68 -0
- mindspore/ops/_op_impl/aicpu/scatter_elements.py +4 -0
- mindspore/ops/_op_impl/aicpu/scatter_nd_update.py +2 -0
- mindspore/ops/_op_impl/aicpu/search_sorted.py +12 -6
- mindspore/ops/_op_impl/aicpu/self_adjoint_eig.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add_offset.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_addn.py +38 -0
- mindspore/ops/_op_impl/aicpu/slice_grad.py +76 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss.py +35 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/sort.py +39 -0
- mindspore/ops/_op_impl/aicpu/sparse_apply_adagrad_da.py +0 -24
- mindspore/ops/_op_impl/aicpu/sparse_cross.py +42 -0
- mindspore/ops/_op_impl/aicpu/sparse_fill_empty_rows.py +63 -0
- mindspore/ops/_op_impl/aicpu/sparse_fill_empty_rows_grad.py +45 -0
- mindspore/ops/_op_impl/aicpu/sparse_matrix_mat_mul.py +56 -0
- mindspore/ops/_op_impl/{tbe/slice_ds.py → aicpu/sparse_segment_sum.py} +16 -24
- mindspore/ops/_op_impl/aicpu/sparse_segment_sum_with_num_segments.py +68 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice.py +63 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice_grad.py +61 -0
- mindspore/ops/_op_impl/aicpu/squared_difference.py +2 -0
- mindspore/ops/_op_impl/aicpu/strided_slice_v2.py +93 -0
- mindspore/ops/_op_impl/aicpu/strided_slice_v2_grad.py +66 -0
- mindspore/ops/_op_impl/aicpu/tensor_scatter_update.py +59 -0
- mindspore/ops/_op_impl/{tbe/gather_v2.py → aicpu/tile.py} +24 -24
- mindspore/ops/_op_impl/aicpu/tridiagonal_solve.py +35 -0
- mindspore/ops/_op_impl/aicpu/tril_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/triu_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform_candidate_sampler.py +1 -0
- mindspore/ops/_op_impl/aicpu/unique_consecutive.py +10 -2
- mindspore/ops/_op_impl/cpu/__init__.py +1 -2
- mindspore/ops/_op_impl/cpu/dynamic_shape.py +5 -1
- mindspore/ops/_op_impl/cpu/maximum_grad.py +2 -0
- mindspore/{compression/common/__init__.py → ops/_op_impl/cpu/pyexecute.py} +13 -8
- mindspore/ops/_op_impl/cpu/reduce_sum.py +8 -0
- mindspore/ops/_op_impl/cpu/sparse_slice.py +62 -0
- mindspore/ops/_op_impl/cpu/sparse_slice_grad.py +60 -0
- mindspore/ops/_op_impl/cpu/tensor_shape.py +5 -1
- mindspore/ops/_op_impl/tbe/__init__.py +27 -608
- mindspore/ops/_op_impl/tbe/addcdiv_ds.py +42 -0
- mindspore/ops/_op_impl/tbe/addcmul_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/assign_add_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/avg_pool_3d_grad.py +1 -1
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_c_state_grad_v2.py +0 -1
- mindspore/ops/_op_impl/tbe/batch_to_space.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd_v2.py +41 -0
- mindspore/ops/_op_impl/tbe/bce_with_logits_loss.py +1 -0
- mindspore/ops/_op_impl/tbe/bias_add_grad.py +2 -0
- mindspore/ops/_op_impl/tbe/bn_infer_grad.py +4 -2
- mindspore/ops/_op_impl/tbe/bn_infer_grad_ds.py +40 -0
- mindspore/ops/_op_impl/tbe/bn_training_update.py +0 -1
- mindspore/ops/_op_impl/tbe/bn_training_update_ds.py +0 -1
- mindspore/ops/_op_impl/tbe/broadcast_to_ds.py +6 -4
- mindspore/ops/_op_impl/tbe/cast.py +0 -2
- mindspore/ops/_op_impl/tbe/cast_ds.py +3 -3
- mindspore/ops/_op_impl/tbe/ctc_loss_v2.py +0 -2
- mindspore/ops/_op_impl/tbe/ctc_loss_v2_grad.py +0 -2
- mindspore/ops/_op_impl/tbe/data_format_dim_map_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/deformable_offsets.py +1 -0
- mindspore/ops/_op_impl/tbe/depthwise_conv2d.py +1 -1
- mindspore/ops/_op_impl/tbe/dynamic_atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/gather_nd.py +1 -0
- mindspore/ops/_op_impl/tbe/greater.py +2 -0
- mindspore/ops/_op_impl/tbe/{index_add.py → inplace_index_add.py} +3 -6
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop_v2.py +0 -1
- mindspore/ops/_op_impl/tbe/npu_clear_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/npu_get_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/one_hot_ds.py +0 -6
- mindspore/ops/_op_impl/tbe/{greater_ds.py → reduce_all_ds.py} +13 -16
- mindspore/ops/_op_impl/tbe/reduce_any_ds.py +39 -0
- mindspore/ops/_op_impl/tbe/roi_align_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/roi_align_grad_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/scatter_add.py +2 -0
- mindspore/ops/_op_impl/tbe/scatter_nd_add.py +2 -2
- mindspore/ops/_op_impl/tbe/slice.py +26 -15
- mindspore/ops/_op_impl/tbe/space_to_batch.py +1 -1
- mindspore/ops/_op_impl/tbe/space_to_batch_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/strided_slice_grad_d.py +1 -0
- mindspore/ops/_op_impl/tbe/trans_data_ds.py +15 -5
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum.py +1 -1
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum_ds.py +2 -0
- mindspore/ops/_primitive_cache.py +3 -2
- mindspore/ops/_register_for_op.py +11 -0
- mindspore/ops/_utils/__init__.py +1 -1
- mindspore/ops/_utils/utils.py +20 -41
- mindspore/ops/_vmap/__init__.py +2 -2
- mindspore/ops/_vmap/vmap_array_ops.py +170 -78
- mindspore/ops/_vmap/vmap_base.py +24 -10
- mindspore/ops/_vmap/vmap_convolution_ops.py +7 -10
- mindspore/ops/_vmap/vmap_grad_math_ops.py +4 -4
- mindspore/ops/_vmap/vmap_grad_nn_ops.py +41 -9
- mindspore/ops/_vmap/vmap_image_ops.py +52 -0
- mindspore/ops/_vmap/vmap_math_ops.py +77 -6
- mindspore/ops/_vmap/vmap_nn_ops.py +78 -29
- mindspore/ops/_vmap/vmap_other_ops.py +3 -1
- mindspore/ops/_vmap/vmap_random_ops.py +55 -3
- mindspore/ops/_vmap/vmap_sparse_ops.py +1 -0
- mindspore/ops/bprop_mindir/AdaptiveAvgPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/AdaptiveMaxPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ApproximateEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Argmax_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/Argmin_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/AssignSub_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/Assign_bprop.mindir +16 -16
- mindspore/ops/bprop_mindir/AvgPool3D_bprop.mindir +150 -0
- mindspore/ops/bprop_mindir/AvgPool_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/BCEWithLogitsLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BNTrainingReduce_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/BatchNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BatchToSpaceND_bprop.mindir +28 -0
- mindspore/ops/bprop_mindir/BiasAddGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BinaryCrossEntropy_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/BroadcastTo_bprop.mindir +306 -0
- mindspore/ops/bprop_mindir/Broadcast_bprop.mindir +12 -8
- mindspore/ops/bprop_mindir/CTCLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Concat_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropFilter_bprop.mindir +240 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropInput_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv2DTranspose_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv3DTranspose_bprop.mindir +315 -0
- mindspore/ops/bprop_mindir/Conv3D_bprop.mindir +278 -0
- mindspore/ops/bprop_mindir/DType_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/DeformableOffsets_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/Depend_bprop.mindir +12 -13
- mindspore/ops/bprop_mindir/DepthToSpace_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/DepthwiseConv2dNative_bprop.mindir +138 -0
- mindspore/ops/bprop_mindir/DiagPart_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/Dropout2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Dropout3D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DropoutDoMask_bprop.mindir +22 -24
- mindspore/ops/bprop_mindir/DropoutGenMask_bprop.mindir +16 -14
- mindspore/ops/bprop_mindir/DropoutGrad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Dropout_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicGRUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicRNN_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicShape_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/Elu_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/EmbeddingLookup_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Equal_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/ExpandDims_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/FastGeLU_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Flatten_bprop.mindir +54 -0
- mindspore/ops/bprop_mindir/FloorDiv_bprop.mindir +18 -15
- mindspore/ops/bprop_mindir/GatherD_bprop.mindir +26 -0
- mindspore/ops/bprop_mindir/GatherNd_bprop.mindir +57 -0
- mindspore/ops/bprop_mindir/Gather_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/GreaterEqual_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/Greater_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/HSigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/HSwish_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/IOU_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/InstanceNorm_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/IsFinite_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/IsInf_bprop.mindir +13 -10
- mindspore/ops/bprop_mindir/IsNan_bprop.mindir +14 -11
- mindspore/ops/bprop_mindir/KLDivLoss_bprop.mindir +126 -0
- mindspore/ops/bprop_mindir/L2Loss_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/L2Normalize_bprop.mindir +30 -0
- mindspore/ops/bprop_mindir/LRN_bprop.mindir +43 -0
- mindspore/ops/bprop_mindir/LayerNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/LessEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Less_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/LinSpace_bprop.mindir +22 -19
- mindspore/ops/bprop_mindir/Load_bprop.mindir +12 -13
- mindspore/ops/bprop_mindir/LogSoftmax_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/LogicalAnd_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/LogicalNot_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/MaskedSelect_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/MaxPool3DGradGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3DGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3D_bprop.mindir +75 -0
- mindspore/ops/bprop_mindir/MaxPoolGradGrad_bprop.mindir +65 -0
- mindspore/ops/bprop_mindir/MaxPoolWithArgmax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Maximum_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Minimum_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/MirrorPad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Mish_bprop.mindir +35 -0
- mindspore/ops/bprop_mindir/MulNoNan_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NLLLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NonZero_bprop.mindir +14 -0
- mindspore/ops/bprop_mindir/NotEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/OneHot_bprop.mindir +25 -23
- mindspore/ops/bprop_mindir/OnesLike_bprop.mindir +13 -13
- mindspore/ops/bprop_mindir/PReLU_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Pad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Padding_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/RNNTLoss_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ROIAlign_bprop.mindir +82 -0
- mindspore/ops/bprop_mindir/Range_bprop.mindir +21 -19
- mindspore/ops/bprop_mindir/Rank_bprop.mindir +11 -11
- mindspore/ops/bprop_mindir/ReLU6_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/ReLUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ReduceAll_bprop.mindir +18 -17
- mindspore/ops/bprop_mindir/ReduceAny_bprop.mindir +18 -17
- mindspore/ops/bprop_mindir/ReluGrad_bprop.mindir +19 -23
- mindspore/ops/bprop_mindir/Reshape_bprop.mindir +60 -0
- mindspore/ops/bprop_mindir/ResizeBilinear_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ResizeNearestNeighbor_bprop.mindir +89 -0
- mindspore/ops/bprop_mindir/ReverseSequence_bprop.mindir +52 -0
- mindspore/ops/bprop_mindir/ReverseV2_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/Round_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/ScatterMax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ScatterMin_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ScatterNdUpdate_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/ScatterNd_bprop.mindir +24 -0
- mindspore/ops/bprop_mindir/ScatterNonAliasingAdd_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/ScatterUpdate_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SeLU_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/Select_bprop.mindir +30 -34
- mindspore/ops/bprop_mindir/Shape_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/SigmoidCrossEntropyWithLogits_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/SigmoidGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Sigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Sign_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/Slice_bprop.mindir +26 -0
- mindspore/ops/bprop_mindir/SmoothL1Loss_bprop.mindir +36 -0
- mindspore/ops/bprop_mindir/SoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Softplus_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Softsign_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/Sort_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SpaceToBatchND_bprop.mindir +28 -0
- mindspore/ops/bprop_mindir/SpaceToDepth_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/SparseGatherV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SparseSoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Split_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/Squeeze_bprop.mindir +54 -0
- mindspore/ops/bprop_mindir/StridedSliceGrad_bprop.mindir +95 -0
- mindspore/ops/bprop_mindir/StridedSlice_bprop.mindir +98 -0
- mindspore/ops/bprop_mindir/Switch_bprop.mindir +28 -32
- mindspore/ops/bprop_mindir/TanhGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Tanh_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/TensorScatterAdd_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/TensorScatterUpdate_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/TensorShape_bprop.mindir +14 -0
- mindspore/ops/bprop_mindir/Tile_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TopK_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TransShape_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/TruncateDiv_bprop.mindir +18 -15
- mindspore/ops/bprop_mindir/TupleGetItem_bprop.mindir +11 -13
- mindspore/ops/bprop_mindir/Unique_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Unstack_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/UpsampleNearest3D_bprop.mindir +32 -0
- mindspore/ops/bprop_mindir/UpsampleTrilinear3D_bprop.mindir +38 -0
- mindspore/ops/bprop_mindir/ZerosLike_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/__init__.py +1 -4
- mindspore/ops/bprop_mindir/generate_mindir.py +32 -20
- mindspore/ops/composite/__init__.py +12 -13
- mindspore/ops/composite/base.py +261 -254
- mindspore/ops/composite/env_ops.py +41 -0
- mindspore/ops/composite/math_ops.py +197 -156
- mindspore/ops/composite/multitype_ops/_compile_utils.py +428 -176
- mindspore/ops/composite/multitype_ops/_constexpr_utils.py +188 -87
- mindspore/ops/composite/multitype_ops/add_impl.py +23 -1
- mindspore/ops/composite/multitype_ops/div_impl.py +3 -3
- mindspore/ops/composite/multitype_ops/equal_impl.py +1 -0
- mindspore/ops/composite/multitype_ops/floordiv_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/getitem_impl.py +52 -5
- mindspore/ops/composite/multitype_ops/greater_equal_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/greater_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/in_impl.py +15 -3
- mindspore/ops/composite/multitype_ops/less_equal_impl.py +33 -2
- mindspore/ops/composite/multitype_ops/less_impl.py +33 -0
- mindspore/ops/composite/multitype_ops/logical_and_impl.py +2 -2
- mindspore/ops/composite/multitype_ops/logical_or_impl.py +2 -1
- mindspore/ops/composite/multitype_ops/mod_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/mul_impl.py +21 -7
- mindspore/ops/composite/multitype_ops/not_in_impl.py +15 -3
- mindspore/ops/composite/multitype_ops/ones_like_impl.py +2 -4
- mindspore/ops/composite/multitype_ops/pow_impl.py +1 -0
- mindspore/ops/composite/multitype_ops/setitem_impl.py +62 -70
- mindspore/ops/composite/multitype_ops/sub_impl.py +3 -3
- mindspore/ops/composite/multitype_ops/zeros_like_impl.py +41 -4
- mindspore/ops/function/__init__.py +323 -8
- mindspore/ops/function/array_func.py +3511 -780
- mindspore/ops/function/clip_func.py +329 -0
- mindspore/ops/function/debug_func.py +6 -6
- mindspore/ops/function/grad/__init__.py +5 -1
- mindspore/ops/function/grad/grad_func.py +736 -65
- mindspore/ops/function/image_func.py +270 -0
- mindspore/ops/function/linalg_func.py +268 -8
- mindspore/ops/function/math_func.py +8032 -3164
- mindspore/ops/function/nn_func.py +5619 -1855
- mindspore/ops/function/other_func.py +115 -0
- mindspore/ops/function/parameter_func.py +11 -10
- mindspore/ops/function/random_func.py +939 -77
- mindspore/ops/function/sparse_func.py +249 -84
- mindspore/ops/function/sparse_unary_func.py +2303 -0
- mindspore/ops/function/spectral_func.py +146 -0
- mindspore/ops/function/vmap_func.py +114 -0
- mindspore/ops/functional.py +182 -254
- mindspore/ops/op_info_register.py +79 -34
- mindspore/ops/operations/__init__.py +210 -118
- mindspore/ops/operations/_csr_ops.py +7 -7
- mindspore/ops/operations/_embedding_cache_ops.py +25 -15
- mindspore/ops/operations/_grad_ops.py +447 -322
- mindspore/ops/operations/_inner_ops.py +547 -176
- mindspore/ops/operations/_map_tensor_ops.py +112 -0
- mindspore/ops/operations/_ms_kernel.py +29 -27
- mindspore/ops/operations/_ocr_ops.py +11 -11
- mindspore/ops/operations/_opaque_predicate_registry.py +41 -0
- mindspore/ops/operations/_quant_ops.py +186 -101
- mindspore/ops/operations/_rl_inner_ops.py +122 -61
- mindspore/ops/operations/_scalar_ops.py +466 -0
- mindspore/ops/operations/_sequence_ops.py +1047 -0
- mindspore/ops/operations/_tensor_array.py +10 -11
- mindspore/ops/operations/_thor_ops.py +4 -4
- mindspore/ops/operations/array_ops.py +1428 -1226
- mindspore/ops/operations/comm_ops.py +180 -117
- mindspore/ops/operations/control_ops.py +4 -2
- mindspore/ops/operations/custom_ops.py +185 -98
- mindspore/ops/operations/debug_ops.py +92 -54
- mindspore/ops/operations/image_ops.py +406 -211
- mindspore/ops/operations/inner_ops.py +42 -53
- mindspore/ops/operations/linalg_ops.py +32 -29
- mindspore/ops/operations/math_ops.py +2076 -897
- mindspore/ops/operations/nn_ops.py +1282 -1252
- mindspore/ops/operations/other_ops.py +124 -278
- mindspore/ops/operations/random_ops.py +345 -178
- mindspore/ops/operations/rl_ops.py +8 -9
- mindspore/ops/operations/sparse_ops.py +502 -157
- mindspore/ops/operations/spectral_ops.py +107 -0
- mindspore/ops/primitive.py +192 -15
- mindspore/ops/vm_impl_registry.py +23 -2
- mindspore/parallel/__init__.py +6 -1
- mindspore/parallel/_auto_parallel_context.py +199 -92
- mindspore/parallel/_cell_wrapper.py +4 -2
- mindspore/parallel/_cost_model_context.py +3 -0
- mindspore/parallel/_dp_allreduce_fusion.py +2 -1
- mindspore/parallel/_offload_context.py +185 -0
- mindspore/parallel/_parallel_serialization.py +167 -28
- mindspore/parallel/_ps_context.py +9 -5
- mindspore/parallel/_recovery_context.py +1 -1
- mindspore/parallel/_tensor.py +9 -1
- mindspore/{nn/transformer → parallel/_transformer}/__init__.py +6 -6
- mindspore/{nn/transformer → parallel/_transformer}/layers.py +59 -37
- mindspore/{nn/transformer → parallel/_transformer}/loss.py +4 -7
- mindspore/{nn/transformer → parallel/_transformer}/moe.py +160 -35
- mindspore/{nn/transformer → parallel/_transformer}/op_parallel_config.py +3 -3
- mindspore/{nn/transformer → parallel/_transformer}/transformer.py +235 -196
- mindspore/parallel/_utils.py +47 -7
- mindspore/parallel/algo_parameter_config.py +5 -1
- mindspore/parallel/checkpoint_transform.py +329 -0
- mindspore/parallel/shard.py +229 -0
- mindspore/perf_msvcbuildinsights.dll +0 -0
- mindspore/pgodb140.dll +0 -0
- mindspore/pgort140.dll +0 -0
- mindspore/profiler/__init__.py +2 -1
- mindspore/profiler/common/util.py +4 -3
- mindspore/profiler/common/validator/validate_path.py +2 -2
- mindspore/profiler/envprofiling.py +249 -0
- mindspore/profiler/parser/aicpu_data_parser.py +38 -39
- mindspore/profiler/parser/ascend_timeline_generator.py +497 -0
- mindspore/profiler/parser/base_timeline_generator.py +471 -0
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +684 -0
- mindspore/profiler/parser/framework_parser.py +42 -16
- mindspore/profiler/parser/hccl_parser.py +158 -158
- mindspore/profiler/parser/hwts_log_parser.py +7 -6
- mindspore/profiler/parser/integrator.py +18 -1579
- mindspore/profiler/parser/minddata_analyzer.py +8 -8
- mindspore/profiler/parser/msadvisor_analyzer.py +14 -27
- mindspore/profiler/parser/msadvisor_parser.py +2 -4
- mindspore/profiler/parser/optime_parser.py +17 -18
- mindspore/profiler/parser/profiler_info.py +108 -0
- mindspore/profiler/parser/step_trace_parser.py +1 -1
- mindspore/profiler/profiling.py +396 -194
- mindspore/rewrite/__init__.py +6 -2
- mindspore/rewrite/api/node.py +51 -110
- mindspore/rewrite/api/node_type.py +10 -6
- mindspore/rewrite/api/pattern_engine.py +51 -7
- mindspore/rewrite/api/scoped_value.py +64 -53
- mindspore/rewrite/api/symbol_tree.py +108 -61
- mindspore/rewrite/api/tree_node_helper.py +2 -3
- mindspore/{compression/quant/__init__.py → rewrite/ast_creator_register.py} +20 -11
- mindspore/rewrite/ast_helpers/__init__.py +6 -3
- mindspore/rewrite/ast_helpers/ast_creator.py +115 -0
- mindspore/rewrite/ast_helpers/ast_finder.py +99 -1
- mindspore/rewrite/ast_helpers/ast_modifier.py +17 -4
- mindspore/rewrite/ast_helpers/ast_replacer.py +1 -1
- mindspore/rewrite/ast_transformers/__init__.py +0 -1
- mindspore/rewrite/ast_transformers/flatten_recursive_stmt.py +46 -5
- mindspore/rewrite/ast_transformers/remove_return_out_of_if.py +6 -3
- mindspore/rewrite/common/__init__.py +2 -0
- mindspore/rewrite/common/event.py +1 -1
- mindspore/rewrite/common/observable.py +1 -1
- mindspore/rewrite/common/observer.py +1 -1
- mindspore/rewrite/common/rewrite_elog.py +35 -0
- mindspore/rewrite/namer.py +2 -2
- mindspore/rewrite/namespace.py +14 -4
- mindspore/rewrite/node.py +161 -13
- mindspore/rewrite/parser.py +0 -1
- mindspore/rewrite/parser_register.py +0 -1
- mindspore/rewrite/parsers/arguments_parser.py +3 -2
- mindspore/rewrite/parsers/assign_parser.py +267 -67
- mindspore/rewrite/parsers/attribute_parser.py +56 -0
- mindspore/rewrite/parsers/class_def_parser.py +191 -108
- mindspore/rewrite/parsers/constant_parser.py +101 -0
- mindspore/rewrite/parsers/container_parser.py +88 -0
- mindspore/rewrite/parsers/for_parser.py +28 -15
- mindspore/rewrite/parsers/function_def_parser.py +21 -5
- mindspore/rewrite/parsers/if_parser.py +11 -28
- mindspore/rewrite/parsers/module_parser.py +9 -6
- mindspore/rewrite/parsers/return_parser.py +3 -2
- mindspore/rewrite/sparsify/__init__.py +0 -0
- mindspore/rewrite/sparsify/sparse_transformer.py +448 -0
- mindspore/rewrite/sparsify/sparsify.py +109 -0
- mindspore/rewrite/sparsify/utils.py +173 -0
- mindspore/rewrite/symbol_tree.py +322 -109
- mindspore/rewrite/symbol_tree_builder.py +45 -8
- mindspore/rewrite/symbol_tree_dumper.py +0 -1
- mindspore/rewrite/topological_manager.py +1 -2
- mindspore/run_check/_check_version.py +209 -112
- mindspore/run_check/run_check.py +2 -1
- mindspore/tbbmalloc.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/train/__init__.py +6 -4
- mindspore/train/_utils.py +28 -5
- mindspore/train/amp.py +321 -50
- mindspore/train/callback/__init__.py +3 -1
- mindspore/train/callback/_backup_and_restore.py +120 -0
- mindspore/train/callback/_callback.py +8 -8
- mindspore/train/callback/_checkpoint.py +12 -9
- mindspore/train/callback/_early_stop.py +13 -7
- mindspore/train/callback/_history.py +8 -8
- mindspore/train/callback/_lambda_callback.py +6 -6
- mindspore/train/callback/_landscape.py +36 -38
- mindspore/train/callback/_loss_monitor.py +12 -6
- mindspore/train/callback/_lr_scheduler_callback.py +2 -4
- mindspore/train/callback/_on_request_exit.py +212 -0
- mindspore/train/callback/_reduce_lr_on_plateau.py +13 -7
- mindspore/train/callback/_summary_collector.py +27 -19
- mindspore/train/callback/_time_monitor.py +13 -7
- mindspore/train/checkpoint_pb2.py +68 -8
- mindspore/train/data_sink.py +122 -33
- mindspore/train/dataset_helper.py +28 -87
- mindspore/train/loss_scale_manager.py +4 -7
- mindspore/{nn → train}/metrics/__init__.py +20 -20
- mindspore/{nn → train}/metrics/accuracy.py +12 -10
- mindspore/{nn → train}/metrics/auc.py +4 -4
- mindspore/{nn → train}/metrics/bleu_score.py +4 -4
- mindspore/{nn → train}/metrics/confusion_matrix.py +10 -8
- mindspore/{nn → train}/metrics/cosine_similarity.py +4 -4
- mindspore/{nn → train}/metrics/dice.py +6 -5
- mindspore/{nn → train}/metrics/error.py +7 -5
- mindspore/{nn → train}/metrics/fbeta.py +9 -7
- mindspore/{nn → train}/metrics/hausdorff_distance.py +8 -6
- mindspore/{nn → train}/metrics/loss.py +4 -3
- mindspore/{nn → train}/metrics/mean_surface_distance.py +6 -5
- mindspore/{nn → train}/metrics/metric.py +6 -5
- mindspore/{nn → train}/metrics/occlusion_sensitivity.py +4 -3
- mindspore/{nn → train}/metrics/perplexity.py +5 -4
- mindspore/{nn → train}/metrics/precision.py +5 -4
- mindspore/{nn → train}/metrics/recall.py +5 -4
- mindspore/{nn → train}/metrics/roc.py +7 -6
- mindspore/{nn → train}/metrics/root_mean_square_surface_distance.py +6 -5
- mindspore/{nn → train}/metrics/topk.py +7 -5
- mindspore/train/mind_ir_pb2.py +339 -32
- mindspore/train/model.py +113 -84
- mindspore/train/serialization.py +547 -167
- mindspore/train/summary/_summary_adapter.py +1 -1
- mindspore/train/summary/summary_record.py +43 -12
- mindspore/train/train_thor/convert_utils.py +7 -1
- mindspore/train/train_thor/dataset_helper.py +3 -3
- mindspore/train/train_thor/model_thor.py +0 -4
- mindspore/turbojpeg.dll +0 -0
- mindspore/vcmeta.dll +0 -0
- mindspore/vcruntime140.dll +0 -0
- mindspore/vcruntime140_1.dll +0 -0
- mindspore/version.py +1 -1
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/METADATA +4 -3
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/RECORD +901 -660
- mindspore/compression/common/constant.py +0 -124
- mindspore/compression/export/__init__.py +0 -19
- mindspore/compression/export/quant_export.py +0 -514
- mindspore/compression/quant/qat.py +0 -636
- mindspore/compression/quant/quant_utils.py +0 -462
- mindspore/compression/quant/quantizer.py +0 -68
- mindspore/libatomic-1.dll +0 -0
- mindspore/libgcc_s_seh-1.dll +0 -0
- mindspore/libgfortran-4.dll +0 -0
- mindspore/libgomp-1.dll +0 -0
- mindspore/libjpeg-62.dll +0 -0
- mindspore/libmindspore.dll +0 -0
- mindspore/libmindspore_common.dll +0 -0
- mindspore/libmindspore_core.dll +0 -0
- mindspore/libmindspore_glog.dll +0 -0
- mindspore/libnnacl.dll +0 -0
- mindspore/libopencv_core452.dll +0 -0
- mindspore/libopencv_imgcodecs452.dll +0 -0
- mindspore/libopencv_imgproc452.dll +0 -0
- mindspore/libquadmath-0.dll +0 -0
- mindspore/libsqlite3.dll +0 -0
- mindspore/libssp-0.dll +0 -0
- mindspore/libstdc++-6.dll +0 -0
- mindspore/libtinyxml2.dll +0 -0
- mindspore/libturbojpeg.dll +0 -0
- mindspore/libwinpthread-1.dll +0 -0
- mindspore/nn/layer/quant.py +0 -1868
- mindspore/nn/layer/rnn_utils.py +0 -90
- mindspore/nn/probability/dpn/__init__.py +0 -22
- mindspore/nn/probability/dpn/vae/__init__.py +0 -25
- mindspore/nn/probability/dpn/vae/cvae.py +0 -138
- mindspore/nn/probability/dpn/vae/vae.py +0 -122
- mindspore/nn/probability/infer/__init__.py +0 -22
- mindspore/nn/probability/infer/variational/elbo.py +0 -70
- mindspore/nn/probability/infer/variational/svi.py +0 -84
- mindspore/nn/probability/toolbox/__init__.py +0 -22
- mindspore/nn/probability/toolbox/anomaly_detection.py +0 -99
- mindspore/nn/probability/toolbox/uncertainty_evaluation.py +0 -363
- mindspore/nn/probability/transforms/__init__.py +0 -22
- mindspore/nn/probability/transforms/transform_bnn.py +0 -262
- mindspore/nn/probability/zhusuan/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/bn.py +0 -95
- mindspore/nn/probability/zhusuan/variational/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/variational/elbo.py +0 -46
- mindspore/ops/_op_impl/tbe/bias_add_grad_ds.py +0 -52
- mindspore/ops/_op_impl/tbe/scatter_nd_add_ds.py +0 -43
- mindspore/ops/bprop_mindir/AssignAdd_bprop.mindir +0 -20
- mindspore/ops/bprop_mindir/Identity_bprop.mindir +0 -9
- mindspore/ops/bprop_mindir/LogicalOr_bprop.mindir +0 -20
- mindspore/ops/bprop_mindir/ReLU_bprop.mindir +0 -16
- mindspore/ops/bprop_mindir/UpdateState_bprop.mindir +0 -17
- mindspore/ops/bprop_mindir/stop_gradient_bprop.mindir +0 -12
- mindspore/ops/composite/array_ops.py +0 -210
- mindspore/ops/composite/clip_ops.py +0 -238
- mindspore/ops/composite/random_ops.py +0 -426
- mindspore/ops/composite/vmap_ops.py +0 -38
- mindspore/ops/operations/sponge_ops.py +0 -3531
- mindspore/ops/operations/sponge_update_ops.py +0 -2546
- mindspore/parallel/nn/__init__.py +0 -42
- mindspore/parallel/nn/loss.py +0 -22
- mindspore/parallel/nn/moe.py +0 -21
- mindspore/parallel/nn/op_parallel_config.py +0 -22
- mindspore/parallel/nn/transformer.py +0 -31
- mindspore/run_check/_check_deps_version.py +0 -84
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/WHEEL +0 -0
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/entry_points.txt +0 -0
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/top_level.txt +0 -0
--- a/mindspore/dataset/engine/datasets_text.py
+++ b/mindspore/dataset/engine/datasets_text.py
@@ -30,43 +30,49 @@ from .validators import check_imdb_dataset, check_iwslt2016_dataset, check_iwslt
     check_penn_treebank_dataset, check_ag_news_dataset, check_amazon_review_dataset, check_udpos_dataset, \
     check_wiki_text_dataset, check_conll2000_dataset, check_cluedataset, \
     check_sogou_news_dataset, check_textfiledataset, check_dbpedia_dataset, check_yelp_review_dataset, \
-    check_en_wik9_dataset, check_yahoo_answers_dataset, check_multi30k_dataset, check_squad_dataset
+    check_en_wik9_dataset, check_yahoo_answers_dataset, check_multi30k_dataset, check_squad_dataset, \
+    check_sst2_dataset

 from ..core.validator_helpers import replace_none


 class AGNewsDataset(SourceDataset, TextBaseDataset):
     """
-
+    AG News dataset.

-    The generated dataset has three columns: :py:obj:`[index, title, description]
-
-    The tensor of column :py:obj:`title` is of the string type.
-    The tensor of column :py:obj:`description` is of the string type.
+    The generated dataset has three columns: :py:obj:`[index, title, description]` ,
+    and the data type of three columns is string type.

     Args:
         dataset_dir (str): Path to the root directory that contains the dataset.
-        usage (str, optional): Acceptable usages include 'train', 'test' and 'all'
-        num_samples (int, optional): Number of samples (rows) to read
-        num_parallel_workers (int, optional): Number of
-
-
-
-
-            If shuffle is
-
+        usage (str, optional): Acceptable usages include 'train', 'test' and 'all'. Default: None, all samples.
+        num_samples (int, optional): Number of samples (rows) to read. Default: None, reads the full dataset.
+        num_parallel_workers (int, optional): Number of worker threads to read the data.
+            Default: None, will use global default workers(8), it can be set
+            by `mindspore.dataset.config.set_num_parallel_workers` .
+        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
+            Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
+            If `shuffle` is False, no shuffling will be performed.
+            If `shuffle` is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
+            Set the mode of data shuffling by passing in enumeration variables:

-            - Shuffle.GLOBAL: Shuffle both the files and samples
+            - Shuffle.GLOBAL: Shuffle both the files and samples.

             - Shuffle.FILES: Shuffle files only.

-        num_shards (int, optional): Number of shards that the dataset will be divided into
-            When this argument is specified,
-        shard_id (int, optional): The shard ID within `num_shards`
-            argument can only be specified when `num_shards` is also specified.
+        num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
+            When this argument is specified, `num_samples` reflects the max sample number of per shard.
+        shard_id (int, optional): The shard ID within `num_shards` . This
+            argument can only be specified when `num_shards` is also specified. Default: None.
         cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
-            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
-
+            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
+            Default: None, which means no cache is used.
+
+    Raises:
+        RuntimeError: If `dataset_dir` does not contain data files.
+        RuntimeError: If `num_shards` is specified but `shard_id` is None.
+        RuntimeError: If `shard_id` is specified but `num_shards` is None.
+        ValueError: If `num_parallel_workers` exceeds the max thread numbers.

     Examples:
         >>> ag_news_dataset_dir = "/path/to/ag_news_dataset_file"
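As an aside, the constructor surface documented in the rewritten AGNewsDataset docstring above can be exercised as in the minimal sketch below; the dataset path is a placeholder, and the column names (index, title, description) come straight from the docstring.

    import mindspore.dataset as ds

    # Placeholder path: point this at a directory containing the AG News CSV files.
    ag_news_dir = "/path/to/ag_news_dataset_file"

    # Read the training split with the documented arguments spelled out:
    # global shuffling, and 2-way sharding with this process reading shard 0.
    dataset = ds.AGNewsDataset(dataset_dir=ag_news_dir,
                               usage="train",
                               shuffle=ds.Shuffle.GLOBAL,
                               num_shards=2,
                               shard_id=0)

    # Every row carries the three string columns described in the docstring.
    for row in dataset.create_dict_iterator(output_numpy=True, num_epochs=1):
        print(row["index"], row["title"], row["description"])
        break

Passing shuffle=False instead would disable reshuffling, matching the behaviour described in the docstring above.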
@@ -125,49 +131,48 @@ class AGNewsDataset(SourceDataset, TextBaseDataset):
|
|
|
125
131
|
|
|
126
132
|
class AmazonReviewDataset(SourceDataset, TextBaseDataset):
|
|
127
133
|
"""
|
|
128
|
-
|
|
134
|
+
Amazon Review Polarity and Amazon Review Full datasets.
|
|
129
135
|
|
|
130
|
-
The generated dataset has three columns: :py:obj:`[label, title, content]
|
|
131
|
-
|
|
132
|
-
The tensor of column :py:obj:`title` is of the string type.
|
|
133
|
-
The tensor of column :py:obj:`content` is of the string type.
|
|
136
|
+
The generated dataset has three columns: :py:obj:`[label, title, content]` ,
|
|
137
|
+
and the data type of three columns is string.
|
|
134
138
|
|
|
135
139
|
Args:
|
|
136
140
|
dataset_dir (str): Path to the root directory that contains the Amazon Review Polarity dataset
|
|
137
141
|
or the Amazon Review Full dataset.
|
|
138
|
-
usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all'
|
|
142
|
+
usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all'.
|
|
139
143
|
For Polarity dataset, 'train' will read from 3,600,000 train samples,
|
|
140
144
|
'test' will read from 400,000 test samples,
|
|
141
145
|
'all' will read from all 4,000,000 samples.
|
|
142
146
|
For Full dataset, 'train' will read from 3,000,000 train samples,
|
|
143
147
|
'test' will read from 650,000 test samples,
|
|
144
|
-
'all' will read from all 3,650,000 samples
|
|
145
|
-
num_samples (int, optional): Number of samples (rows) to be read
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
148
|
+
'all' will read from all 3,650,000 samples. Default: None, all samples.
|
|
149
|
+
num_samples (int, optional): Number of samples (rows) to be read. Default: None, reads the full dataset.
|
|
150
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
151
|
+
Default: None, will use global default workers(8). It can be set
|
|
152
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
153
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
154
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
155
|
+
If `shuffle` is False, no shuffling will be performed.
|
|
156
|
+
If `shuffle` is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
157
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
151
158
|
|
|
152
|
-
- Shuffle.GLOBAL: Shuffle both the files and samples
|
|
159
|
+
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
153
160
|
|
|
154
161
|
- Shuffle.FILES: Shuffle files only.
|
|
155
162
|
|
|
156
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
163
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
157
164
|
When this argument is specified, `num_samples` reflects the max sample number of per shard.
|
|
158
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
165
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
159
166
|
argument can only be specified when `num_shards` is also specified.
|
|
160
|
-
num_parallel_workers (int, optional): Number of workers to read the data
|
|
161
|
-
(default=None, number set in the mindspore.dataset.config).
|
|
162
167
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
163
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
164
|
-
|
|
168
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
169
|
+
Default: None, which means no cache is used.
|
|
165
170
|
|
|
166
171
|
Raises:
|
|
167
172
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
168
|
-
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
169
173
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
170
174
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
175
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
171
176
|
|
|
172
177
|
Examples:
|
|
173
178
|
>>> amazon_review_dataset_dir = "/path/to/amazon_review_dataset_dir"
|
|
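The usage/shuffle combination just described might look like this in practice (an illustrative sketch only; the path is a placeholder).

import mindspore.dataset as ds

amazon_review_dir = "/path/to/amazon_review_dataset_dir"  # placeholder path
# Read 1,000 Polarity test samples; Shuffle.FILES reshuffles the file order only,
# while the default Shuffle.GLOBAL also shuffles samples within files.
test_set = ds.AmazonReviewDataset(dataset_dir=amazon_review_dir,
                                  usage="test",
                                  num_samples=1000,
                                  shuffle=ds.Shuffle.FILES)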
@@ -180,7 +185,7 @@ class AmazonReviewDataset(SourceDataset, TextBaseDataset):
|
|
|
180
185
|
The dataset is mainly used for text classification, given the content and title, predict the correct star rating.
|
|
181
186
|
|
|
182
187
|
The Amazon reviews polarity dataset is constructed by taking review score 1 and 2 as negative, 4 and 5 as positive.
|
|
183
|
-
Samples of score 3 is ignored.
|
|
188
|
+
Samples of score 3 are ignored.
|
|
184
189
|
|
|
185
190
|
The Amazon Reviews Polarity and Amazon Reviews Full datasets have the same directory structures.
|
|
186
191
|
You can unzip the dataset files into the following structure and read by MindSpore's API:
|
|
@@ -222,21 +227,22 @@ class AmazonReviewDataset(SourceDataset, TextBaseDataset):
|
|
|
222
227
|
|
|
223
228
|
class CLUEDataset(SourceDataset, TextBaseDataset):
|
|
224
229
|
"""
|
|
225
|
-
|
|
230
|
+
CLUE (Chinese Language Understanding Evaluation) dataset.
|
|
226
231
|
Supported CLUE classification tasks: 'AFQMC', 'TNEWS', 'IFLYTEK', 'CMNLI', 'WSC' and 'CSL'.
|
|
227
232
|
|
|
228
233
|
Args:
|
|
229
234
|
dataset_files (Union[str, list[str]]): String or list of files to be read or glob strings to search for
|
|
230
235
|
a pattern of files. The list will be sorted in a lexicographical order.
|
|
231
236
|
task (str, optional): The kind of task, one of 'AFQMC', 'TNEWS', 'IFLYTEK', 'CMNLI', 'WSC' and 'CSL'.
|
|
232
|
-
|
|
233
|
-
usage (str, optional): Specify the 'train', 'test' or 'eval' part of dataset
|
|
234
|
-
num_samples (int, optional): The number of samples to be included in the dataset
|
|
235
|
-
|
|
236
|
-
num_parallel_workers (int, optional): Number of
|
|
237
|
-
|
|
238
|
-
|
|
239
|
-
|
|
237
|
+
Default: 'AFQMC'.
|
|
238
|
+
usage (str, optional): Specify the 'train', 'test' or 'eval' part of dataset. Default: 'train'.
|
|
239
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
240
|
+
Default: None, will include all samples.
|
|
241
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
242
|
+
Default: None, will use global default workers(8). It can be set
|
|
243
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
244
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
245
|
+
Default: Shuffle.GLOBAL. Bool type and Shuffle enum are both supported to pass in.
|
|
240
246
|
If shuffle is False, no shuffling will be performed.
|
|
241
247
|
If shuffle is True, performs global shuffle.
|
|
242
248
|
There are three levels of shuffling, desired shuffle enum defined by mindspore.dataset.Shuffle.
|
|
@@ -245,13 +251,13 @@ class CLUEDataset(SourceDataset, TextBaseDataset):
|
|
|
245
251
|
|
|
246
252
|
- Shuffle.FILES: Shuffle files only.
|
|
247
253
|
|
|
248
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
254
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
249
255
|
When this argument is specified, `num_samples` reflects the maximum sample number of per shard.
|
|
250
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
256
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
251
257
|
argument can only be specified when `num_shards` is also specified.
|
|
252
258
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
253
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
254
|
-
|
|
259
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
260
|
+
Default: None, which means no cache is used.
|
|
255
261
|
|
|
256
262
|
The generated dataset with different task setting has different output columns:
|
|
257
263
|
|
|
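A short sketch of the task/usage selection described above (illustrative; the file list is a placeholder).

import mindspore.dataset as ds

clue_files = ["/path/to/clue_dataset_file"]  # placeholder file list or glob
# The output columns depend on the chosen task; 'AFQMC' with usage='train'
# loads the AFQMC training split.
afqmc_train = ds.CLUEDataset(dataset_files=clue_files,
                             task="AFQMC",
                             usage="train",
                             shuffle=ds.Shuffle.GLOBAL)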
@@ -400,9 +406,9 @@ class CLUEDataset(SourceDataset, TextBaseDataset):
|
|
|
400
406
|
ValueError: task is not in 'AFQMC', 'TNEWS', 'IFLYTEK', 'CMNLI', 'WSC' or 'CSL'.
|
|
401
407
|
ValueError: usage is not in 'train', 'test' or 'eval'.
|
|
402
408
|
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
409
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
403
410
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
404
411
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
405
|
-
ValueError: If `shard_id` is invalid (< 0 or >= `num_shards`).
|
|
406
412
|
|
|
407
413
|
Examples:
|
|
408
414
|
>>> clue_dataset_dir = ["/path/to/clue_dataset_file"] # contains 1 or multiple clue files
|
|
@@ -457,10 +463,10 @@ class CLUEDataset(SourceDataset, TextBaseDataset):
|
|
|
457
463
|
|
|
458
464
|
class CoNLL2000Dataset(SourceDataset, TextBaseDataset):
|
|
459
465
|
"""
|
|
460
|
-
|
|
466
|
+
CoNLL-2000 (Conference on Computational Natural Language Learning) chunking dataset.
|
|
461
467
|
|
|
462
|
-
The generated dataset has three columns: :py:obj:`[word, pos_tag, chunk_tag]
|
|
463
|
-
The tensors of column :py:obj:`word
|
|
468
|
+
The generated dataset has three columns: :py:obj:`[word, pos_tag, chunk_tag]` .
|
|
469
|
+
The tensors of column :py:obj:`word` , column :py:obj:`pos_tag` ,
|
|
464
470
|
and column :py:obj:`chunk_tag` are of the string type.
|
|
465
471
|
|
|
466
472
|
Args:
|
|
@@ -471,7 +477,7 @@ class CoNLL2000Dataset(SourceDataset, TextBaseDataset):
|
|
|
471
477
|
'all' will read from all 1,0948 samples. Default: None, read all samples.
|
|
472
478
|
num_samples (int, optional): Number of samples (rows) to be read. Default: None, read the full dataset.
|
|
473
479
|
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
474
|
-
Default: mindspore.dataset.Shuffle.GLOBAL.
|
|
480
|
+
Default: `mindspore.dataset.Shuffle.GLOBAL` .
|
|
475
481
|
If shuffle is False, no shuffling will be performed.
|
|
476
482
|
If shuffle is True, performs global shuffle.
|
|
477
483
|
There are three levels of shuffling, desired shuffle enum defined by mindspore.dataset.Shuffle.
|
|
@@ -481,12 +487,13 @@ class CoNLL2000Dataset(SourceDataset, TextBaseDataset):
|
|
|
481
487
|
|
|
482
488
|
num_shards (int, optional): Number of shards that the dataset will be divided into.
|
|
483
489
|
When this argument is specified, `num_samples` reflects the max sample number of per shard. Default: None.
|
|
484
|
-
shard_id (int, optional): The shard ID within `num_shards
|
|
490
|
+
shard_id (int, optional): The shard ID within `num_shards` . This
|
|
485
491
|
argument can only be specified when `num_shards` is also specified. Default: None.
|
|
486
|
-
num_parallel_workers (int, optional): Number of
|
|
487
|
-
Default: None,
|
|
492
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
493
|
+
Default: None, will use global default workers(8). It can be set
|
|
494
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
488
495
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
489
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
496
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
490
497
|
Default: None, which means no cache is used.
|
|
491
498
|
|
|
492
499
|
Raises:
|
|
@@ -547,47 +554,46 @@ class CoNLL2000Dataset(SourceDataset, TextBaseDataset):
|
|
|
547
554
|
|
|
548
555
|
class DBpediaDataset(SourceDataset, TextBaseDataset):
|
|
549
556
|
"""
|
|
550
|
-
|
|
557
|
+
DBpedia dataset.
|
|
551
558
|
|
|
552
|
-
The generated dataset has three columns :py:obj:`[class, title, content]
|
|
553
|
-
|
|
554
|
-
The tensor of column :py:obj:`title` is of the string type.
|
|
555
|
-
The tensor of column :py:obj:`content` is of the string type.
|
|
559
|
+
The generated dataset has three columns :py:obj:`[class, title, content]` ,
|
|
560
|
+
and the data type of all three columns is string.
|
|
556
561
|
|
|
557
562
|
Args:
|
|
558
563
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
559
564
|
usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all'.
|
|
560
565
|
'train' will read from 560,000 train samples,
|
|
561
566
|
'test' will read from 70,000 test samples,
|
|
562
|
-
'all' will read from all 630,000 samples
|
|
563
|
-
num_samples (int, optional): The number of samples to be included in the dataset
|
|
564
|
-
|
|
565
|
-
num_parallel_workers (int, optional): Number of
|
|
566
|
-
|
|
567
|
-
|
|
568
|
-
|
|
567
|
+
'all' will read from all 630,000 samples. Default: None, all samples.
|
|
568
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
569
|
+
Default: None, will include all text.
|
|
570
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
571
|
+
Default: None, will use global default workers(8). It can be set
|
|
572
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
573
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
574
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
569
575
|
If shuffle is False, no shuffling will be performed.
|
|
570
|
-
If shuffle is True,
|
|
571
|
-
|
|
576
|
+
If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
577
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
572
578
|
|
|
573
|
-
- Shuffle.GLOBAL: Shuffle both the files and samples
|
|
579
|
+
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
574
580
|
|
|
575
581
|
- Shuffle.FILES: Shuffle files only.
|
|
576
582
|
|
|
577
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
583
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
578
584
|
When this argument is specified, `num_samples` reflects the maximum sample number of per shard.
|
|
579
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
585
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
580
586
|
argument can only be specified when `num_shards` is also specified.
|
|
581
587
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
582
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
583
|
-
|
|
588
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
589
|
+
Default: None, which means no cache is used.
|
|
584
590
|
|
|
585
591
|
Raises:
|
|
586
592
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
587
|
-
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
588
593
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
589
594
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
590
|
-
ValueError: If `
|
|
595
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
596
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
591
597
|
|
|
592
598
|
Examples:
|
|
593
599
|
>>> dbpedia_dataset_dir = "/path/to/dbpedia_dataset_directory"
|
|
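To make the num_samples/column description above concrete, a hedged sketch (placeholder path; the iterator call is the one commonly used with mindspore.dataset loaders).

import mindspore.dataset as ds

dbpedia_dir = "/path/to/dbpedia_dataset_directory"  # placeholder path
# Cap the read at 500 rows and walk over the three string columns.
dbpedia = ds.DBpediaDataset(dataset_dir=dbpedia_dir, usage="train", num_samples=500)
for row in dbpedia.create_dict_iterator(output_numpy=True, num_epochs=1):
    label, title = row["class"], row["title"]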
@@ -646,33 +652,40 @@ class DBpediaDataset(SourceDataset, TextBaseDataset):
|
|
|
646
652
|
|
|
647
653
|
class EnWik9Dataset(SourceDataset, TextBaseDataset):
|
|
648
654
|
"""
|
|
649
|
-
|
|
655
|
+
EnWik9 dataset.
|
|
650
656
|
|
|
651
657
|
The generated dataset has one column :py:obj:`[text]` with type string.
|
|
652
658
|
|
|
653
659
|
Args:
|
|
654
660
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
655
|
-
num_samples (int, optional): The number of samples to be included in the dataset
|
|
656
|
-
|
|
657
|
-
num_parallel_workers (int, optional): Number of
|
|
658
|
-
|
|
659
|
-
|
|
660
|
-
|
|
661
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
662
|
+
Default: None, will include all samples.
|
|
663
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
664
|
+
Default: None, will use global default workers(8). It can be set
|
|
665
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
666
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
667
|
+
Bool type and Shuffle enum are both supported to pass in. Default: True.
|
|
661
668
|
If shuffle is False, no shuffling will be performed.
|
|
662
|
-
If shuffle is True,
|
|
663
|
-
|
|
669
|
+
If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
670
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
664
671
|
|
|
665
|
-
- Shuffle.GLOBAL: Shuffle both the files and samples
|
|
672
|
+
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
666
673
|
|
|
667
674
|
- Shuffle.FILES: Shuffle files only.
|
|
668
675
|
|
|
669
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
676
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
670
677
|
When this argument is specified, `num_samples` reflects the maximum sample number of per shard.
|
|
671
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
678
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
672
679
|
argument can only be specified when `num_shards` is also specified.
|
|
673
680
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
674
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
675
|
-
|
|
681
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
682
|
+
Default: None, which means no cache is used.
|
|
683
|
+
|
|
684
|
+
Raises:
|
|
685
|
+
RuntimeError: If `dataset_dir` does not contain data files.
|
|
686
|
+
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
687
|
+
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
688
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
676
689
|
|
|
677
690
|
Examples:
|
|
678
691
|
>>> en_wik9_dataset_dir = "/path/to/en_wik9_dataset"
|
|
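A minimal sketch of the EnWik9 parameters above (the path is a placeholder; note the documented shuffle default here is True rather than Shuffle.GLOBAL).

import mindspore.dataset as ds

en_wik9_dir = "/path/to/en_wik9_dataset"  # placeholder path
# Take the first 2,000 rows in file order; the single output column is 'text'.
en_wik9 = ds.EnWik9Dataset(dataset_dir=en_wik9_dir, num_samples=2000, shuffle=False)
print(en_wik9.get_dataset_size())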
@@ -723,45 +736,46 @@ class EnWik9Dataset(SourceDataset, TextBaseDataset):
|
|
|
723
736
|
|
|
724
737
|
class IMDBDataset(MappableDataset, TextBaseDataset):
|
|
725
738
|
"""
|
|
726
|
-
|
|
739
|
+
IMDb (Internet Movie Database) dataset.
|
|
727
740
|
|
|
728
|
-
The generated dataset has two columns: :py:obj:`[text, label]
|
|
741
|
+
The generated dataset has two columns: :py:obj:`[text, label]` .
|
|
729
742
|
The tensor of column :py:obj:`text` is of the string type.
|
|
730
|
-
The
|
|
743
|
+
The tensor of column :py:obj:`label` is a scalar of the uint32 type.
|
|
731
744
|
|
|
732
745
|
Args:
|
|
733
746
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
734
|
-
usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all'
|
|
735
|
-
|
|
736
|
-
num_samples (int, optional): The number of images to be included in the dataset
|
|
737
|
-
|
|
738
|
-
num_parallel_workers (int, optional): Number of
|
|
739
|
-
|
|
740
|
-
|
|
741
|
-
|
|
742
|
-
|
|
743
|
-
|
|
747
|
+
usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all'.
|
|
748
|
+
Default: None, will read all samples.
|
|
749
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
750
|
+
Default: None, will include all samples.
|
|
751
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
752
|
+
Default: None, will use global default workers(8). It can be set
|
|
753
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
754
|
+
shuffle (bool, optional): Whether or not to perform shuffle on the dataset.
|
|
755
|
+
Default: None, expected order behavior shown in the table below.
|
|
756
|
+
sampler (Sampler, optional): Object used to choose samples from the dataset.
|
|
757
|
+
Default: None, expected order behavior shown in the table below.
|
|
744
758
|
num_shards (int, optional): Number of shards that the dataset will be divided
|
|
745
|
-
into
|
|
759
|
+
into. Default: None. When this argument is specified, `num_samples` reflects
|
|
746
760
|
the maximum sample number of per shard.
|
|
747
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
761
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
748
762
|
argument can only be specified when `num_shards` is also specified.
|
|
749
763
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
750
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
751
|
-
|
|
764
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
765
|
+
Default: None, which means no cache is used.
|
|
752
766
|
|
|
753
767
|
Raises:
|
|
754
768
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
755
|
-
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
756
769
|
RuntimeError: If `sampler` and `shuffle` are specified at the same time.
|
|
757
770
|
RuntimeError: If `sampler` and `num_shards`/`shard_id` are specified at the same time.
|
|
758
771
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
759
772
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
760
|
-
ValueError: If `
|
|
773
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
774
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
761
775
|
|
|
762
776
|
Note:
|
|
763
777
|
- The shape of the test column.
|
|
764
|
-
- This dataset can take in a `sampler
|
|
778
|
+
- This dataset can take in a `sampler` . `sampler` and `shuffle` are mutually exclusive.
|
|
765
779
|
The table below shows what input arguments are allowed and their expected behavior.
|
|
766
780
|
|
|
767
781
|
.. list-table:: Expected Order Behavior of Using `sampler` and `shuffle`
|
|
@@ -865,49 +879,51 @@ class IMDBDataset(MappableDataset, TextBaseDataset):
|
|
|
865
879
|
|
|
866
880
|
class IWSLT2016Dataset(SourceDataset, TextBaseDataset):
|
|
867
881
|
"""
|
|
868
|
-
|
|
882
|
+
IWSLT2016 (International Workshop on Spoken Language Translation) dataset.
|
|
869
883
|
|
|
870
|
-
The generated dataset has two columns: :py:obj:`[text, translation]
|
|
884
|
+
The generated dataset has two columns: :py:obj:`[text, translation]` .
|
|
871
885
|
The tensor of column :py:obj: `text` is of the string type.
|
|
872
|
-
The
|
|
886
|
+
The tensor of column :py:obj:`translation` is of the string type.
|
|
873
887
|
|
|
874
888
|
Args:
|
|
875
889
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
876
|
-
usage (str, optional): Acceptable usages include 'train', 'valid', 'test' and 'all'
|
|
890
|
+
usage (str, optional): Acceptable usages include 'train', 'valid', 'test' and 'all'. Default: None, all samples.
|
|
877
891
|
language_pair (sequence, optional): Sequence containing source and target language, supported values are
|
|
878
892
|
('en', 'fr'), ('en', 'de'), ('en', 'cs'), ('en', 'ar'), ('fr', 'en'), ('de', 'en'), ('cs', 'en'),
|
|
879
|
-
('ar', 'en') (
|
|
893
|
+
('ar', 'en'). Default: ('de', 'en').
|
|
880
894
|
valid_set (str, optional): A string to identify validation set, when usage is valid or all, the validation set
|
|
881
|
-
of valid_set type will be read, supported values are 'dev2010', 'tst2010', 'tst2011', 'tst2012', 'tst2013'
|
|
882
|
-
and 'tst2014'
|
|
883
|
-
test_set (str, optional): A string to identify test set, when usage is test or all, the test set of test_set
|
|
884
|
-
type will be read, supported values are 'dev2010', 'tst2010', 'tst2011', 'tst2012', 'tst2013' and 'tst2014'
|
|
885
|
-
|
|
886
|
-
num_samples (int, optional): Number of samples (rows) to read
|
|
887
|
-
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch
|
|
888
|
-
|
|
889
|
-
If shuffle is False, no shuffling will be performed.
|
|
890
|
-
If shuffle is True,
|
|
891
|
-
|
|
895
|
+
of `valid_set` type will be read. Supported values are 'dev2010', 'tst2010', 'tst2011', 'tst2012', 'tst2013'
|
|
896
|
+
and 'tst2014'. Default: 'tst2013'.
|
|
897
|
+
test_set (str, optional): A string to identify test set, when usage is test or all, the test set of `test_set`
|
|
898
|
+
type will be read. Supported values are 'dev2010', 'tst2010', 'tst2011', 'tst2012', 'tst2013' and 'tst2014'.
|
|
899
|
+
Default: 'tst2014'.
|
|
900
|
+
num_samples (int, optional): Number of samples (rows) to read. Default: None, reads the full dataset.
|
|
901
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
902
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
903
|
+
If `shuffle` is False, no shuffling will be performed.
|
|
904
|
+
If `shuffle` is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
905
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
892
906
|
|
|
893
|
-
- Shuffle.GLOBAL: Shuffle both the files and samples
|
|
907
|
+
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
894
908
|
|
|
895
909
|
- Shuffle.FILES: Shuffle files only.
|
|
896
|
-
|
|
910
|
+
|
|
911
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
897
912
|
When this argument is specified, `num_samples` reflects the max sample number of per shard.
|
|
898
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
913
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
899
914
|
argument can only be specified when `num_shards` is also specified.
|
|
900
|
-
num_parallel_workers (int, optional): Number of
|
|
901
|
-
|
|
915
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
916
|
+
Default: None, will use global default workers(8). It can be set
|
|
917
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
902
918
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
903
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
904
|
-
|
|
919
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
920
|
+
Default: None, which means no cache is used.
|
|
905
921
|
|
|
906
922
|
Raises:
|
|
907
923
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
908
|
-
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
909
924
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
910
925
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
926
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
911
927
|
|
|
912
928
|
Examples:
|
|
913
929
|
>>> iwslt2016_dataset_dir = "/path/to/iwslt2016_dataset_dir"
|
|
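The language_pair/valid_set/test_set arguments combine roughly as follows (a sketch; the path is a placeholder and the split names shown are the documented defaults).

import mindspore.dataset as ds

iwslt2016_dir = "/path/to/iwslt2016_dataset_dir"  # placeholder path
# German-to-English pair; 'tst2013' and 'tst2014' mirror the documented
# defaults for the validation and test splits.
iwslt_valid = ds.IWSLT2016Dataset(dataset_dir=iwslt2016_dir,
                                  usage="valid",
                                  language_pair=("de", "en"),
                                  valid_set="tst2013",
                                  test_set="tst2014")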
@@ -918,8 +934,8 @@ class IWSLT2016Dataset(SourceDataset, TextBaseDataset):
|
|
|
918
934
|
|
|
919
935
|
IWSLT is an international oral translation conference, a major annual scientific conference dedicated to all aspects
|
|
920
936
|
of oral translation. The MT task of the IWSLT evaluation activity constitutes a dataset, which can be publicly
|
|
921
|
-
obtained through the WIT3 website wit3.fbk.eu. The IWSLT2016 dataset includes translations from
|
|
922
|
-
Czech, French, and German, and translations from Arabic, Czech, French, and German to English.
|
|
937
|
+
obtained through the WIT3 website `wit3 <https://wit3.fbk.eu>`_ . The IWSLT2016 dataset includes translations from
|
|
938
|
+
English to Arabic, Czech, French, and German, and translations from Arabic, Czech, French, and German to English.
|
|
923
939
|
|
|
924
940
|
You can unzip the original IWSLT2016 dataset files into this directory structure and read by MindSpore's API. After
|
|
925
941
|
decompression, you also need to decompress the dataset to be read in the specified folder. For example, if you want
|
|
@@ -992,44 +1008,45 @@ class IWSLT2016Dataset(SourceDataset, TextBaseDataset):
|
|
|
992
1008
|
|
|
993
1009
|
class IWSLT2017Dataset(SourceDataset, TextBaseDataset):
|
|
994
1010
|
"""
|
|
995
|
-
|
|
1011
|
+
IWSLT2017 (International Workshop on Spoken Language Translation) dataset.
|
|
996
1012
|
|
|
997
|
-
The generated dataset has two columns: :py:obj:`[text, translation]
|
|
998
|
-
The tensor of column :py:obj:`text`
|
|
999
|
-
The tensor of column :py:obj:`translation` is of the string type.
|
|
1013
|
+
The generated dataset has two columns: :py:obj:`[text, translation]` .
|
|
1014
|
+
The tensors of columns :py:obj:`text` and :py:obj:`translation` are of the string type.
|
|
1000
1015
|
|
|
1001
1016
|
Args:
|
|
1002
1017
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
1003
|
-
usage (str, optional): Acceptable usages include 'train', 'valid', 'test' and 'all'
|
|
1018
|
+
usage (str, optional): Acceptable usages include 'train', 'valid', 'test' and 'all'. Default: None, all samples.
|
|
1004
1019
|
language_pair (sequence, optional): List containing src and tgt language, supported values are ('en', 'nl'),
|
|
1005
1020
|
('en', 'de'), ('en', 'it'), ('en', 'ro'), ('nl', 'en'), ('nl', 'de'), ('nl', 'it'), ('nl', 'ro'),
|
|
1006
1021
|
('de', 'en'), ('de', 'nl'), ('de', 'it'), ('de', 'ro'), ('it', 'en'), ('it', 'nl'), ('it', 'de'),
|
|
1007
|
-
('it', 'ro'), ('ro', 'en'), ('ro', 'nl'), ('ro', 'de'), ('ro', 'it') (
|
|
1008
|
-
num_samples (int, optional): Number of samples (rows) to read
|
|
1009
|
-
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch
|
|
1010
|
-
|
|
1022
|
+
('it', 'ro'), ('ro', 'en'), ('ro', 'nl'), ('ro', 'de'), ('ro', 'it'). Default: ('de', 'en').
|
|
1023
|
+
num_samples (int, optional): Number of samples (rows) to read. Default: None, reads the full dataset.
|
|
1024
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
1025
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
1011
1026
|
If shuffle is False, no shuffling will be performed.
|
|
1012
|
-
If shuffle is True,
|
|
1013
|
-
|
|
1027
|
+
If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
1028
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
1014
1029
|
|
|
1015
|
-
- Shuffle.GLOBAL: Shuffle both the files and samples
|
|
1030
|
+
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
1016
1031
|
|
|
1017
1032
|
- Shuffle.FILES: Shuffle files only.
|
|
1018
|
-
|
|
1033
|
+
|
|
1034
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
1019
1035
|
When this argument is specified, `num_samples` reflects the max sample number of per shard.
|
|
1020
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
1036
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
1021
1037
|
argument can only be specified when `num_shards` is also specified.
|
|
1022
|
-
num_parallel_workers (int, optional): Number of
|
|
1023
|
-
|
|
1038
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1039
|
+
Default: None, will use global default workers(8). It can be set
|
|
1040
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1024
1041
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1025
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
1026
|
-
|
|
1042
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1043
|
+
Default: None, which means no cache is used.
|
|
1027
1044
|
|
|
1028
1045
|
Raises:
|
|
1029
1046
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
1030
|
-
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1031
1047
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1032
1048
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1049
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1033
1050
|
|
|
1034
1051
|
Examples:
|
|
1035
1052
|
>>> iwslt2017_dataset_dir = "/path/to/iwslt2017_dataset_dir"
|
|
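For comparison with IWSLT2016 above, an IWSLT2017 sketch (illustrative only; the path is a placeholder).

import mindspore.dataset as ds

iwslt2017_dir = "/path/to/iwslt2017_dataset_dir"  # placeholder path
# Italian-to-English pair with the documented default global shuffle.
iwslt_train = ds.IWSLT2017Dataset(dataset_dir=iwslt2017_dir,
                                  usage="train",
                                  language_pair=("it", "en"),
                                  shuffle=ds.Shuffle.GLOBAL)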
@@ -1039,8 +1056,8 @@ class IWSLT2017Dataset(SourceDataset, TextBaseDataset):
|
|
|
1039
1056
|
|
|
1040
1057
|
IWSLT is an international oral translation conference, a major annual scientific conference dedicated to all aspects
|
|
1041
1058
|
of oral translation. The MT task of the IWSLT evaluation activity constitutes a dataset, which can be publicly
|
|
1042
|
-
obtained through the WIT3 website wit3.fbk.eu. The IWSLT2017 dataset involves German, English,
|
|
1043
|
-
Romanian. The dataset includes translations in any two different languages.
|
|
1059
|
+
obtained through the WIT3 website `wit3 <https://wit3.fbk.eu>`_ . The IWSLT2017 dataset involves German, English,
|
|
1060
|
+
Italian, Dutch, and Romanian. The dataset includes translations in any two different languages.
|
|
1044
1061
|
|
|
1045
1062
|
You can unzip the original IWSLT2017 dataset files into this directory structure and read by MindSpore's API. You
|
|
1046
1063
|
need to decompress the dataset package in texts/DeEnItNlRo/DeEnItNlRo directory to get the DeEnItNlRo-DeEnItNlRo
|
|
@@ -1089,48 +1106,49 @@ class IWSLT2017Dataset(SourceDataset, TextBaseDataset):
|
|
|
1089
1106
|
|
|
1090
1107
|
class Multi30kDataset(SourceDataset, TextBaseDataset):
|
|
1091
1108
|
"""
|
|
1092
|
-
|
|
1109
|
+
Multi30k dataset.
|
|
1093
1110
|
|
|
1094
|
-
The generated dataset has two columns :py:obj:`[text, translation]
|
|
1095
|
-
The tensor of column :py:obj
|
|
1096
|
-
The tensor of column :py:obj
|
|
1111
|
+
The generated dataset has two columns :py:obj:`[text, translation]` .
|
|
1112
|
+
The tensor of column :py:obj:`text` is of the string type.
|
|
1113
|
+
The tensor of column :py:obj:`translation` is of the string type.
|
|
1097
1114
|
|
|
1098
|
-
|
|
1115
|
+
Args:
|
|
1099
1116
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
1100
|
-
usage (str, optional): Acceptable usages include 'train', 'test, 'valid' or 'all'
|
|
1101
|
-
|
|
1102
|
-
|
|
1103
|
-
|
|
1104
|
-
|
|
1105
|
-
|
|
1106
|
-
|
|
1107
|
-
|
|
1108
|
-
|
|
1109
|
-
|
|
1110
|
-
If
|
|
1111
|
-
|
|
1117
|
+
usage (str, optional): Acceptable usages include 'train', 'test', 'valid' or 'all'.
|
|
1118
|
+
Default: None, will read all samples.
|
|
1119
|
+
language_pair (Sequence[str, str], optional): Acceptable values of `language_pair` are ['en', 'de'] and ['de', 'en'].
|
|
1120
|
+
Default: None, means ['en', 'de'].
|
|
1121
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
1122
|
+
Default: None, will read all samples.
|
|
1123
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1124
|
+
Default: None, will use global default workers(8). It can be set
|
|
1125
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1126
|
+
shuffle (Union[bool, Shuffle], optional): Whether to shuffle the dataset. Default: None, means Shuffle.GLOBAL.
|
|
1127
|
+
If False is provided, no shuffling will be performed.
|
|
1128
|
+
If True is provided, it is the same as setting to mindspore.dataset.Shuffle.GLOBAL.
|
|
1129
|
+
If Shuffle is provided, the effect is as follows:
|
|
1112
1130
|
|
|
1113
1131
|
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
1114
|
-
|
|
1115
1132
|
- Shuffle.FILES: Shuffle files only.
|
|
1116
1133
|
|
|
1117
1134
|
num_shards (int, optional): Number of shards that the dataset will be divided
|
|
1118
|
-
into
|
|
1135
|
+
into. Default: None. When this argument is specified, `num_samples` reflects
|
|
1119
1136
|
the max sample number of per shard.
|
|
1120
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
1137
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
1121
1138
|
argument can only be specified when `num_shards` is also specified.
|
|
1122
1139
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1123
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
1124
|
-
|
|
1140
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1141
|
+
Default: None, which means no cache is used.
|
|
1125
1142
|
|
|
1126
1143
|
Raises:
|
|
1127
1144
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
1128
|
-
|
|
1129
|
-
|
|
1130
|
-
|
|
1145
|
+
ValueError: If `usage` is not 'train', 'test', 'valid' or 'all'.
|
|
1146
|
+
TypeError: If `language_pair` is not of type Sequence[str, str].
|
|
1147
|
+
RuntimeError: If `num_samples` is less than 0.
|
|
1148
|
+
RuntimeError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1131
1149
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1132
1150
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1133
|
-
|
|
1151
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
1134
1152
|
|
|
1135
1153
|
Examples:
|
|
1136
1154
|
>>> multi30k_dataset_dir = "/path/to/multi30k_dataset_directory"
|
|
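A hedged sketch of the language_pair behaviour documented above (placeholder path; ['de', 'en'] simply reverses the default direction).

import mindspore.dataset as ds

multi30k_dir = "/path/to/multi30k_dataset_directory"  # placeholder path
# language_pair defaults to ['en', 'de']; reverse it for German-to-English text.
multi30k = ds.Multi30kDataset(dataset_dir=multi30k_dir,
                              usage="train",
                              language_pair=["de", "en"])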
@@ -1138,11 +1156,11 @@ class Multi30kDataset(SourceDataset, TextBaseDataset):
|
|
|
1138
1156
|
|
|
1139
1157
|
About Multi30k dataset:
|
|
1140
1158
|
|
|
1141
|
-
Multi30K is a dataset
|
|
1142
|
-
|
|
1143
|
-
|
|
1144
|
-
|
|
1145
|
-
|
|
1159
|
+
Multi30K is a multilingual dataset that features approximately 31,000 standardized images
|
|
1160
|
+
described in multiple languages. The images are sourced from Flickr and each image comes
|
|
1161
|
+
with sentence descriptions in both English and German, as well as descriptions in other
|
|
1162
|
+
languages. Multi30k is used primarily for training and testing in tasks such as image
|
|
1163
|
+
captioning, machine translation, and visual question answering.
|
|
1146
1164
|
|
|
1147
1165
|
You can unzip the dataset files into the following directory structure and read by MindSpore's API.
|
|
1148
1166
|
|
|
@@ -1190,9 +1208,9 @@ class Multi30kDataset(SourceDataset, TextBaseDataset):
|
|
|
1190
1208
|
|
|
1191
1209
|
class PennTreebankDataset(SourceDataset, TextBaseDataset):
|
|
1192
1210
|
"""
|
|
1193
|
-
|
|
1211
|
+
PennTreebank dataset.
|
|
1194
1212
|
|
|
1195
|
-
The generated dataset has one column :py:obj:`[text]
|
|
1213
|
+
The generated dataset has one column :py:obj:`[text]` .
|
|
1196
1214
|
The tensor of column :py:obj:`text` is of the string type.
|
|
1197
1215
|
|
|
1198
1216
|
Args:
|
|
@@ -1201,27 +1219,34 @@ class PennTreebankDataset(SourceDataset, TextBaseDataset):
|
|
|
1201
1219
|
'train' will read from 42,068 train samples of string type,
|
|
1202
1220
|
'test' will read from 3,370 test samples of string type,
|
|
1203
1221
|
'valid' will read from 3,761 test samples of string type,
|
|
1204
|
-
'all' will read from all 49,199 samples of string type
|
|
1205
|
-
num_samples (int, optional): Number of samples (rows) to read
|
|
1206
|
-
num_parallel_workers (int, optional): Number of
|
|
1207
|
-
|
|
1208
|
-
|
|
1209
|
-
|
|
1222
|
+
'all' will read from all 49,199 samples of string type. Default: None, all samples.
|
|
1223
|
+
num_samples (int, optional): Number of samples (rows) to read. Default: None, reads the full dataset.
|
|
1224
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1225
|
+
Default: None, will use global default workers(8). It can be set
|
|
1226
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1227
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
1228
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
1210
1229
|
If shuffle is False, no shuffling will be performed.
|
|
1211
|
-
If shuffle is True,
|
|
1212
|
-
|
|
1230
|
+
If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
1231
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
1213
1232
|
|
|
1214
|
-
- Shuffle.GLOBAL: Shuffle both the files and samples
|
|
1233
|
+
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
1215
1234
|
|
|
1216
1235
|
- Shuffle.FILES: Shuffle files only.
|
|
1217
1236
|
|
|
1218
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
1219
|
-
When this argument is specified,
|
|
1220
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
1237
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
1238
|
+
When this argument is specified, `num_samples` reflects the maximum number of samples per shard.
|
|
1239
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
1221
1240
|
argument can only be specified when `num_shards` is also specified.
|
|
1222
1241
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1223
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
1224
|
-
|
|
1242
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1243
|
+
Default: None, which means no cache is used.
|
|
1244
|
+
|
|
1245
|
+
Raises:
|
|
1246
|
+
RuntimeError: If `dataset_dir` does not contain data files.
|
|
1247
|
+
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1248
|
+
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1249
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1225
1250
|
|
|
1226
1251
|
Examples:
|
|
1227
1252
|
>>> penn_treebank_dataset_dir = "/path/to/penn_treebank_dataset_directory"
|
|
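The sharding rule above (num_samples caps each shard, not the whole dataset) can be sketched like this; the path is a placeholder and two single-process readers stand in for two distributed workers.

import mindspore.dataset as ds

ptb_dir = "/path/to/penn_treebank_dataset_directory"  # placeholder path
# Each shard keeps at most num_samples rows of its own partition.
shard0 = ds.PennTreebankDataset(dataset_dir=ptb_dir, usage="train",
                                num_shards=2, shard_id=0, num_samples=1000)
shard1 = ds.PennTreebankDataset(dataset_dir=ptb_dir, usage="train",
                                num_shards=2, shard_id=1, num_samples=1000)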
@@ -1281,43 +1306,42 @@ class PennTreebankDataset(SourceDataset, TextBaseDataset):
|
|
|
1281
1306
|
|
|
1282
1307
|
class SogouNewsDataset(SourceDataset, TextBaseDataset):
|
|
1283
1308
|
r"""
|
|
1284
|
-
|
|
1309
|
+
Sogou News dataset.
|
|
1285
1310
|
|
|
1286
|
-
The generated dataset has three columns: :py:obj:`[index, title, content]
|
|
1287
|
-
|
|
1288
|
-
The tensor of column :py:obj:`title` is of the string type.
|
|
1289
|
-
The tensor of column :py:obj:`content` is of the string type.
|
|
1311
|
+
The generated dataset has three columns: :py:obj:`[index, title, content]` ,
|
|
1312
|
+
and the data type of all three columns is string.
|
|
1290
1313
|
|
|
1291
1314
|
Args:
|
|
1292
1315
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
1293
1316
|
usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all' .
|
|
1294
1317
|
'train' will read from 450,000 train samples, 'test' will read from 60,000 test samples,
|
|
1295
|
-
'all' will read from all 510,000 samples
|
|
1296
|
-
num_samples (int, optional): Number of samples (rows) to read
|
|
1297
|
-
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch
|
|
1298
|
-
|
|
1318
|
+
'all' will read from all 510,000 samples. Default: None, all samples.
|
|
1319
|
+
num_samples (int, optional): Number of samples (rows) to read. Default: None, read all samples.
|
|
1320
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
1321
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
1299
1322
|
If shuffle is False, no shuffling will be performed.
|
|
1300
|
-
If shuffle is True,
|
|
1301
|
-
|
|
1323
|
+
If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
|
|
1324
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
1302
1325
|
|
|
1303
1326
|
- Shuffle.GLOBAL: Shuffle both the files and samples, same as setting shuffle to True.
|
|
1304
1327
|
|
|
1305
1328
|
- Shuffle.FILES: Shuffle files only.
|
|
1306
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
1329
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
1307
1330
|
When this argument is specified, `num_samples` reflects the max sample number of per shard.
|
|
1308
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
1331
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
1309
1332
|
argument can only be specified when `num_shards` is also specified.
|
|
1310
|
-
num_parallel_workers (int, optional): Number of
|
|
1311
|
-
|
|
1333
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1334
|
+
Default: None, will use global default workers(8). It can be set
|
|
1335
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1312
1336
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1313
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
1314
|
-
|
|
1337
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1338
|
+
Default: None, which means no cache is used.
|
|
1315
1339
|
|
|
1316
1340
|
Raises:
|
|
1317
1341
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
1318
|
-
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1319
1342
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1320
1343
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1344
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1321
1345
|
|
|
1322
1346
|
Examples:
|
|
1323
1347
|
>>> sogou_news_dataset_dir = "/path/to/sogou_news_dataset_dir"
|
|
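The global worker default mentioned above can be raised once through the config module, as in this sketch (placeholder path).

import mindspore.dataset as ds

# Loaders that leave num_parallel_workers=None pick up this global value.
ds.config.set_num_parallel_workers(4)
sogou_dir = "/path/to/sogou_news_dataset_dir"  # placeholder path
sogou = ds.SogouNewsDataset(dataset_dir=sogou_dir, usage="all")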
@@ -1369,46 +1393,46 @@ class SogouNewsDataset(SourceDataset, TextBaseDataset):
|
|
|
1369
1393
|
|
|
1370
1394
|
class SQuADDataset(SourceDataset, TextBaseDataset):
|
|
1371
1395
|
"""
|
|
1372
|
-
|
|
1396
|
+
SQuAD 1.1 and SQuAD 2.0 datasets.
|
|
1373
1397
|
|
|
1374
1398
|
The generated dataset with different versions and usages has the same output columns:
|
|
1375
|
-
|
|
1399
|
+
:py:obj:`[context, question, text, answer_start]` .
|
|
1376
1400
|
The tensor of column :py:obj:`context` is of the string type.
|
|
1377
1401
|
The tensor of column :py:obj:`question` is of the string type.
|
|
1378
1402
|
The tensor of column :py:obj:`text` is the answer in the context of the string type.
|
|
1379
1403
|
The tensor of column :py:obj:`answer_start` is the start index of answer in context,
|
|
1380
|
-
|
|
1404
|
+
which is of the uint32 type.
|
|
1381
1405
|
|
|
1382
1406
|
Args:
|
|
1383
1407
|
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
1384
|
-
usage (str, optional): Specify the
|
|
1385
|
-
num_samples (int, optional): The number of samples to be included in the dataset
|
|
1386
|
-
|
|
1387
|
-
num_parallel_workers (int, optional): Number of
|
|
1388
|
-
|
|
1389
|
-
|
|
1390
|
-
|
|
1391
|
-
If
|
|
1392
|
-
If
|
|
1393
|
-
|
|
1408
|
+
usage (str, optional): Specify the 'train', 'dev' or 'all' part of dataset. Default: None, all samples.
|
|
1409
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
1410
|
+
Default: None, will include all samples.
|
|
1411
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1412
|
+
Default: None, will use global default workers(8). It can be set
|
|
1413
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1414
|
+
shuffle (Union[bool, Shuffle], optional): Whether to shuffle the dataset. Default: Shuffle.GLOBAL.
|
|
1415
|
+
If False is provided, no shuffling will be performed.
|
|
1416
|
+
If True is provided, it is the same as setting to mindspore.dataset.Shuffle.GLOBAL.
|
|
1417
|
+
If Shuffle is provided, the effect is as follows:
|
|
1394
1418
|
|
|
1395
1419
|
- Shuffle.GLOBAL: Shuffle both the files and samples.
|
|
1396
|
-
|
|
1397
1420
|
- Shuffle.FILES: Shuffle files only.
|
|
1398
1421
|
|
|
1399
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
1422
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
1400
1423
|
When this argument is specified, `num_samples` reflects the maximum sample number of per shard.
|
|
1401
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
1424
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
1402
1425
|
argument can only be specified when `num_shards` is also specified.
|
|
1403
1426
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1404
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
1405
|
-
|
|
1427
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1428
|
+
Default: None, which means no cache is used.
|
|
1406
1429
|
|
|
1407
1430
|
Raises:
|
|
1408
1431
|
RuntimeError: If `dataset_dir` does not contain data files.
|
|
1409
1432
|
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1410
1433
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1411
1434
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1435
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
1412
1436
|
|
|
1413
1437
|
Examples:
|
|
1414
1438
|
>>> squad_dataset_dir = "/path/to/squad_dataset_file"
|
|
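To show the four output columns listed above, a hedged sketch (placeholder path; the iterator call is the one commonly used with mindspore.dataset loaders).

import mindspore.dataset as ds

squad_dir = "/path/to/squad_dataset_file"  # placeholder path
squad_dev = ds.SQuADDataset(dataset_dir=squad_dir, usage="dev", shuffle=False)
for row in squad_dev.create_dict_iterator(output_numpy=True, num_epochs=1):
    # Four columns: context, question, text (answer span), answer_start (uint32).
    context, question = row["context"], row["question"]
    break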
@@ -1416,7 +1440,7 @@ class SQuADDataset(SourceDataset, TextBaseDataset):
|
|
|
1416
1440
|
|
|
1417
1441
|
About SQuAD dataset:
|
|
1418
1442
|
|
|
1419
|
-
Stanford Question Answering Dataset
|
|
1443
|
+
SQuAD (Stanford Question Answering Dataset) is a reading comprehension dataset, consisting of questions posed by
|
|
1420
1444
|
crowdworkers on a set of Wikipedia articles, where the answer to every question is a segment of text, or span,
|
|
1421
1445
|
from the corresponding reading passage, or the question might be unanswerable.
|
|
1422
1446
|
|
|
@@ -1430,6 +1454,7 @@ class SQuADDataset(SourceDataset, TextBaseDataset):
|
|
|
1430
1454
|
For SQuAD 1.1:
|
|
1431
1455
|
|
|
1432
1456
|
.. code-block::
|
|
1457
|
+
|
|
1433
1458
|
.
|
|
1434
1459
|
└── SQuAD1
|
|
1435
1460
|
├── train-v1.1.json
|
|
@@ -1438,6 +1463,7 @@ class SQuADDataset(SourceDataset, TextBaseDataset):
|
|
|
1438
1463
|
For SQuAD 2.0:
|
|
1439
1464
|
|
|
1440
1465
|
.. code-block::
|
|
1466
|
+
|
|
1441
1467
|
.
|
|
1442
1468
|
└── SQuAD2
|
|
1443
1469
|
├── train-v2.0.json
|
|
@@ -1479,6 +1505,106 @@ class SQuADDataset(SourceDataset, TextBaseDataset):
|
|
|
1479
1505
|
self.num_shards, self.shard_id)
|
|
1480
1506
|
|
|
1481
1507
|
|
|
1508
|
+
class SST2Dataset(SourceDataset, TextBaseDataset):
|
|
1509
|
+
"""
|
|
1510
|
+
SST2 (Stanford Sentiment Treebank v2) dataset.
|
|
1511
|
+
|
|
1512
|
+
The generated dataset's train.tsv and dev.tsv have two columns :py:obj:`[sentence, label]` .
|
|
1513
|
+
The generated dataset's test.tsv has one column :py:obj:`[sentence]` .
|
|
1514
|
+
The tensors of columns :py:obj:`sentence` and :py:obj:`label` are of the string type.
|
|
1515
|
+
|
|
1516
|
+
Args:
|
|
1517
|
+
dataset_dir (str): Path to the root directory that contains the dataset.
|
|
1518
|
+
usage (str, optional): Usage of this dataset, can be `train`, `test` or `dev`. `train` will read
|
|
1519
|
+
from 67,349 train samples, `test` will read from 1,821 test samples, `dev` will read from
|
|
1520
|
+
all 872 samples. Default: None, will read train samples.
|
|
1521
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
1522
|
+
Default: None, will include all text.
|
|
1523
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1524
|
+
Default: None, will use global default workers(8). It can be set
|
|
1525
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1526
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
1527
|
+
Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
|
|
1528
|
+
If shuffle is False, no shuffling will be performed;
|
|
1529
|
+
If shuffle is True, the behavior is the same as setting shuffle to Shuffle.GLOBAL.
|
|
1530
|
+
Set the mode of data shuffling by passing in enumeration variables:
|
|
1531
|
+
|
|
1532
|
+
- Shuffle.GLOBAL: Shuffle the samples.
|
|
1533
|
+
|
|
1534
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
1535
|
+
When this argument is specified, `num_samples` reflects the maximum number of samples per shard.
|
|
1536
|
+
shard_id (int, optional): The shard ID within num_shards. This argument can only be specified when
|
|
1537
|
+
num_shards is also specified. Default: None.
|
|
1538
|
+
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1539
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1540
|
+
Default: None, which means no cache is used.
|
|
1541
|
+
|
|
1542
|
+
Raises:
|
|
1543
|
+
RuntimeError: If `dataset_dir` does not contain data files.
|
|
1544
|
+
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1545
|
+
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1546
|
+
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1547
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
1548
|
+
|
|
1549
|
+
Examples:
|
|
1550
|
+
>>> sst2_dataset_dir = "/path/to/sst2_dataset_directory"
|
|
1551
|
+
>>>
|
|
1552
|
+
>>> # 1) Read 3 samples from SST2 dataset
|
|
1553
|
+
>>> dataset = ds.SST2Dataset(dataset_dir=sst2_dataset_dir, num_samples=3)
|
|
1554
|
+
>>>
|
|
1555
|
+
>>> # 2) Read train samples from SST2 dataset
|
|
1556
|
+
>>> dataset = ds.SST2Dataset(dataset_dir=sst2_dataset_dir, usage="train")
|
|
1557
|
+
|
|
1558
|
+
About SST2 dataset:
|
|
1559
|
+
The Stanford Sentiment Treebank is a corpus with fully labeled parse trees that allows for a complete
|
|
1560
|
+
analysis of the compositional effects of sentiment in language. The corpus is based on the dataset introduced
|
|
1561
|
+
by Pang and Lee (2005) and consists of 11,855 single sentences extracted from movie reviews. It was parsed
|
|
1562
|
+
with the Stanford parser and includes a total of 215,154 unique phrases from those parse trees, each
|
|
1563
|
+
annotated by 3 human judges.
|
|
1564
|
+
|
|
1565
|
+
Here is the original SST2 dataset structure.
|
|
1566
|
+
You can unzip the dataset files into this directory structure and read by MindSpore's API.
|
|
1567
|
+
|
|
1568
|
+
.. code-block::
|
|
1569
|
+
|
|
1570
|
+
.
|
|
1571
|
+
└── sst2_dataset_dir
|
|
1572
|
+
├── train.tsv
|
|
1573
|
+
├── test.tsv
|
|
1574
|
+
├── dev.tsv
|
|
1575
|
+
└── original
|
|
1576
|
+
|
|
1577
|
+
Citation:
|
|
1578
|
+
|
|
1579
|
+
.. code-block::
|
|
1580
|
+
|
|
1581
|
+
@inproceedings{socher-etal-2013-recursive,
|
|
1582
|
+
title = {Recursive Deep Models for Semantic Compositionality Over a Sentiment Treebank},
|
|
1583
|
+
author = {Socher, Richard and Perelygin, Alex and Wu, Jean and Chuang, Jason and Manning,
|
|
1584
|
+
Christopher D. and Ng, Andrew and Potts, Christopher},
|
|
1585
|
+
booktitle = {Proceedings of the 2013 Conference on Empirical Methods in Natural Language Processing},
|
|
1586
|
+
month = oct,
|
|
1587
|
+
year = {2013},
|
|
1588
|
+
address = {Seattle, Washington, USA},
|
|
1589
|
+
publisher = {Association for Computational Linguistics},
|
|
1590
|
+
url = {https://www.aclweb.org/anthology/D13-1170},
|
|
1591
|
+
pages = {1631--1642},
|
|
1592
|
+
}
|
|
1593
|
+
"""
|
|
1594
|
+
|
|
1595
|
+
@check_sst2_dataset
|
|
1596
|
+
def __init__(self, dataset_dir, usage=None, num_samples=None, num_parallel_workers=None, shuffle=Shuffle.GLOBAL,
|
|
1597
|
+
num_shards=None, shard_id=None, cache=None):
|
|
1598
|
+
super().__init__(num_parallel_workers=num_parallel_workers, num_samples=num_samples, shuffle=shuffle,
|
|
1599
|
+
num_shards=num_shards, shard_id=shard_id, cache=cache)
|
|
1600
|
+
self.dataset_dir = dataset_dir
|
|
1601
|
+
self.usage = replace_none(usage, "train")
|
|
1602
|
+
|
|
1603
|
+
def parse(self, children=None):
|
|
1604
|
+
return cde.SST2Node(self.dataset_dir, self.usage, self.num_samples, self.shuffle_flag,
|
|
1605
|
+
self.num_shards, self.shard_id)
|
|
1606
|
+
|
|
1607
|
+
|
|
1482
1608
|
class TextFileDataset(SourceDataset, TextBaseDataset):
|
|
1483
1609
|
"""
|
|
1484
1610
|
A source dataset that reads and parses datasets stored on disk in text format.
|
|
@@ -1487,12 +1613,13 @@ class TextFileDataset(SourceDataset, TextBaseDataset):
|
|
|
1487
1613
|
Args:
|
|
1488
1614
|
dataset_files (Union[str, list[str]]): String or list of files to be read or glob strings to search for a
|
|
1489
1615
|
pattern of files. The list will be sorted in a lexicographical order.
|
|
1490
|
-
num_samples (int, optional): The number of samples to be included in the dataset
|
|
1491
|
-
|
|
1492
|
-
num_parallel_workers (int, optional): Number of
|
|
1493
|
-
|
|
1494
|
-
|
|
1495
|
-
|
|
1616
|
+
num_samples (int, optional): The number of samples to be included in the dataset.
|
|
1617
|
+
Default: None, will include all images.
|
|
1618
|
+
num_parallel_workers (int, optional): Number of worker threads to read the data.
|
|
1619
|
+
Default: None, will use global default workers(8), it can be set
|
|
1620
|
+
by `mindspore.dataset.config.set_num_parallel_workers` .
|
|
1621
|
+
shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
|
|
1622
|
+
Default: `Shuffle.GLOBAL` . Bool type and Shuffle enum are both supported to pass in.
|
|
1496
1623
|
If shuffle is False, no shuffling will be performed.
|
|
1497
1624
|
If shuffle is True, performs global shuffle.
|
|
1498
1625
|
There are three levels of shuffling, desired shuffle enum defined by mindspore.dataset.Shuffle.
|
|
@@ -1501,20 +1628,20 @@ class TextFileDataset(SourceDataset, TextBaseDataset):
|
|
|
1501
1628
|
|
|
1502
1629
|
- Shuffle.FILES: Shuffle files only.
|
|
1503
1630
|
|
|
1504
|
-
num_shards (int, optional): Number of shards that the dataset will be divided into
|
|
1631
|
+
num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
|
|
1505
1632
|
When this argument is specified, `num_samples` reflects the maximum sample number of per shard.
|
|
1506
|
-
shard_id (int, optional): The shard ID within `num_shards`
|
|
1633
|
+
shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
|
|
1507
1634
|
argument can only be specified when `num_shards` is also specified.
|
|
1508
1635
|
cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
|
|
1509
|
-
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
|
|
1510
|
-
|
|
1636
|
+
`Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
|
|
1637
|
+
Default: None, which means no cache is used.
|
|
1511
1638
|
|
|
1512
1639
|
Raises:
|
|
1513
1640
|
ValueError: If dataset_files are not valid or do not exist.
|
|
1514
1641
|
ValueError: If `num_parallel_workers` exceeds the max thread numbers.
|
|
1515
1642
|
RuntimeError: If `num_shards` is specified but `shard_id` is None.
|
|
1516
1643
|
RuntimeError: If `shard_id` is specified but `num_shards` is None.
|
|
1517
|
-
ValueError: If `shard_id` is
|
|
1644
|
+
ValueError: If `shard_id` is not in range of [0, `num_shards` ).
|
|
1518
1645
|
|
|
1519
1646
|
Examples:
|
|
1520
1647
|
>>> text_file_dataset_dir = ["/path/to/text_file_dataset_file"] # contains 1 or multiple text files
|
|
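The reworked TextFileDataset docstring above now documents `num_shards`, `shard_id` and the `Shuffle` enum defaults. The sketch below shows a sharded read under those documented parameters; the file paths, the `ds` alias and the `get_dataset_size` call are illustrative assumptions rather than code from the package.

# Sketch: shard a set of text files across 4 readers and consume shard 0.
import mindspore.dataset as ds

files = ["/path/to/part0.txt", "/path/to/part1.txt"]  # placeholder file list (assumption)

dataset = ds.TextFileDataset(dataset_files=files,
                             num_shards=4, shard_id=0,  # documented sharding arguments
                             shuffle=ds.Shuffle.FILES)  # shuffle file order only

print(dataset.get_dataset_size())  # rows visible to this shard (generic dataset API, assumed)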
@@ -1536,48 +1663,66 @@ class TextFileDataset(SourceDataset, TextBaseDataset):

class UDPOSDataset(SourceDataset, TextBaseDataset):
    """
-
+    UDPOS(Universal Dependencies dataset for Part of Speech) dataset.

-    The generated dataset has three columns: :py:obj:`[word, universal, stanford]
-
-    The tensor of column :py:obj:`universal` is of the string type.
-    The tensor of column :py:obj:`stanford` is of the string type.
+    The generated dataset has three columns: :py:obj:`[word, universal, stanford]` ,
+    and the data type of three columns is string.

    Args:
        dataset_dir (str): Path to the root directory that contains the dataset.
        usage (str, optional): Usage of this dataset, can be 'train', 'test', 'valid' or 'all'. 'train' will read from
            12,543 train samples, 'test' will read from 2,077 test samples, 'valid' will read from 2,002 test samples,
-            'all' will read from all 16,622 samples
-        num_samples (int, optional): Number of samples (rows) to read
-        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch
-
-            If shuffle is False, no shuffling will be performed
-            If shuffle is True,
-
+            'all' will read from all 16,622 samples. Default: None, all samples.
+        num_samples (int, optional): Number of samples (rows) to read. Default: None, reads the full dataset.
+        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
+            Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
+            If shuffle is False, no shuffling will be performed.
+            If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
+            Set the mode of data shuffling by passing in enumeration variables:

            - Shuffle.GLOBAL: Shuffle both the files and samples.

            - Shuffle.FILES: Shuffle files only.

-        num_shards (int, optional): Number of shards that the dataset will be divided into
+        num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
            When this argument is specified, `num_samples` reflects the max sample number of per shard.
-        shard_id (int, optional): The shard ID within `num_shards`
+        shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
            argument can only be specified when `num_shards` is also specified.
-        num_parallel_workers (int, optional): Number of
-
+        num_parallel_workers (int, optional): Number of worker threads to read the data.
+            Default: None, will use global default workers(8), it can be set
+            by `mindspore.dataset.config.set_num_parallel_workers` .
        cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
-            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
-
+            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
+            Default: None, which means no cache is used.

    Raises:
        RuntimeError: If `dataset_dir` does not contain data files.
-        ValueError: If `num_parallel_workers` exceeds the max thread numbers.
        RuntimeError: If `num_shards` is specified but `shard_id` is None.
        RuntimeError: If `shard_id` is specified but `num_shards` is None.
+        ValueError: If `num_parallel_workers` exceeds the max thread numbers.

    Examples:
        >>> udpos_dataset_dir = "/path/to/udpos_dataset_dir"
        >>> dataset = ds.UDPOSDataset(dataset_dir=udpos_dataset_dir, usage='all')
+
+    About UDPOS dataset:
+        Text corpus dataset that clarifies syntactic or semantic sentence structure.
+        The corpus comprises 254,830 words and 16,622 sentences, taken from various web media including
+        weblogs, newsgroups, emails and reviews.
+
+    Citation:
+
+    .. code-block::
+
+        @inproceedings{silveira14gold,
+            year = {2014},
+            author = {Natalia Silveira and Timothy Dozat and Marie-Catherine de Marneffe and Samuel Bowman
+                and Miriam Connor and John Bauer and Christopher D. Manning},
+            title = {A Gold Standard Dependency Corpus for {E}nglish},
+            booktitle = {Proceedings of the Ninth International Conference on Language
+                Resources and Evaluation (LREC-2014)}
+        }
    """

    @check_udpos_dataset
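The new `num_parallel_workers` wording above points to `mindspore.dataset.config.set_num_parallel_workers` for the global default. Below is a short sketch combining that setting with the documented UDPOSDataset arguments; the path is a placeholder and `get_col_names` is the generic dataset API, assumed here.

# Sketch: read the UDPOS validation split with an explicit global worker count.
import mindspore.dataset as ds

ds.config.set_num_parallel_workers(4)  # override the documented default of 8 worker threads

udpos_dataset_dir = "/path/to/udpos_dataset_dir"  # placeholder path (assumption)
dataset = ds.UDPOSDataset(dataset_dir=udpos_dataset_dir, usage="valid", shuffle=False)

# Per the docstring above, the columns are [word, universal, stanford], all strings.
print(dataset.get_col_names())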
@@ -1595,38 +1740,43 @@ class UDPOSDataset(SourceDataset, TextBaseDataset):

class WikiTextDataset(SourceDataset, TextBaseDataset):
    """
-
+    WikiText2 and WikiText103 datasets.

-    The generated dataset has one column :py:obj:`[text]
-
+    The generated dataset has one column :py:obj:`[text]` , and
+    the tensor of column `text` is of the string type.

    Args:
        dataset_dir (str): Path to the root directory that contains the dataset.
-        usage (str, optional): Acceptable usages include 'train', 'test', 'valid' and 'all'
-        num_samples (int, optional): Number of samples (rows) to read
-        num_parallel_workers (int, optional): Number of
-
-
-
-
-            If shuffle is
-
+        usage (str, optional): Acceptable usages include 'train', 'test', 'valid' and 'all'. Default: None, all samples.
+        num_samples (int, optional): Number of samples (rows) to read. Default: None, reads the full dataset.
+        num_parallel_workers (int, optional): Number of worker threads to read the data.
+            Default: None, will use global default workers(8), it can be set
+            by `mindspore.dataset.config.set_num_parallel_workers` .
+        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
+            Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
+            If shuffle is False, no shuffling will be performed.
+            If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
+            Set the mode of data shuffling by passing in enumeration variables:

            - Shuffle.GLOBAL: Shuffle both the files and samples.

            - Shuffle.FILES: Shuffle files only.

-        num_shards (int, optional): Number of shards that the dataset will be divided into
-            When this argument is specified,
-        shard_id (int, optional): The shard ID within `num_shards`
+        num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
+            When this argument is specified, `num_samples` reflects the max sample number of per shard.
+        shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
            argument can only be specified when `num_shards` is also specified.
        cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
-            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
-
+            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
+            Default: None, which means no cache is used.

-
-
-
+    Raises:
+        RuntimeError: If `dataset_dir` does not contain data files or invalid.
+        RuntimeError: If `num_shards` is specified but `shard_id` is None.
+        RuntimeError: If `shard_id` is specified but `num_shards` is None.
+        ValueError: If `shard_id` is not in range of [0, `num_shards` ).
+        ValueError: If `num_samples` is invalid (< 0).
+        ValueError: If `num_parallel_workers` exceeds the max thread numbers.

    About WikiTextDataset dataset:

@@ -1657,6 +1807,10 @@ class WikiTextDataset(SourceDataset, TextBaseDataset):
        journal={arXiv preprint arXiv:1609.07843},
        year={2016}
        }
+
+    Examples:
+        >>> wiki_text_dataset_dir = "/path/to/wiki_text_dataset_directory"
+        >>> dataset = ds.WikiTextDataset(dataset_dir=wiki_text_dataset_dir, usage='all')
    """

    @check_wiki_text_dataset
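WikiTextDataset gains a documented `num_samples` default and an Examples block in this release. Below is a hedged sketch that reads a capped slice of the 'valid' split; the placeholder path and the dict-style iteration over the single `text` column are assumptions, not taken from the package.

# Sketch: take 100 unshuffled rows from the WikiText 'valid' split.
import mindspore.dataset as ds

wiki_text_dataset_dir = "/path/to/wiki_text_dataset_directory"  # placeholder path (assumption)

dataset = ds.WikiTextDataset(dataset_dir=wiki_text_dataset_dir, usage="valid",
                             num_samples=100, shuffle=False)

for row in dataset.create_dict_iterator(output_numpy=True):
    line = row["text"]  # single string column, per the docstring above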
@@ -1674,47 +1828,44 @@ class WikiTextDataset(SourceDataset, TextBaseDataset):

class YahooAnswersDataset(SourceDataset, TextBaseDataset):
    """
-
+    YahooAnswers dataset.

-    The generated dataset has
-    The tensor of column :py:obj:`class` is of the string type.
-    The tensor of column :py:obj:`title` is of the string type.
-    The tensor of column :py:obj:`content` is of the string type.
-    The tensor of column :py:obj:`answer` is of the string type.
+    The generated dataset has four columns :py:obj:`[class, title, content, answer]` , whose data type is string.

    Args:
        dataset_dir (str): Path to the root directory that contains the dataset.
        usage (str, optional): Usage of this dataset, can be 'train', 'test' or 'all'. 'train' will read
            from 1,400,000 train samples, 'test' will read from 60,000 test samples, 'all' will read from
-            all 1,460,000 samples
-        num_samples (int, optional): The number of samples to be included in the dataset
-
-        num_parallel_workers (int, optional): Number of
-
-
-
-
-            If shuffle is
-
+            all 1,460,000 samples. Default: None, all samples.
+        num_samples (int, optional): The number of samples to be included in the dataset.
+            Default: None, will include all text.
+        num_parallel_workers (int, optional): Number of worker threads to read the data.
+            Default: None, will use global default workers(8), it can be set
+            by `mindspore.dataset.config.set_num_parallel_workers` .
+        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
+            Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
+            If shuffle is False, no shuffling will be performed.
+            If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
+            Set the mode of data shuffling by passing in enumeration variables:

            - Shuffle.GLOBAL: Shuffle both the files and samples.

            - Shuffle.FILES: Shuffle files only.

-        num_shards (int, optional): Number of shards that the dataset will be divided into
+        num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
            When this argument is specified, `num_samples` reflects the maximum sample number of per shard.
-        shard_id (int, optional): The shard ID within `num_shards`
+        shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
            argument can only be specified when `num_shards` is also specified.
        cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
-            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
-
+            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
+            Default: None, which means no cache is used.

    Raises:
        RuntimeError: If `dataset_dir` does not contain data files.
-        ValueError: If `num_parallel_workers` exceeds the max thread numbers.
        RuntimeError: If `num_shards` is specified but `shard_id` is None.
        RuntimeError: If `shard_id` is specified but `num_shards` is None.
-        ValueError: If `shard_id` is
+        ValueError: If `shard_id` is not in range of [0, `num_shards` ).
+        ValueError: If `num_parallel_workers` exceeds the max thread numbers.

    Examples:
        >>> yahoo_answers_dataset_dir = "/path/to/yahoo_answers_dataset_directory"
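Per the rewritten docstring above, YahooAnswersDataset yields four string columns `[class, title, content, answer]`. A small sketch pulling a few rows from the test split under that description; the path is a placeholder and the dict-iterator access is an assumption.

# Sketch: inspect a handful of YahooAnswers test samples.
import mindspore.dataset as ds

yahoo_answers_dataset_dir = "/path/to/yahoo_answers_dataset_directory"  # placeholder (assumption)

dataset = ds.YahooAnswersDataset(dataset_dir=yahoo_answers_dataset_dir,
                                 usage="test", num_samples=5, shuffle=False)

for row in dataset.create_dict_iterator(output_numpy=True):
    # Row keys follow the documented columns: class, title, content, answer.
    print(row["class"], row["title"])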
@@ -1772,11 +1923,9 @@ class YahooAnswersDataset(SourceDataset, TextBaseDataset):

class YelpReviewDataset(SourceDataset, TextBaseDataset):
    """
-
+    Yelp Review Polarity and Yelp Review Full datasets.

-    The generated dataset has two columns: :py:obj:`[label, text]
-    The tensor of column :py:obj:`label` is of the string type.
-    The tensor of column :py:obj:`text` is of the string type.
+    The generated dataset has two columns: :py:obj:`[label, text]` , and the data type of two columns is string.

    Args:
        dataset_dir (str): Path to the root directory that contains the dataset.
@@ -1784,32 +1933,33 @@ class YelpReviewDataset(SourceDataset, TextBaseDataset):
            For Polarity, 'train' will read from 560,000 train samples, 'test' will read from 38,000 test samples,
            'all' will read from all 598,000 samples.
            For Full, 'train' will read from 650,000 train samples, 'test' will read from 50,000 test samples,
-            'all' will read from all 700,000 samples
-        num_samples (int, optional): Number of samples (rows) to read
-        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch
-
-            If shuffle is False, no shuffling will be performed
-            If shuffle is True,
-
+            'all' will read from all 700,000 samples. Default: None, all samples.
+        num_samples (int, optional): Number of samples (rows) to read. Default: None, reads all samples.
+        shuffle (Union[bool, Shuffle], optional): Perform reshuffling of the data every epoch.
+            Bool type and Shuffle enum are both supported to pass in. Default: `Shuffle.GLOBAL` .
+            If shuffle is False, no shuffling will be performed.
+            If shuffle is True, it is equivalent to setting `shuffle` to mindspore.dataset.Shuffle.GLOBAL.
+            Set the mode of data shuffling by passing in enumeration variables:

            - Shuffle.GLOBAL: Shuffle both the files and samples.

            - Shuffle.FILES: Shuffle files only.
-        num_shards (int, optional): Number of shards that the dataset will be divided into
+        num_shards (int, optional): Number of shards that the dataset will be divided into. Default: None.
            When this argument is specified, `num_samples` reflects the max sample number of per shard.
-        shard_id (int, optional): The shard ID within `num_shards`
+        shard_id (int, optional): The shard ID within `num_shards` . Default: None. This
            argument can only be specified when `num_shards` is also specified.
-        num_parallel_workers (int, optional): Number of
-
+        num_parallel_workers (int, optional): Number of worker threads to read the data.
+            Default: None, will use global default workers(8), it can be set
+            by `mindspore.dataset.config.set_num_parallel_workers` .
        cache (DatasetCache, optional): Use tensor caching service to speed up dataset processing. More details:
-            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/
-
+            `Single-Node Data Cache <https://www.mindspore.cn/tutorials/experts/en/r2.0/dataset/cache.html>`_ .
+            Default: None, which means no cache is used.

    Raises:
        RuntimeError: If `dataset_dir` does not contain data files.
-        ValueError: If `num_parallel_workers` exceeds the max thread numbers.
        RuntimeError: If `num_shards` is specified but `shard_id` is None.
        RuntimeError: If `shard_id` is specified but `num_shards` is None.
+        ValueError: If `num_parallel_workers` exceeds the max thread numbers.

    Examples:
        >>> yelp_review_dataset_dir = "/path/to/yelp_review_dataset_dir"