mindspore 1.10.0__cp39-cp39-win_amd64.whl → 2.0.0rc1__cp39-cp39-win_amd64.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Potentially problematic release.
This version of mindspore might be problematic. Click here for more details.
- mindspore/.commit_id +1 -1
- mindspore/ConcurrencyCheck.dll +0 -0
- mindspore/CppBuildInsights.dll +0 -0
- mindspore/CppCoreCheck.dll +0 -0
- mindspore/EnumIndex.dll +0 -0
- mindspore/EspXEngine.dll +0 -0
- mindspore/HResultCheck.dll +0 -0
- mindspore/KernelTraceControl.dll +0 -0
- mindspore/LocalESPC.dll +0 -0
- mindspore/Microsoft.Diagnostics.Tracing.EventSource.dll +0 -0
- mindspore/Microsoft.VisualStudio.RemoteControl.dll +0 -0
- mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
- mindspore/Microsoft.VisualStudio.Utilities.Internal.dll +0 -0
- mindspore/Newtonsoft.Json.dll +0 -0
- mindspore/System.Runtime.CompilerServices.Unsafe.dll +0 -0
- mindspore/VariantClear.dll +0 -0
- mindspore/__init__.py +9 -4
- mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
- mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
- mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
- mindspore/_check_jit_forbidden_api.py +102 -0
- mindspore/_checkparam.py +1066 -1001
- mindspore/_extends/builtin_operations.py +32 -4
- mindspore/_extends/graph_kernel/model/graph_split.py +66 -222
- mindspore/_extends/parallel_compile/akg_compiler/akg_process.py +12 -9
- mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +119 -26
- mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +50 -50
- mindspore/_extends/parallel_compile/akg_compiler/util.py +9 -6
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_adapter.py +4 -25
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +9 -4
- mindspore/_extends/parallel_compile/tbe_compiler/tbe_job_manager.py +1 -27
- mindspore/_extends/parse/__init__.py +5 -3
- mindspore/_extends/parse/namespace.py +17 -2
- mindspore/_extends/parse/parser.py +193 -34
- mindspore/_extends/parse/resources.py +7 -8
- mindspore/_extends/parse/standard_method.py +1780 -435
- mindspore/_extends/parse/trope.py +3 -1
- mindspore/amp.py +53 -58
- mindspore/atlprov.dll +0 -0
- mindspore/boost/adasum.py +3 -2
- mindspore/boost/boost.py +2 -2
- mindspore/boost/boost_cell_wrapper.py +46 -26
- mindspore/boost/dim_reduce.py +6 -5
- mindspore/boost/grad_accumulation.py +2 -1
- mindspore/boost/group_loss_scale_manager.py +1 -1
- mindspore/c1.dll +0 -0
- mindspore/c1xx.dll +0 -0
- mindspore/c2.dll +0 -0
- mindspore/cfgpersist.dll +0 -0
- mindspore/clang_rt.asan_dbg_dynamic-x86_64.dll +0 -0
- mindspore/clang_rt.asan_dynamic-x86_64.dll +0 -0
- mindspore/common/__init__.py +11 -10
- mindspore/common/_decorator.py +2 -0
- mindspore/common/_register_for_adapter.py +55 -0
- mindspore/common/_stub_tensor.py +201 -0
- mindspore/common/_utils.py +57 -0
- mindspore/common/api.py +582 -297
- mindspore/common/dtype.py +66 -18
- mindspore/common/dump.py +2 -2
- mindspore/common/initializer.py +38 -1
- mindspore/common/jit_config.py +25 -13
- mindspore/common/mutable.py +53 -24
- mindspore/common/parameter.py +60 -37
- mindspore/common/seed.py +8 -24
- mindspore/common/sparse_tensor.py +927 -0
- mindspore/common/tensor.py +1627 -3900
- mindspore/communication/__init__.py +10 -5
- mindspore/communication/_comm_helper.py +78 -214
- mindspore/communication/_hccl_management.py +2 -1
- mindspore/communication/management.py +136 -47
- mindspore/config/op_info.config +501 -1008
- mindspore/context.py +291 -56
- mindspore/d3dcompiler_47.dll +0 -0
- mindspore/dataset/__init__.py +12 -8
- mindspore/dataset/audio/__init__.py +9 -9
- mindspore/dataset/audio/transforms.py +1090 -228
- mindspore/dataset/audio/utils.py +87 -39
- mindspore/dataset/audio/validators.py +223 -1
- mindspore/dataset/callback/ds_callback.py +17 -15
- mindspore/dataset/core/config.py +246 -17
- mindspore/dataset/core/py_util_helpers.py +4 -3
- mindspore/dataset/core/validator_helpers.py +10 -10
- mindspore/{parallel/nn/layers.py → dataset/debug/__init__.py} +7 -8
- mindspore/dataset/debug/debug_hook.py +65 -0
- mindspore/dataset/debug/pre_defined_hook.py +67 -0
- mindspore/dataset/engine/__init__.py +7 -3
- mindspore/dataset/engine/cache_client.py +9 -9
- mindspore/dataset/engine/datasets.py +648 -477
- mindspore/dataset/engine/datasets_audio.py +165 -167
- mindspore/dataset/engine/datasets_standard_format.py +93 -67
- mindspore/dataset/engine/datasets_text.py +492 -342
- mindspore/dataset/engine/datasets_user_defined.py +85 -50
- mindspore/dataset/engine/datasets_vision.py +1224 -699
- mindspore/dataset/engine/graphdata.py +134 -69
- mindspore/dataset/engine/iterators.py +50 -9
- mindspore/dataset/engine/offload.py +52 -31
- mindspore/dataset/engine/samplers.py +27 -24
- mindspore/dataset/engine/serializer_deserializer.py +14 -15
- mindspore/dataset/engine/validators.py +213 -52
- mindspore/dataset/text/__init__.py +10 -8
- mindspore/dataset/text/transforms.py +152 -57
- mindspore/dataset/text/utils.py +98 -49
- mindspore/dataset/text/validators.py +25 -0
- mindspore/dataset/transforms/__init__.py +4 -2
- mindspore/dataset/transforms/c_transforms.py +11 -13
- mindspore/dataset/transforms/py_transforms.py +2 -2
- mindspore/dataset/transforms/py_transforms_util.py +10 -0
- mindspore/dataset/transforms/transforms.py +13 -15
- mindspore/dataset/transforms/validators.py +7 -7
- mindspore/dataset/utils/__init__.py +2 -1
- mindspore/dataset/utils/browse_dataset.py +13 -13
- mindspore/dataset/utils/line_reader.py +121 -0
- mindspore/dataset/vision/__init__.py +8 -7
- mindspore/dataset/vision/c_transforms.py +125 -126
- mindspore/dataset/vision/py_transforms.py +37 -37
- mindspore/dataset/vision/py_transforms_util.py +23 -20
- mindspore/dataset/vision/transforms.py +316 -315
- mindspore/dataset/vision/utils.py +313 -17
- mindspore/dataset/vision/validators.py +6 -6
- mindspore/default_config.py +0 -1
- mindspore/dpcmi.dll +0 -0
- mindspore/{compression → experimental}/__init__.py +6 -5
- mindspore/experimental/map_parameter.py +275 -0
- mindspore/include/OWNERS +0 -1
- mindspore/include/api/callback/callback.h +9 -13
- mindspore/include/api/callback/ckpt_saver.h +2 -2
- mindspore/include/api/callback/loss_monitor.h +2 -2
- mindspore/include/api/callback/lr_scheduler.h +5 -5
- mindspore/include/api/callback/time_monitor.h +2 -2
- mindspore/include/api/callback/train_accuracy.h +4 -6
- mindspore/include/api/cfg.h +19 -6
- mindspore/include/api/context.h +70 -9
- mindspore/include/api/delegate.h +8 -1
- mindspore/include/api/dual_abi_helper.h +8 -24
- mindspore/include/api/metrics/accuracy.h +2 -2
- mindspore/include/api/metrics/metrics.h +4 -3
- mindspore/include/api/model.h +9 -4
- mindspore/include/api/model_group.h +68 -0
- mindspore/include/api/model_parallel_runner.h +17 -17
- mindspore/include/api/net.h +12 -11
- mindspore/include/api/serialization.h +20 -4
- mindspore/include/api/status.h +7 -1
- mindspore/include/api/types.h +25 -21
- mindspore/include/api/visible.h +4 -0
- mindspore/include/c_api/model_c.h +5 -0
- mindspore/include/c_api/status_c.h +1 -1
- mindspore/include/dataset/config.h +1 -1
- mindspore/include/dataset/constants.h +14 -0
- mindspore/include/dataset/text.h +59 -0
- mindspore/include/dataset/vision.h +56 -117
- mindspore/include/dataset/vision_lite.h +102 -0
- mindspore/jpeg62.dll +0 -0
- mindspore/log.py +28 -28
- mindspore/mindrecord/common/exceptions.py +2 -4
- mindspore/mindrecord/filereader.py +19 -1
- mindspore/mindrecord/filewriter.py +250 -88
- mindspore/mindrecord/mindpage.py +13 -13
- mindspore/mindrecord/shardheader.py +15 -15
- mindspore/mindrecord/shardreader.py +9 -0
- mindspore/mindrecord/shardwriter.py +29 -29
- mindspore/mindrecord/tools/cifar100_to_mr.py +9 -9
- mindspore/mindrecord/tools/cifar10_to_mr.py +9 -9
- mindspore/mindrecord/tools/csv_to_mr.py +4 -4
- mindspore/mindrecord/tools/imagenet_to_mr.py +70 -65
- mindspore/mindrecord/tools/mnist_to_mr.py +41 -41
- mindspore/mindrecord/tools/tfrecord_to_mr.py +6 -6
- mindspore/{libmindspore_backend.dll → mindspore_backend.dll} +0 -0
- mindspore/mindspore_common.dll +0 -0
- mindspore/mindspore_core.dll +0 -0
- mindspore/mindspore_glog.dll +0 -0
- mindspore/mindspore_shared_lib.dll +0 -0
- mindspore/msobj140.dll +0 -0
- mindspore/mspdb140.dll +0 -0
- mindspore/mspdbcore.dll +0 -0
- mindspore/mspdbst.dll +0 -0
- mindspore/mspft140.dll +0 -0
- mindspore/msvcdis140.dll +0 -0
- mindspore/msvcp140_1.dll +0 -0
- mindspore/msvcp140_2.dll +0 -0
- mindspore/msvcp140_atomic_wait.dll +0 -0
- mindspore/msvcp140_codecvt_ids.dll +0 -0
- mindspore/nn/__init__.py +1 -5
- mindspore/nn/cell.py +297 -234
- mindspore/nn/dynamic_lr.py +1 -1
- mindspore/nn/grad/cell_grad.py +17 -42
- mindspore/nn/layer/__init__.py +7 -4
- mindspore/nn/layer/activation.py +131 -88
- mindspore/nn/layer/basic.py +313 -613
- mindspore/nn/layer/channel_shuffle.py +103 -0
- mindspore/nn/layer/combined.py +1 -1
- mindspore/nn/layer/container.py +52 -6
- mindspore/nn/layer/conv.py +112 -43
- mindspore/nn/layer/dense.py +10 -9
- mindspore/nn/layer/embedding.py +36 -34
- mindspore/nn/layer/image.py +123 -27
- mindspore/nn/layer/math.py +108 -107
- mindspore/nn/layer/normalization.py +212 -366
- mindspore/nn/layer/padding.py +370 -42
- mindspore/nn/layer/pooling.py +1443 -219
- mindspore/nn/layer/rnn_cells.py +11 -16
- mindspore/nn/layer/rnns.py +38 -39
- mindspore/nn/layer/thor_layer.py +24 -25
- mindspore/nn/layer/timedistributed.py +5 -5
- mindspore/nn/layer/transformer.py +701 -0
- mindspore/nn/learning_rate_schedule.py +8 -8
- mindspore/nn/loss/__init__.py +9 -6
- mindspore/nn/loss/loss.py +678 -142
- mindspore/nn/metrics.py +53 -0
- mindspore/nn/optim/_dist_optimizer_registry.py +2 -2
- mindspore/nn/optim/ada_grad.py +8 -8
- mindspore/nn/optim/adadelta.py +2 -3
- mindspore/nn/optim/adafactor.py +18 -14
- mindspore/nn/optim/adam.py +429 -87
- mindspore/nn/optim/adamax.py +5 -6
- mindspore/nn/optim/adasum.py +10 -8
- mindspore/nn/optim/asgd.py +7 -7
- mindspore/nn/optim/ftrl.py +81 -11
- mindspore/nn/optim/lamb.py +7 -8
- mindspore/nn/optim/lars.py +4 -4
- mindspore/nn/optim/lazyadam.py +82 -7
- mindspore/nn/optim/momentum.py +8 -7
- mindspore/nn/optim/optimizer.py +19 -10
- mindspore/nn/optim/proximal_ada_grad.py +6 -5
- mindspore/nn/optim/rmsprop.py +3 -3
- mindspore/nn/optim/rprop.py +20 -16
- mindspore/nn/optim/sgd.py +21 -15
- mindspore/nn/optim/thor.py +23 -21
- mindspore/nn/probability/__init__.py +0 -2
- mindspore/nn/probability/bijector/bijector.py +7 -6
- mindspore/nn/probability/bijector/invert.py +4 -2
- mindspore/nn/probability/bijector/softplus.py +2 -2
- mindspore/nn/probability/bnn_layers/dense_variational.py +1 -1
- mindspore/nn/probability/bnn_layers/layer_distribution.py +2 -2
- mindspore/nn/probability/distribution/__init__.py +6 -0
- mindspore/nn/probability/distribution/_utils/custom_ops.py +3 -2
- mindspore/nn/probability/distribution/_utils/utils.py +11 -17
- mindspore/nn/probability/distribution/bernoulli.py +6 -6
- mindspore/nn/probability/distribution/beta.py +1 -1
- mindspore/nn/probability/distribution/categorical.py +9 -9
- mindspore/nn/probability/distribution/cauchy.py +8 -8
- mindspore/nn/probability/distribution/distribution.py +12 -6
- mindspore/nn/probability/distribution/exponential.py +5 -5
- mindspore/nn/probability/distribution/gamma.py +3 -3
- mindspore/nn/probability/distribution/geometric.py +6 -5
- mindspore/nn/probability/distribution/gumbel.py +5 -5
- mindspore/nn/probability/distribution/half_normal.py +133 -0
- mindspore/nn/probability/distribution/laplace.py +128 -0
- mindspore/nn/probability/distribution/log_normal.py +0 -1
- mindspore/nn/probability/distribution/logistic.py +4 -5
- mindspore/nn/probability/distribution/normal.py +11 -15
- mindspore/nn/probability/distribution/poisson.py +6 -2
- mindspore/nn/probability/distribution/student_t.py +150 -0
- mindspore/nn/probability/distribution/transformed_distribution.py +4 -4
- mindspore/nn/probability/distribution/uniform.py +5 -5
- mindspore/nn/reinforcement/_tensors_queue.py +3 -3
- mindspore/nn/reinforcement/tensor_array.py +2 -2
- mindspore/nn/sparse/sparse.py +8 -1
- mindspore/nn/wrap/cell_wrapper.py +55 -27
- mindspore/nn/wrap/grad_reducer.py +20 -11
- mindspore/nn/wrap/loss_scale.py +47 -30
- mindspore/numpy/array_creations.py +33 -22
- mindspore/numpy/array_ops.py +46 -42
- mindspore/numpy/logic_ops.py +6 -27
- mindspore/numpy/math_ops.py +26 -19
- mindspore/numpy/utils.py +1 -8
- mindspore/numpy/utils_const.py +112 -62
- mindspore/opencv_core452.dll +0 -0
- mindspore/opencv_imgcodecs452.dll +0 -0
- mindspore/opencv_imgproc452.dll +0 -0
- mindspore/ops/__init__.py +6 -3
- mindspore/ops/_constants.py +0 -6
- mindspore/ops/_grad/__init__.py +2 -1
- mindspore/ops/_grad/grad_array_ops.py +209 -152
- mindspore/ops/_grad/grad_base.py +55 -17
- mindspore/ops/_grad/grad_clip_ops.py +11 -3
- mindspore/ops/_grad/grad_comm_ops.py +58 -47
- mindspore/ops/_grad/grad_implementations.py +21 -61
- mindspore/ops/_grad/grad_inner_ops.py +48 -6
- mindspore/ops/_grad/grad_math_ops.py +306 -161
- mindspore/ops/_grad/grad_nn_ops.py +192 -181
- mindspore/ops/_grad/grad_other_ops.py +1 -1
- mindspore/ops/_grad/grad_quant_ops.py +5 -5
- mindspore/ops/_grad/grad_sequence_ops.py +296 -0
- mindspore/ops/_grad/grad_sparse.py +15 -9
- mindspore/ops/_grad_experimental/__init__.py +1 -0
- mindspore/ops/_grad_experimental/grad_array_ops.py +441 -55
- mindspore/ops/_grad_experimental/grad_image_ops.py +25 -7
- mindspore/ops/_grad_experimental/grad_inner_ops.py +3 -44
- mindspore/ops/_grad_experimental/grad_linalg_ops.py +16 -21
- mindspore/ops/_grad_experimental/grad_math_ops.py +979 -49
- mindspore/ops/_grad_experimental/grad_nn_ops.py +78 -8
- mindspore/ops/_grad_experimental/grad_scalar_ops.py +112 -0
- mindspore/ops/_grad_experimental/grad_sparse_ops.py +197 -13
- mindspore/ops/_op_impl/__init__.py +3 -3
- mindspore/ops/_op_impl/_custom_op/__init__.py +0 -1
- mindspore/ops/_op_impl/_custom_op/_basic.py +0 -1
- mindspore/ops/_op_impl/_custom_op/batch_matmul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold.py +4 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold2_grad_reduce.py +5 -5
- mindspore/ops/_op_impl/_custom_op/batchnorm_fold_grad.py +3 -3
- mindspore/ops/_op_impl/_custom_op/cholesky_trsm_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/correction_mul.py +3 -3
- mindspore/ops/_op_impl/_custom_op/correction_mul_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/dsd_back_impl.py +4 -8
- mindspore/ops/_op_impl/_custom_op/dsd_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perchannel_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_learned_scale_quant_perlayer_grad_reduce.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perchannel_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fake_quant_perlayer_grad.py +2 -2
- mindspore/ops/_op_impl/_custom_op/fused_abs_max1_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/img2col_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_left_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_cube_dense_right_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_left_cast_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_fracz_right_mul_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/matmul_cube_impl.py +2 -2
- mindspore/ops/_op_impl/_custom_op/matmul_dds_grad_impl.py +0 -1
- mindspore/ops/_op_impl/_custom_op/matmul_dds_impl.py +0 -1
- mindspore/ops/_op_impl/_custom_op/matrix_combine_impl.py +1 -1
- mindspore/ops/_op_impl/_custom_op/minmax_update_perchannel.py +2 -2
- mindspore/ops/_op_impl/_custom_op/minmax_update_perlayer.py +2 -2
- mindspore/ops/_op_impl/_custom_op/transpose02314_impl.py +1 -1
- mindspore/ops/_op_impl/aicpu/__init__.py +238 -3
- mindspore/ops/_op_impl/aicpu/abs.py +36 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d.py +34 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_2d_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_3d.py +39 -0
- mindspore/ops/_op_impl/aicpu/adaptive_avg_pool_3d_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_2d_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_3d.py +42 -0
- mindspore/ops/_op_impl/aicpu/adaptive_max_pool_3d_grad.py +152 -0
- mindspore/ops/_op_impl/aicpu/add.py +43 -0
- mindspore/ops/_op_impl/aicpu/addcdiv.py +0 -32
- mindspore/ops/_op_impl/aicpu/addcmul.py +0 -84
- mindspore/ops/_op_impl/aicpu/affine_grid_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/arg_max.py +75 -0
- mindspore/ops/_op_impl/aicpu/arg_min.py +75 -0
- mindspore/ops/_op_impl/aicpu/argmin_with_value.py +43 -0
- mindspore/ops/_op_impl/aicpu/batch_matmul.py +43 -0
- mindspore/ops/_op_impl/aicpu/batch_norm_grad_grad.py +49 -0
- mindspore/ops/_op_impl/aicpu/bernoulli.py +48 -0
- mindspore/ops/_op_impl/aicpu/bessel_i0.py +31 -0
- mindspore/ops/_op_impl/aicpu/bias_add.py +44 -0
- mindspore/ops/_op_impl/aicpu/bias_add_grad.py +43 -0
- mindspore/ops/_op_impl/aicpu/bincount.py +33 -0
- mindspore/{nn/probability/infer/variational/__init__.py → ops/_op_impl/aicpu/cauchy.py} +17 -10
- mindspore/ops/_op_impl/aicpu/channel_shuffle.py +40 -0
- mindspore/ops/_op_impl/aicpu/cholesky.py +1 -1
- mindspore/ops/_op_impl/{cpu/bias_add.py → aicpu/choleskygrad.py} +9 -7
- mindspore/ops/_op_impl/aicpu/combined_non_max_suppression.py +42 -0
- mindspore/ops/_op_impl/aicpu/concat_offset.py +42 -0
- mindspore/ops/_op_impl/aicpu/concat_offset_v1.py +31 -0
- mindspore/ops/_op_impl/aicpu/conj.py +11 -0
- mindspore/ops/_op_impl/aicpu/crop_and_resize_grad_image.py +38 -0
- mindspore/ops/_op_impl/aicpu/cumulative_logsumexp.py +36 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets.py +38 -0
- mindspore/ops/_op_impl/aicpu/deformable_offsets_grad.py +2 -2
- mindspore/ops/_op_impl/aicpu/dense_to_sparse_set_operation.py +48 -0
- mindspore/ops/_op_impl/aicpu/diag.py +36 -0
- mindspore/ops/_op_impl/aicpu/diag_part.py +36 -0
- mindspore/ops/_op_impl/aicpu/diagonal.py +35 -0
- mindspore/ops/_op_impl/{cpu/bias_add_grad.py → aicpu/digamma.py} +9 -7
- mindspore/ops/_op_impl/aicpu/eig.py +35 -0
- mindspore/ops/_op_impl/aicpu/fft_with_size.py +41 -0
- mindspore/ops/_op_impl/aicpu/flatten.py +1 -0
- mindspore/ops/_op_impl/aicpu/fmax.py +36 -0
- mindspore/ops/_op_impl/aicpu/fmin.py +37 -0
- mindspore/ops/_op_impl/aicpu/fractional_max_pool3d_with_fixed_ksize.py +1 -1
- mindspore/ops/_op_impl/aicpu/fse_decode.py +43 -0
- mindspore/ops/_op_impl/aicpu/glu.py +33 -0
- mindspore/ops/_op_impl/aicpu/glu_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/greater.py +41 -0
- mindspore/ops/_op_impl/aicpu/greater_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/index_put.py +50 -0
- mindspore/ops/_op_impl/{tbe/scatter_add_ds.py → aicpu/inplace_index_add.py} +17 -21
- mindspore/ops/_op_impl/aicpu/instance_norm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/instance_norm_v2_grad.py +44 -0
- mindspore/ops/_op_impl/aicpu/layer_norm_grad_grad.py +47 -0
- mindspore/ops/_op_impl/aicpu/less.py +41 -0
- mindspore/ops/_op_impl/aicpu/less_equal.py +41 -0
- mindspore/ops/_op_impl/aicpu/lgamma.py +32 -0
- mindspore/ops/_op_impl/aicpu/log_normal_reverse.py +33 -0
- mindspore/ops/_op_impl/aicpu/logit.py +33 -0
- mindspore/ops/_op_impl/aicpu/logit_grad.py +34 -0
- mindspore/ops/_op_impl/aicpu/masked_fill.py +42 -0
- mindspore/ops/_op_impl/aicpu/masked_scatter.py +39 -0
- mindspore/ops/_op_impl/aicpu/matmul.py +39 -0
- mindspore/ops/_op_impl/aicpu/matrix_logarithm.py +31 -0
- mindspore/ops/_op_impl/aicpu/matrix_power.py +32 -0
- mindspore/ops/_op_impl/aicpu/matrix_solve_ls.py +36 -0
- mindspore/ops/_op_impl/aicpu/matrix_triangular_solve.py +36 -0
- mindspore/ops/_op_impl/aicpu/mirror_pad.py +2 -0
- mindspore/ops/_op_impl/aicpu/mirror_pad_grad.py +0 -4
- mindspore/ops/_op_impl/aicpu/mul.py +3 -1
- mindspore/ops/_op_impl/aicpu/multinomial.py +14 -6
- mindspore/ops/_op_impl/aicpu/multinomial_with_replacement.py +35 -0
- mindspore/ops/_op_impl/aicpu/nan_to_num.py +34 -0
- mindspore/ops/_op_impl/aicpu/nllloss.py +38 -0
- mindspore/ops/_op_impl/aicpu/nllloss_grad.py +39 -0
- mindspore/ops/_op_impl/aicpu/ones_like.py +0 -2
- mindspore/ops/_op_impl/aicpu/polar.py +32 -0
- mindspore/ops/_op_impl/aicpu/polygamma.py +34 -0
- mindspore/ops/_op_impl/aicpu/qr.py +36 -0
- mindspore/ops/_op_impl/aicpu/quant_dtype_cast.py +40 -0
- mindspore/ops/_op_impl/aicpu/quantile.py +35 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_sparse.py +73 -0
- mindspore/ops/_op_impl/aicpu/ragged_tensor_to_tensor.py +74 -0
- mindspore/ops/_op_impl/aicpu/random_shuffle.py +3 -0
- mindspore/ops/_op_impl/aicpu/randperm_v2.py +41 -0
- mindspore/ops/_op_impl/aicpu/range.py +36 -0
- mindspore/ops/_op_impl/aicpu/reciprocal.py +34 -0
- mindspore/ops/_op_impl/aicpu/reciprocal_grad.py +35 -0
- mindspore/ops/_op_impl/aicpu/reduce_sum.py +57 -0
- mindspore/ops/_op_impl/aicpu/resize_bicubic.py +2 -8
- mindspore/ops/_op_impl/aicpu/resize_bicubic_grad.py +1 -1
- mindspore/ops/_op_impl/aicpu/resize_v2.py +68 -0
- mindspore/ops/_op_impl/aicpu/resize_v2_grad.py +68 -0
- mindspore/ops/_op_impl/aicpu/scatter_elements.py +4 -0
- mindspore/ops/_op_impl/aicpu/scatter_nd_update.py +2 -0
- mindspore/ops/_op_impl/aicpu/search_sorted.py +12 -6
- mindspore/ops/_op_impl/aicpu/self_adjoint_eig.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_add_offset.py +34 -0
- mindspore/ops/_op_impl/aicpu/sequence_addn.py +38 -0
- mindspore/ops/_op_impl/aicpu/slice_grad.py +76 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss.py +35 -0
- mindspore/ops/_op_impl/aicpu/smooth_l1_loss_grad.py +37 -0
- mindspore/ops/_op_impl/aicpu/sort.py +39 -0
- mindspore/ops/_op_impl/aicpu/sparse_apply_adagrad_da.py +0 -24
- mindspore/ops/_op_impl/aicpu/sparse_cross.py +42 -0
- mindspore/ops/_op_impl/aicpu/sparse_fill_empty_rows.py +63 -0
- mindspore/ops/_op_impl/aicpu/sparse_fill_empty_rows_grad.py +45 -0
- mindspore/ops/_op_impl/aicpu/sparse_matrix_mat_mul.py +56 -0
- mindspore/ops/_op_impl/{tbe/slice_ds.py → aicpu/sparse_segment_sum.py} +16 -24
- mindspore/ops/_op_impl/aicpu/sparse_segment_sum_with_num_segments.py +68 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice.py +63 -0
- mindspore/ops/_op_impl/aicpu/sparse_slice_grad.py +61 -0
- mindspore/ops/_op_impl/aicpu/squared_difference.py +2 -0
- mindspore/ops/_op_impl/aicpu/strided_slice_v2.py +93 -0
- mindspore/ops/_op_impl/aicpu/strided_slice_v2_grad.py +66 -0
- mindspore/ops/_op_impl/aicpu/tensor_scatter_update.py +59 -0
- mindspore/ops/_op_impl/{tbe/gather_v2.py → aicpu/tile.py} +24 -24
- mindspore/ops/_op_impl/aicpu/tridiagonal_solve.py +35 -0
- mindspore/ops/_op_impl/aicpu/tril_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/triu_indices.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform.py +34 -0
- mindspore/ops/_op_impl/aicpu/uniform_candidate_sampler.py +1 -0
- mindspore/ops/_op_impl/aicpu/unique_consecutive.py +10 -2
- mindspore/ops/_op_impl/cpu/__init__.py +1 -2
- mindspore/ops/_op_impl/cpu/dynamic_shape.py +5 -1
- mindspore/ops/_op_impl/cpu/maximum_grad.py +2 -0
- mindspore/{compression/common/__init__.py → ops/_op_impl/cpu/pyexecute.py} +13 -8
- mindspore/ops/_op_impl/cpu/reduce_sum.py +8 -0
- mindspore/ops/_op_impl/cpu/sparse_slice.py +62 -0
- mindspore/ops/_op_impl/cpu/sparse_slice_grad.py +60 -0
- mindspore/ops/_op_impl/cpu/tensor_shape.py +5 -1
- mindspore/ops/_op_impl/tbe/__init__.py +27 -608
- mindspore/ops/_op_impl/tbe/addcdiv_ds.py +42 -0
- mindspore/ops/_op_impl/tbe/addcmul_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/assign_add_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/avg_pool_3d_grad.py +1 -1
- mindspore/ops/_op_impl/tbe/basic_lstm_cell_c_state_grad_v2.py +0 -1
- mindspore/ops/_op_impl/tbe/batch_to_space.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/batch_to_space_nd_v2.py +41 -0
- mindspore/ops/_op_impl/tbe/bce_with_logits_loss.py +1 -0
- mindspore/ops/_op_impl/tbe/bias_add_grad.py +2 -0
- mindspore/ops/_op_impl/tbe/bn_infer_grad.py +4 -2
- mindspore/ops/_op_impl/tbe/bn_infer_grad_ds.py +40 -0
- mindspore/ops/_op_impl/tbe/bn_training_update.py +0 -1
- mindspore/ops/_op_impl/tbe/bn_training_update_ds.py +0 -1
- mindspore/ops/_op_impl/tbe/broadcast_to_ds.py +6 -4
- mindspore/ops/_op_impl/tbe/cast.py +0 -2
- mindspore/ops/_op_impl/tbe/cast_ds.py +3 -3
- mindspore/ops/_op_impl/tbe/ctc_loss_v2.py +0 -2
- mindspore/ops/_op_impl/tbe/ctc_loss_v2_grad.py +0 -2
- mindspore/ops/_op_impl/tbe/data_format_dim_map_ds.py +1 -0
- mindspore/ops/_op_impl/tbe/deformable_offsets.py +1 -0
- mindspore/ops/_op_impl/tbe/depthwise_conv2d.py +1 -1
- mindspore/ops/_op_impl/tbe/dynamic_atomic_addr_clean.py +1 -1
- mindspore/ops/_op_impl/tbe/gather_nd.py +1 -0
- mindspore/ops/_op_impl/tbe/greater.py +2 -0
- mindspore/ops/_op_impl/tbe/{index_add.py → inplace_index_add.py} +3 -6
- mindspore/ops/_op_impl/tbe/layer_norm_beta_gamma_backprop_v2.py +0 -1
- mindspore/ops/_op_impl/tbe/npu_clear_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/npu_get_float_status_v2.py +35 -0
- mindspore/ops/_op_impl/tbe/one_hot_ds.py +0 -6
- mindspore/ops/_op_impl/tbe/{greater_ds.py → reduce_all_ds.py} +13 -16
- mindspore/ops/_op_impl/tbe/reduce_any_ds.py +39 -0
- mindspore/ops/_op_impl/tbe/roi_align_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/roi_align_grad_ds.py +44 -0
- mindspore/ops/_op_impl/tbe/scatter_add.py +2 -0
- mindspore/ops/_op_impl/tbe/scatter_nd_add.py +2 -2
- mindspore/ops/_op_impl/tbe/slice.py +26 -15
- mindspore/ops/_op_impl/tbe/space_to_batch.py +1 -1
- mindspore/ops/_op_impl/tbe/space_to_batch_nd.py +1 -1
- mindspore/ops/_op_impl/tbe/strided_slice_grad_d.py +1 -0
- mindspore/ops/_op_impl/tbe/trans_data_ds.py +15 -5
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum.py +1 -1
- mindspore/ops/_op_impl/tbe/unsorted_segment_sum_ds.py +2 -0
- mindspore/ops/_primitive_cache.py +3 -2
- mindspore/ops/_register_for_op.py +11 -0
- mindspore/ops/_utils/__init__.py +1 -1
- mindspore/ops/_utils/utils.py +20 -41
- mindspore/ops/_vmap/__init__.py +2 -2
- mindspore/ops/_vmap/vmap_array_ops.py +170 -78
- mindspore/ops/_vmap/vmap_base.py +24 -10
- mindspore/ops/_vmap/vmap_convolution_ops.py +7 -10
- mindspore/ops/_vmap/vmap_grad_math_ops.py +4 -4
- mindspore/ops/_vmap/vmap_grad_nn_ops.py +41 -9
- mindspore/ops/_vmap/vmap_image_ops.py +52 -0
- mindspore/ops/_vmap/vmap_math_ops.py +77 -6
- mindspore/ops/_vmap/vmap_nn_ops.py +78 -29
- mindspore/ops/_vmap/vmap_other_ops.py +3 -1
- mindspore/ops/_vmap/vmap_random_ops.py +55 -3
- mindspore/ops/_vmap/vmap_sparse_ops.py +1 -0
- mindspore/ops/bprop_mindir/AdaptiveAvgPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/AdaptiveMaxPool2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ApproximateEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Argmax_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/Argmin_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/AssignSub_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/Assign_bprop.mindir +16 -16
- mindspore/ops/bprop_mindir/AvgPool3D_bprop.mindir +150 -0
- mindspore/ops/bprop_mindir/AvgPool_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/BCEWithLogitsLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BNTrainingReduce_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/BatchNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BatchToSpaceND_bprop.mindir +28 -0
- mindspore/ops/bprop_mindir/BiasAddGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/BinaryCrossEntropy_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/BroadcastTo_bprop.mindir +306 -0
- mindspore/ops/bprop_mindir/Broadcast_bprop.mindir +12 -8
- mindspore/ops/bprop_mindir/CTCLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Concat_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropFilter_bprop.mindir +240 -0
- mindspore/ops/bprop_mindir/Conv2DBackpropInput_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv2DTranspose_bprop.mindir +247 -0
- mindspore/ops/bprop_mindir/Conv3DTranspose_bprop.mindir +315 -0
- mindspore/ops/bprop_mindir/Conv3D_bprop.mindir +278 -0
- mindspore/ops/bprop_mindir/DType_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/DeformableOffsets_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/Depend_bprop.mindir +12 -13
- mindspore/ops/bprop_mindir/DepthToSpace_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/DepthwiseConv2dNative_bprop.mindir +138 -0
- mindspore/ops/bprop_mindir/DiagPart_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/Dropout2D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Dropout3D_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DropoutDoMask_bprop.mindir +22 -24
- mindspore/ops/bprop_mindir/DropoutGenMask_bprop.mindir +16 -14
- mindspore/ops/bprop_mindir/DropoutGrad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Dropout_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicGRUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicRNN_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/DynamicShape_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/Elu_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/EmbeddingLookup_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Equal_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/ExpandDims_bprop.mindir +58 -0
- mindspore/ops/bprop_mindir/FastGeLU_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Flatten_bprop.mindir +54 -0
- mindspore/ops/bprop_mindir/FloorDiv_bprop.mindir +18 -15
- mindspore/ops/bprop_mindir/GatherD_bprop.mindir +26 -0
- mindspore/ops/bprop_mindir/GatherNd_bprop.mindir +57 -0
- mindspore/ops/bprop_mindir/Gather_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/GreaterEqual_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/Greater_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/HSigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/HSwish_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/IOU_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/InstanceNorm_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/IsFinite_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/IsInf_bprop.mindir +13 -10
- mindspore/ops/bprop_mindir/IsNan_bprop.mindir +14 -11
- mindspore/ops/bprop_mindir/KLDivLoss_bprop.mindir +126 -0
- mindspore/ops/bprop_mindir/L2Loss_bprop.mindir +15 -0
- mindspore/ops/bprop_mindir/L2Normalize_bprop.mindir +30 -0
- mindspore/ops/bprop_mindir/LRN_bprop.mindir +43 -0
- mindspore/ops/bprop_mindir/LayerNormGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/LessEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/Less_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/LinSpace_bprop.mindir +22 -19
- mindspore/ops/bprop_mindir/Load_bprop.mindir +12 -13
- mindspore/ops/bprop_mindir/LogSoftmax_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/LogicalAnd_bprop.mindir +17 -18
- mindspore/ops/bprop_mindir/LogicalNot_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/MaskedSelect_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/MaxPool3DGradGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3DGrad_bprop.mindir +74 -0
- mindspore/ops/bprop_mindir/MaxPool3D_bprop.mindir +75 -0
- mindspore/ops/bprop_mindir/MaxPoolGradGrad_bprop.mindir +65 -0
- mindspore/ops/bprop_mindir/MaxPoolWithArgmax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Maximum_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Minimum_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/MirrorPad_bprop.mindir +27 -0
- mindspore/ops/bprop_mindir/Mish_bprop.mindir +35 -0
- mindspore/ops/bprop_mindir/MulNoNan_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NLLLoss_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/NonZero_bprop.mindir +14 -0
- mindspore/ops/bprop_mindir/NotEqual_bprop.mindir +18 -19
- mindspore/ops/bprop_mindir/OneHot_bprop.mindir +25 -23
- mindspore/ops/bprop_mindir/OnesLike_bprop.mindir +13 -13
- mindspore/ops/bprop_mindir/PReLU_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Pad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Padding_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/RNNTLoss_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ROIAlign_bprop.mindir +82 -0
- mindspore/ops/bprop_mindir/Range_bprop.mindir +21 -19
- mindspore/ops/bprop_mindir/Rank_bprop.mindir +11 -11
- mindspore/ops/bprop_mindir/ReLU6_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/ReLUV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ReduceAll_bprop.mindir +18 -17
- mindspore/ops/bprop_mindir/ReduceAny_bprop.mindir +18 -17
- mindspore/ops/bprop_mindir/ReluGrad_bprop.mindir +19 -23
- mindspore/ops/bprop_mindir/Reshape_bprop.mindir +60 -0
- mindspore/ops/bprop_mindir/ResizeBilinear_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/ResizeNearestNeighbor_bprop.mindir +89 -0
- mindspore/ops/bprop_mindir/ReverseSequence_bprop.mindir +52 -0
- mindspore/ops/bprop_mindir/ReverseV2_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/Round_bprop.mindir +14 -13
- mindspore/ops/bprop_mindir/ScatterMax_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ScatterMin_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/ScatterNdUpdate_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/ScatterNd_bprop.mindir +24 -0
- mindspore/ops/bprop_mindir/ScatterNonAliasingAdd_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/ScatterUpdate_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SeLU_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/Select_bprop.mindir +30 -34
- mindspore/ops/bprop_mindir/Shape_bprop.mindir +12 -12
- mindspore/ops/bprop_mindir/SigmoidCrossEntropyWithLogits_bprop.mindir +21 -0
- mindspore/ops/bprop_mindir/SigmoidGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Sigmoid_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Sign_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/Slice_bprop.mindir +26 -0
- mindspore/ops/bprop_mindir/SmoothL1Loss_bprop.mindir +36 -0
- mindspore/ops/bprop_mindir/SoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Softplus_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Softsign_bprop.mindir +33 -0
- mindspore/ops/bprop_mindir/Sort_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SpaceToBatchND_bprop.mindir +28 -0
- mindspore/ops/bprop_mindir/SpaceToDepth_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/SparseGatherV2_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/SparseSoftmaxCrossEntropyWithLogits_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Split_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/Squeeze_bprop.mindir +54 -0
- mindspore/ops/bprop_mindir/StridedSliceGrad_bprop.mindir +95 -0
- mindspore/ops/bprop_mindir/StridedSlice_bprop.mindir +98 -0
- mindspore/ops/bprop_mindir/Switch_bprop.mindir +28 -32
- mindspore/ops/bprop_mindir/TanhGrad_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/Tanh_bprop.mindir +66 -0
- mindspore/ops/bprop_mindir/TensorScatterAdd_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/TensorScatterUpdate_bprop.mindir +29 -0
- mindspore/ops/bprop_mindir/TensorShape_bprop.mindir +14 -0
- mindspore/ops/bprop_mindir/Tile_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TopK_bprop.mindir +0 -0
- mindspore/ops/bprop_mindir/TransShape_bprop.mindir +23 -0
- mindspore/ops/bprop_mindir/TruncateDiv_bprop.mindir +18 -15
- mindspore/ops/bprop_mindir/TupleGetItem_bprop.mindir +11 -13
- mindspore/ops/bprop_mindir/Unique_bprop.mindir +16 -0
- mindspore/ops/bprop_mindir/Unstack_bprop.mindir +22 -0
- mindspore/ops/bprop_mindir/UpsampleNearest3D_bprop.mindir +32 -0
- mindspore/ops/bprop_mindir/UpsampleTrilinear3D_bprop.mindir +38 -0
- mindspore/ops/bprop_mindir/ZerosLike_bprop.mindir +13 -12
- mindspore/ops/bprop_mindir/__init__.py +1 -4
- mindspore/ops/bprop_mindir/generate_mindir.py +32 -20
- mindspore/ops/composite/__init__.py +12 -13
- mindspore/ops/composite/base.py +261 -254
- mindspore/ops/composite/env_ops.py +41 -0
- mindspore/ops/composite/math_ops.py +197 -156
- mindspore/ops/composite/multitype_ops/_compile_utils.py +428 -176
- mindspore/ops/composite/multitype_ops/_constexpr_utils.py +188 -87
- mindspore/ops/composite/multitype_ops/add_impl.py +23 -1
- mindspore/ops/composite/multitype_ops/div_impl.py +3 -3
- mindspore/ops/composite/multitype_ops/equal_impl.py +1 -0
- mindspore/ops/composite/multitype_ops/floordiv_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/getitem_impl.py +52 -5
- mindspore/ops/composite/multitype_ops/greater_equal_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/greater_impl.py +31 -0
- mindspore/ops/composite/multitype_ops/in_impl.py +15 -3
- mindspore/ops/composite/multitype_ops/less_equal_impl.py +33 -2
- mindspore/ops/composite/multitype_ops/less_impl.py +33 -0
- mindspore/ops/composite/multitype_ops/logical_and_impl.py +2 -2
- mindspore/ops/composite/multitype_ops/logical_or_impl.py +2 -1
- mindspore/ops/composite/multitype_ops/mod_impl.py +1 -1
- mindspore/ops/composite/multitype_ops/mul_impl.py +21 -7
- mindspore/ops/composite/multitype_ops/not_in_impl.py +15 -3
- mindspore/ops/composite/multitype_ops/ones_like_impl.py +2 -4
- mindspore/ops/composite/multitype_ops/pow_impl.py +1 -0
- mindspore/ops/composite/multitype_ops/setitem_impl.py +62 -70
- mindspore/ops/composite/multitype_ops/sub_impl.py +3 -3
- mindspore/ops/composite/multitype_ops/zeros_like_impl.py +41 -4
- mindspore/ops/function/__init__.py +323 -8
- mindspore/ops/function/array_func.py +3511 -780
- mindspore/ops/function/clip_func.py +329 -0
- mindspore/ops/function/debug_func.py +6 -6
- mindspore/ops/function/grad/__init__.py +5 -1
- mindspore/ops/function/grad/grad_func.py +736 -65
- mindspore/ops/function/image_func.py +270 -0
- mindspore/ops/function/linalg_func.py +268 -8
- mindspore/ops/function/math_func.py +8032 -3164
- mindspore/ops/function/nn_func.py +5619 -1855
- mindspore/ops/function/other_func.py +115 -0
- mindspore/ops/function/parameter_func.py +11 -10
- mindspore/ops/function/random_func.py +939 -77
- mindspore/ops/function/sparse_func.py +249 -84
- mindspore/ops/function/sparse_unary_func.py +2303 -0
- mindspore/ops/function/spectral_func.py +146 -0
- mindspore/ops/function/vmap_func.py +114 -0
- mindspore/ops/functional.py +182 -254
- mindspore/ops/op_info_register.py +79 -34
- mindspore/ops/operations/__init__.py +210 -118
- mindspore/ops/operations/_csr_ops.py +7 -7
- mindspore/ops/operations/_embedding_cache_ops.py +25 -15
- mindspore/ops/operations/_grad_ops.py +447 -322
- mindspore/ops/operations/_inner_ops.py +547 -176
- mindspore/ops/operations/_map_tensor_ops.py +112 -0
- mindspore/ops/operations/_ms_kernel.py +29 -27
- mindspore/ops/operations/_ocr_ops.py +11 -11
- mindspore/ops/operations/_opaque_predicate_registry.py +41 -0
- mindspore/ops/operations/_quant_ops.py +186 -101
- mindspore/ops/operations/_rl_inner_ops.py +122 -61
- mindspore/ops/operations/_scalar_ops.py +466 -0
- mindspore/ops/operations/_sequence_ops.py +1047 -0
- mindspore/ops/operations/_tensor_array.py +10 -11
- mindspore/ops/operations/_thor_ops.py +4 -4
- mindspore/ops/operations/array_ops.py +1428 -1226
- mindspore/ops/operations/comm_ops.py +180 -117
- mindspore/ops/operations/control_ops.py +4 -2
- mindspore/ops/operations/custom_ops.py +185 -98
- mindspore/ops/operations/debug_ops.py +92 -54
- mindspore/ops/operations/image_ops.py +406 -211
- mindspore/ops/operations/inner_ops.py +42 -53
- mindspore/ops/operations/linalg_ops.py +32 -29
- mindspore/ops/operations/math_ops.py +2076 -897
- mindspore/ops/operations/nn_ops.py +1282 -1252
- mindspore/ops/operations/other_ops.py +124 -278
- mindspore/ops/operations/random_ops.py +345 -178
- mindspore/ops/operations/rl_ops.py +8 -9
- mindspore/ops/operations/sparse_ops.py +502 -157
- mindspore/ops/operations/spectral_ops.py +107 -0
- mindspore/ops/primitive.py +192 -15
- mindspore/ops/vm_impl_registry.py +23 -2
- mindspore/parallel/__init__.py +6 -1
- mindspore/parallel/_auto_parallel_context.py +199 -92
- mindspore/parallel/_cell_wrapper.py +4 -2
- mindspore/parallel/_cost_model_context.py +3 -0
- mindspore/parallel/_dp_allreduce_fusion.py +2 -1
- mindspore/parallel/_offload_context.py +185 -0
- mindspore/parallel/_parallel_serialization.py +167 -28
- mindspore/parallel/_ps_context.py +9 -5
- mindspore/parallel/_recovery_context.py +1 -1
- mindspore/parallel/_tensor.py +9 -1
- mindspore/{nn/transformer → parallel/_transformer}/__init__.py +6 -6
- mindspore/{nn/transformer → parallel/_transformer}/layers.py +59 -37
- mindspore/{nn/transformer → parallel/_transformer}/loss.py +4 -7
- mindspore/{nn/transformer → parallel/_transformer}/moe.py +160 -35
- mindspore/{nn/transformer → parallel/_transformer}/op_parallel_config.py +3 -3
- mindspore/{nn/transformer → parallel/_transformer}/transformer.py +235 -196
- mindspore/parallel/_utils.py +47 -7
- mindspore/parallel/algo_parameter_config.py +5 -1
- mindspore/parallel/checkpoint_transform.py +329 -0
- mindspore/parallel/shard.py +229 -0
- mindspore/perf_msvcbuildinsights.dll +0 -0
- mindspore/pgodb140.dll +0 -0
- mindspore/pgort140.dll +0 -0
- mindspore/profiler/__init__.py +2 -1
- mindspore/profiler/common/util.py +4 -3
- mindspore/profiler/common/validator/validate_path.py +2 -2
- mindspore/profiler/envprofiling.py +249 -0
- mindspore/profiler/parser/aicpu_data_parser.py +38 -39
- mindspore/profiler/parser/ascend_timeline_generator.py +497 -0
- mindspore/profiler/parser/base_timeline_generator.py +471 -0
- mindspore/profiler/parser/cpu_gpu_timeline_generator.py +684 -0
- mindspore/profiler/parser/framework_parser.py +42 -16
- mindspore/profiler/parser/hccl_parser.py +158 -158
- mindspore/profiler/parser/hwts_log_parser.py +7 -6
- mindspore/profiler/parser/integrator.py +18 -1579
- mindspore/profiler/parser/minddata_analyzer.py +8 -8
- mindspore/profiler/parser/msadvisor_analyzer.py +14 -27
- mindspore/profiler/parser/msadvisor_parser.py +2 -4
- mindspore/profiler/parser/optime_parser.py +17 -18
- mindspore/profiler/parser/profiler_info.py +108 -0
- mindspore/profiler/parser/step_trace_parser.py +1 -1
- mindspore/profiler/profiling.py +396 -194
- mindspore/rewrite/__init__.py +6 -2
- mindspore/rewrite/api/node.py +51 -110
- mindspore/rewrite/api/node_type.py +10 -6
- mindspore/rewrite/api/pattern_engine.py +51 -7
- mindspore/rewrite/api/scoped_value.py +64 -53
- mindspore/rewrite/api/symbol_tree.py +108 -61
- mindspore/rewrite/api/tree_node_helper.py +2 -3
- mindspore/{compression/quant/__init__.py → rewrite/ast_creator_register.py} +20 -11
- mindspore/rewrite/ast_helpers/__init__.py +6 -3
- mindspore/rewrite/ast_helpers/ast_creator.py +115 -0
- mindspore/rewrite/ast_helpers/ast_finder.py +99 -1
- mindspore/rewrite/ast_helpers/ast_modifier.py +17 -4
- mindspore/rewrite/ast_helpers/ast_replacer.py +1 -1
- mindspore/rewrite/ast_transformers/__init__.py +0 -1
- mindspore/rewrite/ast_transformers/flatten_recursive_stmt.py +46 -5
- mindspore/rewrite/ast_transformers/remove_return_out_of_if.py +6 -3
- mindspore/rewrite/common/__init__.py +2 -0
- mindspore/rewrite/common/event.py +1 -1
- mindspore/rewrite/common/observable.py +1 -1
- mindspore/rewrite/common/observer.py +1 -1
- mindspore/rewrite/common/rewrite_elog.py +35 -0
- mindspore/rewrite/namer.py +2 -2
- mindspore/rewrite/namespace.py +14 -4
- mindspore/rewrite/node.py +161 -13
- mindspore/rewrite/parser.py +0 -1
- mindspore/rewrite/parser_register.py +0 -1
- mindspore/rewrite/parsers/arguments_parser.py +3 -2
- mindspore/rewrite/parsers/assign_parser.py +267 -67
- mindspore/rewrite/parsers/attribute_parser.py +56 -0
- mindspore/rewrite/parsers/class_def_parser.py +191 -108
- mindspore/rewrite/parsers/constant_parser.py +101 -0
- mindspore/rewrite/parsers/container_parser.py +88 -0
- mindspore/rewrite/parsers/for_parser.py +28 -15
- mindspore/rewrite/parsers/function_def_parser.py +21 -5
- mindspore/rewrite/parsers/if_parser.py +11 -28
- mindspore/rewrite/parsers/module_parser.py +9 -6
- mindspore/rewrite/parsers/return_parser.py +3 -2
- mindspore/rewrite/sparsify/__init__.py +0 -0
- mindspore/rewrite/sparsify/sparse_transformer.py +448 -0
- mindspore/rewrite/sparsify/sparsify.py +109 -0
- mindspore/rewrite/sparsify/utils.py +173 -0
- mindspore/rewrite/symbol_tree.py +322 -109
- mindspore/rewrite/symbol_tree_builder.py +45 -8
- mindspore/rewrite/symbol_tree_dumper.py +0 -1
- mindspore/rewrite/topological_manager.py +1 -2
- mindspore/run_check/_check_version.py +209 -112
- mindspore/run_check/run_check.py +2 -1
- mindspore/tbbmalloc.dll +0 -0
- mindspore/tinyxml2.dll +0 -0
- mindspore/train/__init__.py +6 -4
- mindspore/train/_utils.py +28 -5
- mindspore/train/amp.py +321 -50
- mindspore/train/callback/__init__.py +3 -1
- mindspore/train/callback/_backup_and_restore.py +120 -0
- mindspore/train/callback/_callback.py +8 -8
- mindspore/train/callback/_checkpoint.py +12 -9
- mindspore/train/callback/_early_stop.py +13 -7
- mindspore/train/callback/_history.py +8 -8
- mindspore/train/callback/_lambda_callback.py +6 -6
- mindspore/train/callback/_landscape.py +36 -38
- mindspore/train/callback/_loss_monitor.py +12 -6
- mindspore/train/callback/_lr_scheduler_callback.py +2 -4
- mindspore/train/callback/_on_request_exit.py +212 -0
- mindspore/train/callback/_reduce_lr_on_plateau.py +13 -7
- mindspore/train/callback/_summary_collector.py +27 -19
- mindspore/train/callback/_time_monitor.py +13 -7
- mindspore/train/checkpoint_pb2.py +68 -8
- mindspore/train/data_sink.py +122 -33
- mindspore/train/dataset_helper.py +28 -87
- mindspore/train/loss_scale_manager.py +4 -7
- mindspore/{nn → train}/metrics/__init__.py +20 -20
- mindspore/{nn → train}/metrics/accuracy.py +12 -10
- mindspore/{nn → train}/metrics/auc.py +4 -4
- mindspore/{nn → train}/metrics/bleu_score.py +4 -4
- mindspore/{nn → train}/metrics/confusion_matrix.py +10 -8
- mindspore/{nn → train}/metrics/cosine_similarity.py +4 -4
- mindspore/{nn → train}/metrics/dice.py +6 -5
- mindspore/{nn → train}/metrics/error.py +7 -5
- mindspore/{nn → train}/metrics/fbeta.py +9 -7
- mindspore/{nn → train}/metrics/hausdorff_distance.py +8 -6
- mindspore/{nn → train}/metrics/loss.py +4 -3
- mindspore/{nn → train}/metrics/mean_surface_distance.py +6 -5
- mindspore/{nn → train}/metrics/metric.py +6 -5
- mindspore/{nn → train}/metrics/occlusion_sensitivity.py +4 -3
- mindspore/{nn → train}/metrics/perplexity.py +5 -4
- mindspore/{nn → train}/metrics/precision.py +5 -4
- mindspore/{nn → train}/metrics/recall.py +5 -4
- mindspore/{nn → train}/metrics/roc.py +7 -6
- mindspore/{nn → train}/metrics/root_mean_square_surface_distance.py +6 -5
- mindspore/{nn → train}/metrics/topk.py +7 -5
- mindspore/train/mind_ir_pb2.py +339 -32
- mindspore/train/model.py +113 -84
- mindspore/train/serialization.py +547 -167
- mindspore/train/summary/_summary_adapter.py +1 -1
- mindspore/train/summary/summary_record.py +43 -12
- mindspore/train/train_thor/convert_utils.py +7 -1
- mindspore/train/train_thor/dataset_helper.py +3 -3
- mindspore/train/train_thor/model_thor.py +0 -4
- mindspore/turbojpeg.dll +0 -0
- mindspore/vcmeta.dll +0 -0
- mindspore/vcruntime140.dll +0 -0
- mindspore/vcruntime140_1.dll +0 -0
- mindspore/version.py +1 -1
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/METADATA +4 -3
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/RECORD +901 -660
- mindspore/compression/common/constant.py +0 -124
- mindspore/compression/export/__init__.py +0 -19
- mindspore/compression/export/quant_export.py +0 -514
- mindspore/compression/quant/qat.py +0 -636
- mindspore/compression/quant/quant_utils.py +0 -462
- mindspore/compression/quant/quantizer.py +0 -68
- mindspore/libatomic-1.dll +0 -0
- mindspore/libgcc_s_seh-1.dll +0 -0
- mindspore/libgfortran-4.dll +0 -0
- mindspore/libgomp-1.dll +0 -0
- mindspore/libjpeg-62.dll +0 -0
- mindspore/libmindspore.dll +0 -0
- mindspore/libmindspore_common.dll +0 -0
- mindspore/libmindspore_core.dll +0 -0
- mindspore/libmindspore_glog.dll +0 -0
- mindspore/libnnacl.dll +0 -0
- mindspore/libopencv_core452.dll +0 -0
- mindspore/libopencv_imgcodecs452.dll +0 -0
- mindspore/libopencv_imgproc452.dll +0 -0
- mindspore/libquadmath-0.dll +0 -0
- mindspore/libsqlite3.dll +0 -0
- mindspore/libssp-0.dll +0 -0
- mindspore/libstdc++-6.dll +0 -0
- mindspore/libtinyxml2.dll +0 -0
- mindspore/libturbojpeg.dll +0 -0
- mindspore/libwinpthread-1.dll +0 -0
- mindspore/nn/layer/quant.py +0 -1868
- mindspore/nn/layer/rnn_utils.py +0 -90
- mindspore/nn/probability/dpn/__init__.py +0 -22
- mindspore/nn/probability/dpn/vae/__init__.py +0 -25
- mindspore/nn/probability/dpn/vae/cvae.py +0 -138
- mindspore/nn/probability/dpn/vae/vae.py +0 -122
- mindspore/nn/probability/infer/__init__.py +0 -22
- mindspore/nn/probability/infer/variational/elbo.py +0 -70
- mindspore/nn/probability/infer/variational/svi.py +0 -84
- mindspore/nn/probability/toolbox/__init__.py +0 -22
- mindspore/nn/probability/toolbox/anomaly_detection.py +0 -99
- mindspore/nn/probability/toolbox/uncertainty_evaluation.py +0 -363
- mindspore/nn/probability/transforms/__init__.py +0 -22
- mindspore/nn/probability/transforms/transform_bnn.py +0 -262
- mindspore/nn/probability/zhusuan/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/framework/bn.py +0 -95
- mindspore/nn/probability/zhusuan/variational/__init__.py +0 -18
- mindspore/nn/probability/zhusuan/variational/elbo.py +0 -46
- mindspore/ops/_op_impl/tbe/bias_add_grad_ds.py +0 -52
- mindspore/ops/_op_impl/tbe/scatter_nd_add_ds.py +0 -43
- mindspore/ops/bprop_mindir/AssignAdd_bprop.mindir +0 -20
- mindspore/ops/bprop_mindir/Identity_bprop.mindir +0 -9
- mindspore/ops/bprop_mindir/LogicalOr_bprop.mindir +0 -20
- mindspore/ops/bprop_mindir/ReLU_bprop.mindir +0 -16
- mindspore/ops/bprop_mindir/UpdateState_bprop.mindir +0 -17
- mindspore/ops/bprop_mindir/stop_gradient_bprop.mindir +0 -12
- mindspore/ops/composite/array_ops.py +0 -210
- mindspore/ops/composite/clip_ops.py +0 -238
- mindspore/ops/composite/random_ops.py +0 -426
- mindspore/ops/composite/vmap_ops.py +0 -38
- mindspore/ops/operations/sponge_ops.py +0 -3531
- mindspore/ops/operations/sponge_update_ops.py +0 -2546
- mindspore/parallel/nn/__init__.py +0 -42
- mindspore/parallel/nn/loss.py +0 -22
- mindspore/parallel/nn/moe.py +0 -21
- mindspore/parallel/nn/op_parallel_config.py +0 -22
- mindspore/parallel/nn/transformer.py +0 -31
- mindspore/run_check/_check_deps_version.py +0 -84
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/WHEEL +0 -0
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/entry_points.txt +0 -0
- {mindspore-1.10.0.dist-info → mindspore-2.0.0rc1.dist-info}/top_level.txt +0 -0
|
@@ -31,7 +31,7 @@ Examples:
|
|
|
31
31
|
>>> tokenizer = text.UnicodeCharTokenizer()
|
|
32
32
|
>>> # Load vocabulary from list
|
|
33
33
|
>>> vocab = text.Vocab.from_list(word_list=['深', '圳', '欢', '迎', '您'])
|
|
34
|
-
>>> # Use Lookup
|
|
34
|
+
>>> # Use Lookup operation to map tokens to ids
|
|
35
35
|
>>> lookup = text.Lookup(vocab=vocab)
|
|
36
36
|
>>> text_file_dataset = text_file_dataset.map(operations=[tokenizer, lookup])
|
|
37
37
|
>>> # if text line in dataset_file is:
|
|
@@ -49,11 +49,11 @@ import mindspore._c_dataengine as cde
|
|
|
49
49
|
from mindspore.common import dtype as mstype
|
|
50
50
|
|
|
51
51
|
from .utils import JiebaMode, NormalizeForm, to_str, SPieceTokenizerOutType, SPieceTokenizerLoadType, SentencePieceVocab
|
|
52
|
-
from .validators import check_lookup, check_jieba_add_dict, check_to_vectors, \
|
|
52
|
+
from .validators import check_add_token, check_lookup, check_jieba_add_dict, check_to_vectors, \
|
|
53
53
|
check_jieba_add_word, check_jieba_init, check_with_offsets, check_unicode_script_tokenizer, \
|
|
54
54
|
check_wordpiece_tokenizer, check_regex_replace, check_regex_tokenizer, check_basic_tokenizer, check_ngram, \
|
|
55
55
|
check_pair_truncate, check_to_number, check_bert_tokenizer, check_python_tokenizer, check_slidingwindow, \
|
|
56
|
-
check_sentence_piece_tokenizer
|
|
56
|
+
check_sentence_piece_tokenizer, check_truncate
|
|
57
57
|
from ..core.datatypes import mstype_to_detype
|
|
58
58
|
from ..core.validator_helpers import replace_none
|
|
59
59
|
from ..transforms.py_transforms_util import Implementation
|
|
@@ -91,6 +91,49 @@ DE_C_INTER_SENTENCEPIECE_OUTTYPE = {
|
|
|
91
91
|
}
|
|
92
92
|
|
|
93
93
|
|
|
94
|
+
class AddToken(TextTensorOperation):
|
|
95
|
+
"""
|
|
96
|
+
Add a token to the beginning or end of a sequence.
|
|
97
|
+
|
|
98
|
+
Args:
|
|
99
|
+
token (str): The token to be added.
|
|
100
|
+
begin (bool, optional): Choose the position where the token is inserted. If True,
|
|
101
|
+
the token will be inserted at the beginning of the sequence. Otherwise, it will
|
|
102
|
+
be inserted at the end of the sequence. Default: True.
|
|
103
|
+
|
|
104
|
+
Raises:
|
|
105
|
+
TypeError: If `token` is not of type string.
|
|
106
|
+
TypeError: If `begin` is not of type bool.
|
|
107
|
+
|
|
108
|
+
Supported Platforms:
|
|
109
|
+
``CPU``
|
|
110
|
+
|
|
111
|
+
Examples:
|
|
112
|
+
>>> dataset = ds.NumpySlicesDataset(data={"text": [['a', 'b', 'c', 'd', 'e']]})
|
|
113
|
+
>>> # Data before
|
|
114
|
+
>>> # | text |
|
|
115
|
+
>>> # +---------------------------+
|
|
116
|
+
>>> # | ['a', 'b', 'c', 'd', 'e'] |
|
|
117
|
+
>>> # +---------------------------+
|
|
118
|
+
>>> add_token_op = text.AddToken(token='TOKEN', begin=True)
|
|
119
|
+
>>> dataset = dataset.map(operations=add_token_op)
|
|
120
|
+
>>> # Data after
|
|
121
|
+
>>> # | text |
|
|
122
|
+
>>> # +---------------------------+
|
|
123
|
+
>>> # | ['TOKEN', 'a', 'b', 'c', 'd', 'e'] |
|
|
124
|
+
>>> # +---------------------------+
|
|
125
|
+
"""
|
|
126
|
+
|
|
127
|
+
@check_add_token
|
|
128
|
+
def __init__(self, token, begin=True):
|
|
129
|
+
super().__init__()
|
|
130
|
+
self.token = token
|
|
131
|
+
self.begin = begin
|
|
132
|
+
|
|
133
|
+
def parse(self):
|
|
134
|
+
return cde.AddTokenOperation(self.token, self.begin)
|
|
135
|
+
|
|
136
|
+
|
|
94
137
|
class JiebaTokenizer(TextTensorOperation):
|
|
95
138
|
"""
|
|
96
139
|
Tokenize Chinese string into words based on dictionary.
|
|
@@ -104,12 +147,15 @@ class JiebaTokenizer(TextTensorOperation):
|
|
|
104
147
|
mp_path (str): Dictionary file is used by MPSegment algorithm.
|
|
105
148
|
The dictionary can be obtained on the official website of cppjieba.
|
|
106
149
|
mode (JiebaMode, optional): Valid values can be any of [JiebaMode.MP, JiebaMode.HMM,
|
|
107
|
-
JiebaMode.MIX]
|
|
150
|
+
JiebaMode.MIX]. Default: JiebaMode.MIX.
|
|
108
151
|
|
|
109
152
|
- JiebaMode.MP, tokenize with MPSegment algorithm.
|
|
153
|
+
|
|
110
154
|
- JiebaMode.HMM, tokenize with Hidden Markov Model Segment algorithm.
|
|
155
|
+
|
|
111
156
|
- JiebaMode.MIX, tokenize with a mix of MPSegment and HMMSegment algorithm.
|
|
112
|
-
|
|
157
|
+
|
|
158
|
+
with_offsets (bool, optional): Whether to output offsets of tokens. Default: False.
|
|
113
159
|
|
|
114
160
|
Raises:
|
|
115
161
|
ValueError: If path of HMMSegment dict is not provided.
|
|
@@ -121,6 +167,7 @@ class JiebaTokenizer(TextTensorOperation):
|
|
|
121
167
|
``CPU``
|
|
122
168
|
|
|
123
169
|
Examples:
|
|
170
|
+
>>> import mindspore.dataset.text as text
|
|
124
171
|
>>> from mindspore.dataset.text import JiebaMode
|
|
125
172
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
126
173
|
>>> jieba_hmm_file = "/path/to/jieba/hmm/file"
|
|
@@ -131,8 +178,7 @@ class JiebaTokenizer(TextTensorOperation):
|
|
|
131
178
|
>>> # ["offsets_limit", dtype=uint32]}
|
|
132
179
|
>>> tokenizer_op = text.JiebaTokenizer(jieba_hmm_file, jieba_mp_file, mode=JiebaMode.MP, with_offsets=True)
|
|
133
180
|
>>> text_file_dataset_1 = text_file_dataset_1.map(operations=tokenizer_op, input_columns=["text"],
|
|
134
|
-
... output_columns=["token", "offsets_start", "offsets_limit"]
|
|
135
|
-
... column_order=["token", "offsets_start", "offsets_limit"])
|
|
181
|
+
... output_columns=["token", "offsets_start", "offsets_limit"])
|
|
136
182
|
"""
|
|
137
183
|
|
|
138
184
|
@check_jieba_init
|
|
@@ -173,9 +219,10 @@ class JiebaTokenizer(TextTensorOperation):
|
|
|
173
219
|
word (str): The word to be added to the JiebaTokenizer instance.
|
|
174
220
|
The added word will not be written into the built-in dictionary on disk.
|
|
175
221
|
freq (int, optional): The frequency of the word to be added. The higher the frequency,
|
|
176
|
-
the better chance the word will be tokenized
|
|
222
|
+
the better chance the word will be tokenized. Default: None, use default frequency.
|
|
177
223
|
|
|
178
224
|
Examples:
|
|
225
|
+
>>> import mindspore.dataset.text as text
|
|
179
226
|
>>> from mindspore.dataset.text import JiebaMode
|
|
180
227
|
>>> jieba_hmm_file = "/path/to/jieba/hmm/file"
|
|
181
228
|
>>> jieba_mp_file = "/path/to/jieba/mp/file"
|
|
@@ -280,9 +327,9 @@ class Lookup(TextTensorOperation):
|
|
|
280
327
|
vocab (Vocab): A vocabulary object.
|
|
281
328
|
unknown_token (str, optional): Word used for lookup. If a word is out of vocabulary (OOV),
|
|
282
329
|
the result of lookup will be replaced with unknown_token. If the unknown_token is not specified or
|
|
283
|
-
it is OOV, runtime error will be thrown
|
|
330
|
+
it is OOV, runtime error will be thrown. Default: None, means no unknown_token is specified.
|
|
284
331
|
data_type (mindspore.dtype, optional): The data type that lookup operation maps
|
|
285
|
-
string to
|
|
332
|
+
string to. Default: mindspore.int32.
|
|
286
333
|
|
|
287
334
|
Raises:
|
|
288
335
|
TypeError: If `vocab` is not of type text.Vocab.
|
|
@@ -293,9 +340,10 @@ class Lookup(TextTensorOperation):
|
|
|
293
340
|
``CPU``
|
|
294
341
|
|
|
295
342
|
Examples:
|
|
343
|
+
>>> import mindspore.dataset.text as text
|
|
296
344
|
>>> # Load vocabulary from list
|
|
297
345
|
>>> vocab = text.Vocab.from_list(['深', '圳', '欢', '迎', '您'])
|
|
298
|
-
>>> # Use Lookup
|
|
346
|
+
>>> # Use Lookup operation to map tokens to ids
|
|
299
347
|
>>> lookup = text.Lookup(vocab)
|
|
300
348
|
>>> text_file_dataset = text_file_dataset.map(operations=[lookup])
|
|
301
349
|
"""
|
|
@@ -325,13 +373,13 @@ class Ngram(TextTensorOperation):
|
|
|
325
373
|
an empty string produced.
|
|
326
374
|
left_pad (tuple, optional): Padding performed on left side of the sequence shaped like ("pad_token", pad_width).
|
|
327
375
|
`pad_width` will be capped at n-1. For example, specifying left_pad=("_", 2) would pad left side of the
|
|
328
|
-
sequence with "__" (
|
|
376
|
+
sequence with "__". Default: ('', 0).
|
|
329
377
|
right_pad (tuple, optional): Padding performed on right side of the sequence shaped like
|
|
330
378
|
("pad_token", pad_width). `pad_width` will be capped at n-1. For example, specifying right_pad=("_", 2)
|
|
331
|
-
would pad right side of the sequence with "__" (
|
|
379
|
+
would pad right side of the sequence with "__". Default: ('', 0).
|
|
332
380
|
separator (str, optional): Symbol used to join strings together. For example, if 2-gram is
|
|
333
|
-
["mindspore", "amazing"] with separator="-", the result would be ["mindspore-amazing"]
|
|
334
|
-
|
|
381
|
+
["mindspore", "amazing"] with separator="-", the result would be ["mindspore-amazing"].
|
|
382
|
+
Default: ' ', which will use whitespace as separator.
|
|
335
383
|
|
|
336
384
|
Raises:
|
|
337
385
|
TypeError: If values of `n` are not of type int.
|
|
@@ -344,6 +392,7 @@ class Ngram(TextTensorOperation):
|
|
|
344
392
|
``CPU``
|
|
345
393
|
|
|
346
394
|
Examples:
|
|
395
|
+
>>> import mindspore.dataset.text as text
|
|
347
396
|
>>> ngram_op = text.Ngram(3, separator="-")
|
|
348
397
|
>>> output = ngram_op(["WildRose Country", "Canada's Ocean Playground", "Land of Living Skies"])
|
|
349
398
|
>>> # output
|
|
@@ -429,6 +478,7 @@ class SentencePieceTokenizer(TextTensorOperation):
|
|
|
429
478
|
``CPU``
|
|
430
479
|
|
|
431
480
|
Examples:
|
|
481
|
+
>>> import mindspore.dataset.text as text
|
|
432
482
|
>>> from mindspore.dataset.text import SentencePieceModel, SPieceTokenizerOutType
|
|
433
483
|
>>> sentence_piece_vocab_file = "/path/to/sentence/piece/vocab/file"
|
|
434
484
|
>>> vocab = text.SentencePieceVocab.from_file([sentence_piece_vocab_file], 5000, 0.9995,
|
|
@@ -455,7 +505,7 @@ class SlidingWindow(TextTensorOperation):
|
|
|
455
505
|
|
|
456
506
|
Args:
|
|
457
507
|
width (int): The width of the window. It must be an integer and greater than zero.
|
|
458
|
-
axis (int, optional): The axis along which the sliding window is computed
|
|
508
|
+
axis (int, optional): The axis along which the sliding window is computed. Default: 0.
|
|
459
509
|
|
|
460
510
|
Raises:
|
|
461
511
|
TypeError: If `width` is not of type int.
|
|
@@ -466,6 +516,7 @@ class SlidingWindow(TextTensorOperation):
|
|
|
466
516
|
``CPU``
|
|
467
517
|
|
|
468
518
|
Examples:
|
|
519
|
+
>>> import mindspore.dataset as ds
|
|
469
520
|
>>> dataset = ds.NumpySlicesDataset(data=[[1, 2, 3, 4, 5]], column_names="col1")
|
|
470
521
|
>>> # Data before
|
|
471
522
|
>>> # | col1 |
|
|
@@ -512,6 +563,8 @@ class ToNumber(TextTensorOperation):
|
|
|
512
563
|
``CPU``
|
|
513
564
|
|
|
514
565
|
Examples:
|
|
566
|
+
>>> import mindspore.dataset as ds
|
|
567
|
+
>>> import mindspore.dataset.text as text
|
|
515
568
|
>>> from mindspore import dtype as mstype
|
|
516
569
|
>>> data = [["1", "2", "3"]]
|
|
517
570
|
>>> dataset = ds.NumpySlicesDataset(data)
|
|
@@ -535,11 +588,11 @@ class ToVectors(TextTensorOperation):
|
|
|
535
588
|
|
|
536
589
|
Args:
|
|
537
590
|
vectors (Vectors): A vectors object.
|
|
538
|
-
unk_init (sequence, optional): Sequence used to initialize out-of-vectors (OOV) token
|
|
539
|
-
|
|
591
|
+
unk_init (sequence, optional): Sequence used to initialize out-of-vectors (OOV) token.
|
|
592
|
+
Default: None, initialize with zero vectors.
|
|
540
593
|
lower_case_backup (bool, optional): Whether to look up the token in the lower case. If False, each token in the
|
|
541
594
|
original case will be looked up; if True, each token in the original case will be looked up first, if not
|
|
542
|
-
found in the keys of the property stoi, the token in the lower case will be looked up
|
|
595
|
+
found in the keys of the property stoi, the token in the lower case will be looked up. Default: False.
|
|
543
596
|
|
|
544
597
|
Raises:
|
|
545
598
|
TypeError: If `unk_init` is not of type sequence.
|
|
@@ -550,9 +603,10 @@ class ToVectors(TextTensorOperation):
|
|
|
550
603
|
``CPU``
|
|
551
604
|
|
|
552
605
|
Examples:
|
|
606
|
+
>>> import mindspore.dataset.text as text
|
|
553
607
|
>>> # Load vectors from file
|
|
554
608
|
>>> vectors = text.Vectors.from_file("/path/to/vectors/file")
|
|
555
|
-
>>> # Use ToVectors
|
|
609
|
+
>>> # Use ToVectors operation to map tokens to vectors
|
|
556
610
|
>>> to_vectors = text.ToVectors(vectors)
|
|
557
611
|
>>> text_file_dataset = text_file_dataset.map(operations=[to_vectors])
|
|
558
612
|
"""
|
|
@@ -568,6 +622,46 @@ class ToVectors(TextTensorOperation):
|
|
|
568
622
|
return cde.ToVectorsOperation(self.vectors, self.unk_init, self.lower_case_backup)
|
|
569
623
|
|
|
570
624
|
|
|
625
|
+
class Truncate(TextTensorOperation):
|
|
626
|
+
"""
|
|
627
|
+
Truncate the input sequence so that it does not exceed the maximum length.
|
|
628
|
+
|
|
629
|
+
Args:
|
|
630
|
+
max_seq_len (int): Maximum allowable length.
|
|
631
|
+
|
|
632
|
+
Raises:
|
|
633
|
+
TypeError: If `max_seq_len` is not of type int.
|
|
634
|
+
ValueError: If the value of `max_seq_len` is less than 0.
|
|
635
|
+
RuntimeError: If the input tensor is not of dtype bool, int, float, double or str.
|
|
636
|
+
|
|
637
|
+
Supported Platforms:
|
|
638
|
+
``CPU``
|
|
639
|
+
|
|
640
|
+
Examples:
|
|
641
|
+
>>> dataset = ds.NumpySlicesDataset(data=[['a', 'b', 'c', 'd', 'e']], column_names=["text"], shuffle=False)
|
|
642
|
+
>>> # Data before
|
|
643
|
+
>>> # | col1 |
|
|
644
|
+
>>> # +---------------------------+
|
|
645
|
+
>>> # | ['a', 'b', 'c', 'd', 'e'] |
|
|
646
|
+
>>> # +---------------------------+
|
|
647
|
+
>>> truncate = text.Truncate(4)
|
|
648
|
+
>>> dataset = dataset.map(operations=truncate, input_columns=["text"])
|
|
649
|
+
>>> # Data after
|
|
650
|
+
>>> # | col1 |
|
|
651
|
+
>>> # +------------------------+
|
|
652
|
+
>>> # | ['a', 'b', 'c', 'd'] |
|
|
653
|
+
>>> # +------------------------+
|
|
654
|
+
"""
|
|
655
|
+
|
|
656
|
+
@check_truncate
|
|
657
|
+
def __init__(self, max_seq_len):
|
|
658
|
+
super().__init__()
|
|
659
|
+
self.max_seq_len = max_seq_len
|
|
660
|
+
|
|
661
|
+
def parse(self):
|
|
662
|
+
return cde.TruncateOperation(self.max_seq_len)
|
|
663
|
+
|
|
664
|
+
|
|
571
665
|
class TruncateSequencePair(TextTensorOperation):
|
|
572
666
|
"""
|
|
573
667
|
Truncate a pair of rank-1 tensors such that the total length is less than max_length.
|
|
@@ -584,6 +678,7 @@ class TruncateSequencePair(TextTensorOperation):
|
|
|
584
678
|
``CPU``
|
|
585
679
|
|
|
586
680
|
Examples:
|
|
681
|
+
>>> import mindspore.dataset.text as text
|
|
587
682
|
>>> dataset = ds.NumpySlicesDataset(data={"col1": [[1, 2, 3]], "col2": [[4, 5]]})
|
|
588
683
|
>>> # Data before
|
|
589
684
|
>>> # | col1 | col2 |
|
|
@@ -613,7 +708,7 @@ class UnicodeCharTokenizer(TextTensorOperation):
|
|
|
613
708
|
Tokenize a scalar tensor of UTF-8 string to Unicode characters.
|
|
614
709
|
|
|
615
710
|
Args:
|
|
616
|
-
with_offsets (bool, optional): Whether or not output offsets of tokens
|
|
711
|
+
with_offsets (bool, optional): Whether or not output offsets of tokens. Default: False.
|
|
617
712
|
|
|
618
713
|
Raises:
|
|
619
714
|
TypeError: If `with_offsets` is not of type bool.
|
|
@@ -622,6 +717,7 @@ class UnicodeCharTokenizer(TextTensorOperation):
|
|
|
622
717
|
``CPU``
|
|
623
718
|
|
|
624
719
|
Examples:
|
|
720
|
+
>>> import mindspore.dataset.text as text
|
|
625
721
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
626
722
|
>>> tokenizer_op = text.UnicodeCharTokenizer(with_offsets=False)
|
|
627
723
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op)
|
|
@@ -629,8 +725,7 @@ class UnicodeCharTokenizer(TextTensorOperation):
|
|
|
629
725
|
>>> # ["offsets_limit", dtype=uint32]}
|
|
630
726
|
>>> tokenizer_op = text.UnicodeCharTokenizer(with_offsets=True)
|
|
631
727
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op, input_columns=["text"],
|
|
632
|
-
... output_columns=["token", "offsets_start", "offsets_limit"]
|
|
633
|
-
... column_order=["token", "offsets_start", "offsets_limit"])
|
|
728
|
+
... output_columns=["token", "offsets_start", "offsets_limit"])
|
|
634
729
|
"""
|
|
635
730
|
|
|
636
731
|
@check_with_offsets
|
|
@@ -657,7 +752,7 @@ class WordpieceTokenizer(TextTensorOperation):
|
|
|
657
752
|
with_offsets (bool, optional): Whether to return the offsets of tokens. Default: False.
|
|
658
753
|
|
|
659
754
|
Raises:
|
|
660
|
-
TypeError: If `vocab` is not of type :class:`mindspore.dataset.text.Vocab
|
|
755
|
+
TypeError: If `vocab` is not of type :class:`mindspore.dataset.text.Vocab` .
|
|
661
756
|
TypeError: If `suffix_indicator` is not of type str.
|
|
662
757
|
TypeError: If `max_bytes_per_token` is not of type int.
|
|
663
758
|
TypeError: If `unknown_token` is not of type str.
|
|
@@ -668,6 +763,7 @@ class WordpieceTokenizer(TextTensorOperation):
|
|
|
668
763
|
``CPU``
|
|
669
764
|
|
|
670
765
|
Examples:
|
|
766
|
+
>>> import mindspore.dataset.text as text
|
|
671
767
|
>>> vocab_list = ["book", "cholera", "era", "favor", "##ite", "my", "is", "love", "dur", "##ing", "the"]
|
|
672
768
|
>>> vocab = text.Vocab.from_list(vocab_list)
|
|
673
769
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
@@ -679,8 +775,7 @@ class WordpieceTokenizer(TextTensorOperation):
|
|
|
679
775
|
>>> tokenizer_op = text.WordpieceTokenizer(vocab=vocab, unknown_token='[UNK]',
|
|
680
776
|
... max_bytes_per_token=100, with_offsets=True)
|
|
681
777
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op, input_columns=["text"],
|
|
682
|
-
... output_columns=["token", "offsets_start", "offsets_limit"]
|
|
683
|
-
... column_order=["token", "offsets_start", "offsets_limit"])
|
|
778
|
+
... output_columns=["token", "offsets_start", "offsets_limit"])
|
|
684
779
|
"""
|
|
685
780
|
|
|
686
781
|
@check_wordpiece_tokenizer
|
|
@@ -718,10 +813,10 @@ if platform.system().lower() != 'windows':
|
|
|
718
813
|
Args:
|
|
719
814
|
lower_case (bool, optional): Whether to perform lowercase processing on the text. If True, will fold the
|
|
720
815
|
text to lower case and strip accented characters. If False, will only perform normalization on the
|
|
721
|
-
text, with mode specified by `normalization_form
|
|
816
|
+
text, with mode specified by `normalization_form` . Default: False.
|
|
722
817
|
keep_whitespace (bool, optional): If True, the whitespace will be kept in the output. Default: False.
|
|
723
818
|
normalization_form (NormalizeForm, optional):
|
|
724
|
-
`Unicode normalization forms <http://unicode.org/reports/tr15/>`_, only valid when `lower_case`
|
|
819
|
+
`Unicode normalization forms <http://unicode.org/reports/tr15/>`_ , only valid when `lower_case`
|
|
725
820
|
is False, can be NormalizeForm.NONE, NormalizeForm.NFC, NormalizeForm.NFKC, NormalizeForm.NFD or
|
|
726
821
|
NormalizeForm.NFKD. Default: NormalizeForm.NONE.
|
|
727
822
|
|
|
@@ -738,7 +833,7 @@ if platform.system().lower() != 'windows':
|
|
|
738
833
|
Raises:
|
|
739
834
|
TypeError: If `lower_case` is not of type bool.
|
|
740
835
|
TypeError: If `keep_whitespace` is not of type bool.
|
|
741
|
-
TypeError: If `normalization_form` is not of type :class:`mindspore.dataset.text.NormalizeForm
|
|
836
|
+
TypeError: If `normalization_form` is not of type :class:`mindspore.dataset.text.NormalizeForm` .
|
|
742
837
|
TypeError: If `preserve_unused_token` is not of type bool.
|
|
743
838
|
TypeError: If `with_offsets` is not of type bool.
|
|
744
839
|
RuntimeError: If dtype of input Tensor is not str.
|
|
@@ -747,6 +842,7 @@ if platform.system().lower() != 'windows':
|
|
|
747
842
|
``CPU``
|
|
748
843
|
|
|
749
844
|
Examples:
|
|
845
|
+
>>> import mindspore.dataset.text as text
|
|
750
846
|
>>> from mindspore.dataset.text import NormalizeForm
|
|
751
847
|
>>>
|
|
752
848
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
@@ -766,9 +862,7 @@ if platform.system().lower() != 'windows':
|
|
|
766
862
|
... with_offsets=True)
|
|
767
863
|
>>> text_file_dataset_1 = text_file_dataset_1.map(operations=tokenizer_op, input_columns=["text"],
|
|
768
864
|
... output_columns=["token", "offsets_start",
|
|
769
|
-
... "offsets_limit"]
|
|
770
|
-
... column_order=["token", "offsets_start",
|
|
771
|
-
... "offsets_limit"])
|
|
865
|
+
... "offsets_limit"])
|
|
772
866
|
"""
|
|
773
867
|
|
|
774
868
|
@check_basic_tokenizer
|
|
@@ -806,10 +900,10 @@ if platform.system().lower() != 'windows':
|
|
|
806
900
|
output. Default: '[UNK]'.
|
|
807
901
|
lower_case (bool, optional): Whether to perform lowercase processing on the text. If True, will fold the
|
|
808
902
|
text to lower case and strip accented characters. If False, will only perform normalization on the
|
|
809
|
-
text, with mode specified by `normalization_form
|
|
903
|
+
text, with mode specified by `normalization_form` . Default: False.
|
|
810
904
|
keep_whitespace (bool, optional): If True, the whitespace will be kept in the output. Default: False.
|
|
811
905
|
normalization_form (NormalizeForm, optional):
|
|
812
|
-
`Unicode normalization forms <http://unicode.org/reports/tr15/>`_, only valid when `lower_case`
|
|
906
|
+
`Unicode normalization forms <http://unicode.org/reports/tr15/>`_ , only valid when `lower_case`
|
|
813
907
|
is False, can be NormalizeForm.NONE, NormalizeForm.NFC, NormalizeForm.NFKC, NormalizeForm.NFD or
|
|
814
908
|
NormalizeForm.NFKD. Default: NormalizeForm.NONE.
|
|
815
909
|
|
|
@@ -824,14 +918,14 @@ if platform.system().lower() != 'windows':
|
|
|
824
918
|
with_offsets (bool, optional): Whether to return the offsets of tokens. Default: False.
|
|
825
919
|
|
|
826
920
|
Raises:
|
|
827
|
-
TypeError: If `vocab` is not of type :class:`mindspore.dataset.text.Vocab
|
|
921
|
+
TypeError: If `vocab` is not of type :class:`mindspore.dataset.text.Vocab` .
|
|
828
922
|
TypeError: If `suffix_indicator` is not of type str.
|
|
829
923
|
TypeError: If `max_bytes_per_token` is not of type int.
|
|
830
924
|
ValueError: If `max_bytes_per_token` is negative.
|
|
831
925
|
TypeError: If `unknown_token` is not of type str.
|
|
832
926
|
TypeError: If `lower_case` is not of type bool.
|
|
833
927
|
TypeError: If `keep_whitespace` is not of type bool.
|
|
834
|
-
TypeError: If `normalization_form` is not of type :class:`mindspore.dataset.text.NormalizeForm
|
|
928
|
+
TypeError: If `normalization_form` is not of type :class:`mindspore.dataset.text.NormalizeForm` .
|
|
835
929
|
TypeError: If `preserve_unused_token` is not of type bool.
|
|
836
930
|
TypeError: If `with_offsets` is not of type bool.
|
|
837
931
|
|
|
@@ -839,6 +933,7 @@ if platform.system().lower() != 'windows':
|
|
|
839
933
|
``CPU``
|
|
840
934
|
|
|
841
935
|
Examples:
|
|
936
|
+
>>> import mindspore.dataset.text as text
|
|
842
937
|
>>> from mindspore.dataset.text import NormalizeForm
|
|
843
938
|
>>>
|
|
844
939
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
@@ -854,17 +949,15 @@ if platform.system().lower() != 'windows':
|
|
|
854
949
|
... with_offsets=False)
|
|
855
950
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op)
|
|
856
951
|
>>> # If with_offsets=True, then output three columns {["token", dtype=str],
|
|
857
|
-
>>> #
|
|
858
|
-
>>> #
|
|
952
|
+
>>> # ["offsets_start", dtype=uint32],
|
|
953
|
+
>>> # ["offsets_limit", dtype=uint32]}
|
|
859
954
|
>>> tokenizer_op = text.BertTokenizer(vocab=vocab, suffix_indicator='##', max_bytes_per_token=100,
|
|
860
955
|
... unknown_token='[UNK]', lower_case=False, keep_whitespace=False,
|
|
861
956
|
... normalization_form=NormalizeForm.NONE, preserve_unused_token=True,
|
|
862
957
|
... with_offsets=True)
|
|
863
958
|
>>> text_file_dataset_1 = text_file_dataset_1.map(operations=tokenizer_op, input_columns=["text"],
|
|
864
959
|
... output_columns=["token", "offsets_start",
|
|
865
|
-
... "offsets_limit"]
|
|
866
|
-
... column_order=["token", "offsets_start",
|
|
867
|
-
... "offsets_limit"])
|
|
960
|
+
... "offsets_limit"])
|
|
868
961
|
"""
|
|
869
962
|
|
|
870
963
|
@check_bert_tokenizer
|
|
@@ -894,7 +987,7 @@ if platform.system().lower() != 'windows':
|
|
|
894
987
|
class CaseFold(TextTensorOperation):
|
|
895
988
|
"""
|
|
896
989
|
Apply case fold operation on UTF-8 string tensor, which is aggressive that can convert more characters into
|
|
897
|
-
lower case than :
|
|
990
|
+
lower case than :code:`str.lower` . For supported normalization forms, please refer to
|
|
898
991
|
`ICU_Normalizer2 <https://unicode-org.github.io/icu-docs/apidoc/released/icu4c/classicu_1_1Normalizer2.html>`_ .
|
|
899
992
|
|
|
900
993
|
Note:
|
|
@@ -904,6 +997,7 @@ if platform.system().lower() != 'windows':
|
|
|
904
997
|
``CPU``
|
|
905
998
|
|
|
906
999
|
Examples:
|
|
1000
|
+
>>> import mindspore.dataset.text as text
|
|
907
1001
|
>>> case_op = text.CaseFold()
|
|
908
1002
|
>>> text_file_dataset = text_file_dataset.map(operations=case_op)
|
|
909
1003
|
"""
|
|
@@ -924,7 +1018,7 @@ if platform.system().lower() != 'windows':
|
|
|
924
1018
|
``CPU``
|
|
925
1019
|
|
|
926
1020
|
Examples:
|
|
927
|
-
>>> import mindspore.dataset.text
|
|
1021
|
+
>>> import mindspore.dataset.text as text
|
|
928
1022
|
>>>
|
|
929
1023
|
>>> replace_op = text.FilterWikipediaXML()
|
|
930
1024
|
>>> text_file_dataset = text_file_dataset.map(operations=replace_op)
|
|
@@ -944,7 +1038,7 @@ if platform.system().lower() != 'windows':
|
|
|
944
1038
|
Args:
|
|
945
1039
|
normalize_form (NormalizeForm, optional): Valid values can be [NormalizeForm.NONE, NormalizeForm.NFC,
|
|
946
1040
|
NormalizeForm.NFKC, NormalizeForm.NFD, NormalizeForm.NFKD] any of the four unicode
|
|
947
|
-
normalized forms
|
|
1041
|
+
normalized forms. Default: NormalizeForm.NFKC.
|
|
948
1042
|
See http://unicode.org/reports/tr15/ for details.
|
|
949
1043
|
|
|
950
1044
|
- NormalizeForm.NONE, do nothing for input string tensor.
|
|
@@ -960,6 +1054,7 @@ if platform.system().lower() != 'windows':
|
|
|
960
1054
|
``CPU``
|
|
961
1055
|
|
|
962
1056
|
Examples:
|
|
1057
|
+
>>> import mindspore.dataset.text as text
|
|
963
1058
|
>>> from mindspore.dataset.text import NormalizeForm
|
|
964
1059
|
>>> normalize_op = text.NormalizeUTF8(normalize_form=NormalizeForm.NFC)
|
|
965
1060
|
>>> text_file_dataset = text_file_dataset.map(operations=normalize_op)
|
|
@@ -990,7 +1085,7 @@ if platform.system().lower() != 'windows':
|
|
|
990
1085
|
pattern (str): the regex expression patterns.
|
|
991
1086
|
replace (str): the string to replace matched element.
|
|
992
1087
|
replace_all (bool, optional): If False, only replace first matched element;
|
|
993
|
-
if True, replace all matched elements
|
|
1088
|
+
if True, replace all matched elements. Default: True.
|
|
994
1089
|
|
|
995
1090
|
Raises:
|
|
996
1091
|
TypeError: If `pattern` is not of type string.
|
|
@@ -1001,6 +1096,7 @@ if platform.system().lower() != 'windows':
|
|
|
1001
1096
|
``CPU``
|
|
1002
1097
|
|
|
1003
1098
|
Examples:
|
|
1099
|
+
>>> import mindspore.dataset.text as text
|
|
1004
1100
|
>>> pattern = 'Canada'
|
|
1005
1101
|
>>> replace = 'China'
|
|
1006
1102
|
>>> replace_op = text.RegexReplace(pattern, replace)
|
|
@@ -1032,8 +1128,8 @@ if platform.system().lower() != 'windows':
|
|
|
1032
1128
|
The original string will be split by matched elements.
|
|
1033
1129
|
keep_delim_pattern (str, optional): The string matched by 'delim_pattern' can be kept as a token
|
|
1034
1130
|
if it can be matched by 'keep_delim_pattern'. The default value is an empty str
|
|
1035
|
-
which means that delimiters will not be kept as an output token
|
|
1036
|
-
with_offsets (bool, optional): Whether or not output offsets of tokens
|
|
1131
|
+
which means that delimiters will not be kept as an output token. Default: ''.
|
|
1132
|
+
with_offsets (bool, optional): Whether or not output offsets of tokens. Default: False.
|
|
1037
1133
|
|
|
1038
1134
|
Raises:
|
|
1039
1135
|
TypeError: If `delim_pattern` is not of type string.
|
|
@@ -1044,6 +1140,7 @@ if platform.system().lower() != 'windows':
|
|
|
1044
1140
|
``CPU``
|
|
1045
1141
|
|
|
1046
1142
|
Examples:
|
|
1143
|
+
>>> import mindspore.dataset.text as text
|
|
1047
1144
|
>>> # If with_offsets=False, default output is one column {["text", dtype=str]}
|
|
1048
1145
|
>>> delim_pattern = r"[ |,]"
|
|
1049
1146
|
>>> tokenizer_op = text.RegexTokenizer(delim_pattern, with_offsets=False)
|
|
@@ -1054,9 +1151,7 @@ if platform.system().lower() != 'windows':
|
|
|
1054
1151
|
>>> tokenizer_op = text.RegexTokenizer(delim_pattern, with_offsets=True)
|
|
1055
1152
|
>>> text_file_dataset_1 = text_file_dataset_1.map(operations=tokenizer_op, input_columns=["text"],
|
|
1056
1153
|
... output_columns=["token", "offsets_start",
|
|
1057
|
-
... "offsets_limit"]
|
|
1058
|
-
... column_order=["token", "offsets_start",
|
|
1059
|
-
... "offsets_limit"])
|
|
1154
|
+
... "offsets_limit"])
|
|
1060
1155
|
"""
|
|
1061
1156
|
|
|
1062
1157
|
@check_regex_tokenizer
|
|
@@ -1078,8 +1173,8 @@ if platform.system().lower() != 'windows':
|
|
|
1078
1173
|
UnicodeScriptTokenizer is not supported on Windows platform yet.
|
|
1079
1174
|
|
|
1080
1175
|
Args:
|
|
1081
|
-
keep_whitespace (bool, optional): Whether or not emit whitespace tokens
|
|
1082
|
-
with_offsets (bool, optional): Whether or not output offsets of tokens
|
|
1176
|
+
keep_whitespace (bool, optional): Whether or not emit whitespace tokens. Default: False.
|
|
1177
|
+
with_offsets (bool, optional): Whether or not output offsets of tokens. Default: False.
|
|
1083
1178
|
|
|
1084
1179
|
Raises:
|
|
1085
1180
|
TypeError: If `keep_whitespace` is not of type bool.
|
|
@@ -1089,6 +1184,7 @@ if platform.system().lower() != 'windows':
|
|
|
1089
1184
|
``CPU``
|
|
1090
1185
|
|
|
1091
1186
|
Examples:
|
|
1187
|
+
>>> import mindspore.dataset.text as text
|
|
1092
1188
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
1093
1189
|
>>> tokenizer_op = text.UnicodeScriptTokenizer(keep_whitespace=True, with_offsets=False)
|
|
1094
1190
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op)
|
|
@@ -1097,8 +1193,7 @@ if platform.system().lower() != 'windows':
|
|
|
1097
1193
|
>>> # ["offsets_limit", dtype=uint32]}
|
|
1098
1194
|
>>> tokenizer_op = text.UnicodeScriptTokenizer(keep_whitespace=True, with_offsets=True)
|
|
1099
1195
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op, input_columns=["text"],
|
|
1100
|
-
... output_columns=["token", "offsets_start", "offsets_limit"]
|
|
1101
|
-
... column_order=["token", "offsets_start", "offsets_limit"])
|
|
1196
|
+
... output_columns=["token", "offsets_start", "offsets_limit"])
|
|
1102
1197
|
|
|
1103
1198
|
"""
|
|
1104
1199
|
|
|
@@ -1122,7 +1217,7 @@ if platform.system().lower() != 'windows':
|
|
|
1122
1217
|
WhitespaceTokenizer is not supported on Windows platform yet.
|
|
1123
1218
|
|
|
1124
1219
|
Args:
|
|
1125
|
-
with_offsets (bool, optional): Whether or not output offsets of tokens
|
|
1220
|
+
with_offsets (bool, optional): Whether or not output offsets of tokens. Default: False.
|
|
1126
1221
|
|
|
1127
1222
|
Raises:
|
|
1128
1223
|
TypeError: If `with_offsets` is not of type bool.
|
|
@@ -1131,6 +1226,7 @@ if platform.system().lower() != 'windows':
|
|
|
1131
1226
|
``CPU``
|
|
1132
1227
|
|
|
1133
1228
|
Examples:
|
|
1229
|
+
>>> import mindspore.dataset.text as text
|
|
1134
1230
|
>>> # If with_offsets=False, default output one column {["text", dtype=str]}
|
|
1135
1231
|
>>> tokenizer_op = text.WhitespaceTokenizer(with_offsets=False)
|
|
1136
1232
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op)
|
|
@@ -1139,8 +1235,7 @@ if platform.system().lower() != 'windows':
|
|
|
1139
1235
|
>>> # ["offsets_limit", dtype=uint32]}
|
|
1140
1236
|
>>> tokenizer_op = text.WhitespaceTokenizer(with_offsets=True)
|
|
1141
1237
|
>>> text_file_dataset = text_file_dataset.map(operations=tokenizer_op, input_columns=["text"],
|
|
1142
|
-
... output_columns=["token", "offsets_start", "offsets_limit"]
|
|
1143
|
-
... column_order=["token", "offsets_start", "offsets_limit"])
|
|
1238
|
+
... output_columns=["token", "offsets_start", "offsets_limit"])
|
|
1144
1239
|
"""
|
|
1145
1240
|
|
|
1146
1241
|
@check_with_offsets
|