mindspore 2.4.10__cp39-cp39-manylinux1_x86_64.whl → 2.5.0__cp39-cp39-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (706)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-39-x86_64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-39-x86_64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-39-x86_64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +98 -21
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -3
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +31 -15
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +5 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +285 -191
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +1 -0
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  80. mindspore/experimental/llm_boost/register.py +1 -0
  81. mindspore/experimental/optim/adadelta.py +26 -22
  82. mindspore/experimental/optim/adam.py +3 -0
  83. mindspore/experimental/optim/lr_scheduler.py +33 -24
  84. mindspore/experimental/optim/radam.py +33 -30
  85. mindspore/hal/device.py +28 -0
  86. mindspore/hal/event.py +17 -0
  87. mindspore/hal/memory.py +94 -3
  88. mindspore/hal/stream.py +91 -6
  89. mindspore/include/api/context.h +0 -1
  90. mindspore/lib/libavcodec.so.59 +0 -0
  91. mindspore/lib/libavdevice.so.59 +0 -0
  92. mindspore/lib/libavfilter.so.8 +0 -0
  93. mindspore/lib/libavformat.so.59 +0 -0
  94. mindspore/lib/libavutil.so.57 +0 -0
  95. mindspore/lib/libdnnl.so.2 +0 -0
  96. mindspore/lib/libmindspore_backend.so +0 -0
  97. mindspore/lib/libmindspore_common.so +0 -0
  98. mindspore/lib/libmindspore_core.so +0 -0
  99. mindspore/lib/libmindspore_glog.so.0 +0 -0
  100. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  101. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  102. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  103. mindspore/lib/libmindspore_ops.so +0 -0
  104. mindspore/lib/libmpi_adapter.so +0 -0
  105. mindspore/lib/libmpi_collective.so +0 -0
  106. mindspore/lib/libnnacl.so +0 -0
  107. mindspore/lib/libopencv_core.so.4.5 +0 -0
  108. mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
  109. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  110. mindspore/lib/libps_cache.so +0 -0
  111. mindspore/lib/libswresample.so.4 +0 -0
  112. mindspore/lib/libswscale.so.6 +0 -0
  113. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  114. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  115. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  116. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  117. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/decoder_kv_cache.py +1 -1
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/prompt_kv_cache.py +1 -1
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/libcust_opmaster_rt2.0.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  121. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/x86_64/libcust_opsproto_rt2.0.so +0 -0
  122. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -1
  123. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/lib/libcust_opapi.so +0 -0
  124. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +224 -0
  125. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/all_finite.py +1 -1
  126. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +1 -1
  127. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +1 -1
  128. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  166. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  167. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/libcust_opmaster_rt2.0.so +0 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  172. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/x86_64/libcust_opsproto_rt2.0.so +0 -0
  173. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -1
  174. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  175. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  176. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  177. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  178. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  179. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  180. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  181. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  182. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +960 -958
  183. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  184. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  185. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  186. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  187. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  188. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  189. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  190. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  191. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  192. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  193. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  194. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  195. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  196. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  197. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  198. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  199. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  200. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  201. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  202. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  203. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  204. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  205. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  206. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  207. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  208. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  209. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  210. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  211. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  212. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  213. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  214. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  215. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  216. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  217. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  218. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  219. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  220. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  221. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  222. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  223. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  224. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  225. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  226. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  227. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  228. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  229. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  230. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  231. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  232. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  233. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  234. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  235. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  236. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  237. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  238. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  239. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  240. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  241. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  242. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  243. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  244. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  245. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  246. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  247. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  248. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  249. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  250. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so +0 -0
  251. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  252. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  253. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  254. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  255. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  256. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  257. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  258. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  259. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  260. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  261. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  262. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  263. mindspore/lib/plugin/gpu/libcuda_ops.so.10 +0 -0
  264. mindspore/lib/plugin/gpu/libcuda_ops.so.11 +0 -0
  265. mindspore/lib/plugin/gpu10.1/libnccl.so.2 +0 -0
  266. mindspore/lib/plugin/gpu10.1/libnvidia_collective.so +0 -0
  267. mindspore/lib/plugin/gpu11.1/libnccl.so.2 +0 -0
  268. mindspore/lib/plugin/gpu11.1/libnvidia_collective.so +0 -0
  269. mindspore/lib/plugin/gpu11.6/libnccl.so.2 +0 -0
  270. mindspore/lib/plugin/gpu11.6/libnvidia_collective.so +0 -0
  271. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  272. mindspore/lib/plugin/libmindspore_gpu.so.10.1 +0 -0
  273. mindspore/lib/plugin/libmindspore_gpu.so.11.1 +0 -0
  274. mindspore/lib/plugin/libmindspore_gpu.so.11.6 +0 -0
  275. mindspore/log.py +12 -0
  276. mindspore/mindrecord/__init__.py +1 -1
  277. mindspore/mindrecord/config.py +17 -316
  278. mindspore/mindrecord/filereader.py +1 -9
  279. mindspore/mindrecord/filewriter.py +5 -15
  280. mindspore/mindrecord/mindpage.py +1 -9
  281. mindspore/mint/__init__.py +824 -218
  282. mindspore/mint/distributed/__init__.py +66 -4
  283. mindspore/mint/distributed/distributed.py +2594 -44
  284. mindspore/mint/linalg/__init__.py +6 -0
  285. mindspore/mint/nn/__init__.py +473 -14
  286. mindspore/mint/nn/functional.py +486 -11
  287. mindspore/mint/nn/layer/__init__.py +17 -4
  288. mindspore/mint/nn/layer/_functions.py +330 -0
  289. mindspore/mint/nn/layer/activation.py +169 -1
  290. mindspore/mint/nn/layer/basic.py +123 -0
  291. mindspore/mint/nn/layer/conv.py +727 -0
  292. mindspore/mint/nn/layer/normalization.py +215 -19
  293. mindspore/mint/nn/layer/padding.py +797 -0
  294. mindspore/mint/nn/layer/pooling.py +170 -0
  295. mindspore/mint/optim/__init__.py +2 -1
  296. mindspore/mint/optim/adam.py +223 -0
  297. mindspore/mint/optim/adamw.py +26 -19
  298. mindspore/mint/special/__init__.py +2 -1
  299. mindspore/multiprocessing/__init__.py +5 -0
  300. mindspore/nn/cell.py +126 -19
  301. mindspore/nn/dynamic_lr.py +2 -1
  302. mindspore/nn/layer/activation.py +6 -6
  303. mindspore/nn/layer/basic.py +35 -25
  304. mindspore/nn/layer/channel_shuffle.py +3 -3
  305. mindspore/nn/layer/embedding.py +3 -3
  306. mindspore/nn/layer/normalization.py +8 -7
  307. mindspore/nn/layer/padding.py +4 -3
  308. mindspore/nn/layer/pooling.py +47 -13
  309. mindspore/nn/layer/rnn_cells.py +1 -1
  310. mindspore/nn/layer/rnns.py +2 -1
  311. mindspore/nn/layer/timedistributed.py +5 -5
  312. mindspore/nn/layer/transformer.py +48 -26
  313. mindspore/nn/learning_rate_schedule.py +5 -3
  314. mindspore/nn/loss/loss.py +31 -36
  315. mindspore/nn/optim/ada_grad.py +1 -0
  316. mindspore/nn/optim/adadelta.py +2 -2
  317. mindspore/nn/optim/adam.py +1 -1
  318. mindspore/nn/optim/lars.py +1 -4
  319. mindspore/nn/optim/optimizer.py +1 -1
  320. mindspore/nn/optim/rprop.py +2 -2
  321. mindspore/nn/optim/thor.py +2 -1
  322. mindspore/nn/utils/init.py +13 -11
  323. mindspore/nn/wrap/cell_wrapper.py +4 -6
  324. mindspore/nn/wrap/loss_scale.py +3 -4
  325. mindspore/numpy/array_creations.py +60 -62
  326. mindspore/numpy/array_ops.py +148 -143
  327. mindspore/numpy/logic_ops.py +41 -42
  328. mindspore/numpy/math_ops.py +361 -359
  329. mindspore/numpy/utils.py +16 -16
  330. mindspore/numpy/utils_const.py +4 -4
  331. mindspore/ops/__init__.py +2 -1
  332. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  333. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  334. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  335. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  336. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  337. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  338. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  339. mindspore/ops/_vmap/vmap_base.py +0 -2
  340. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  341. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  342. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  343. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  344. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  345. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  346. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  347. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  348. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  349. mindspore/ops/composite/base.py +1 -1
  350. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  351. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  352. mindspore/ops/function/__init__.py +12 -0
  353. mindspore/ops/function/array_func.py +561 -159
  354. mindspore/ops/function/clip_func.py +64 -0
  355. mindspore/ops/function/debug_func.py +28 -20
  356. mindspore/ops/function/image_func.py +1 -1
  357. mindspore/ops/function/linalg_func.py +5 -4
  358. mindspore/ops/function/math_func.py +1659 -290
  359. mindspore/ops/function/nn_func.py +988 -317
  360. mindspore/ops/function/parameter_func.py +3 -56
  361. mindspore/ops/function/random_func.py +243 -33
  362. mindspore/ops/function/sparse_unary_func.py +1 -1
  363. mindspore/ops/functional.py +18 -5
  364. mindspore/ops/functional_overload.py +897 -0
  365. mindspore/ops/operations/__init__.py +3 -2
  366. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  367. mindspore/ops/operations/_grad_ops.py +2 -34
  368. mindspore/ops/operations/_infer_ops.py +2 -1
  369. mindspore/ops/operations/_inner_ops.py +38 -8
  370. mindspore/ops/operations/array_ops.py +45 -303
  371. mindspore/ops/operations/comm_ops.py +19 -16
  372. mindspore/ops/operations/custom_ops.py +11 -55
  373. mindspore/ops/operations/debug_ops.py +42 -47
  374. mindspore/ops/operations/inner_ops.py +6 -4
  375. mindspore/ops/operations/linalg_ops.py +3 -2
  376. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  377. mindspore/ops/operations/math_ops.py +11 -216
  378. mindspore/ops/operations/nn_ops.py +146 -308
  379. mindspore/ops/primitive.py +23 -21
  380. mindspore/ops/tensor_method.py +1669 -0
  381. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  382. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  383. mindspore/ops_generate/arg_handler.py +0 -61
  384. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  385. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  386. mindspore/ops_generate/base_generator.py +11 -0
  387. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  388. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  389. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  390. mindspore/ops_generate/functions_cc_generator.py +233 -0
  391. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  392. mindspore/ops_generate/gen_constants.py +157 -3
  393. mindspore/ops_generate/gen_ops.py +245 -990
  394. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  395. mindspore/ops_generate/gen_utils.py +119 -33
  396. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  397. mindspore/ops_generate/op_api_proto.py +206 -0
  398. mindspore/ops_generate/op_def_py_generator.py +131 -0
  399. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  400. mindspore/ops_generate/op_proto.py +373 -108
  401. mindspore/ops_generate/op_template_parser.py +436 -0
  402. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  403. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  404. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  405. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  406. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  407. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  408. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  409. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  410. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  411. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  412. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  413. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  414. mindspore/ops_generate/pyboost_utils.py +92 -33
  415. mindspore/ops_generate/template.py +294 -44
  416. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  417. mindspore/parallel/__init__.py +3 -3
  418. mindspore/parallel/_auto_parallel_context.py +24 -33
  419. mindspore/parallel/_parallel_serialization.py +13 -2
  420. mindspore/parallel/_utils.py +4 -1
  421. mindspore/parallel/algo_parameter_config.py +1 -1
  422. mindspore/parallel/checkpoint_transform.py +44 -0
  423. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  424. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  425. mindspore/parallel/cluster/run.py +20 -3
  426. mindspore/parallel/parameter_broadcast.py +1 -1
  427. mindspore/parallel/shard.py +3 -0
  428. mindspore/parallel/transform_safetensors.py +119 -253
  429. mindspore/profiler/__init__.py +17 -4
  430. mindspore/profiler/analysis/__init__.py +0 -0
  431. mindspore/profiler/analysis/parser/__init__.py +0 -0
  432. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  433. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  434. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  435. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  436. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  437. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  438. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  439. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  440. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  441. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  442. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  443. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  444. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  445. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  446. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  447. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  448. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  449. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  450. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  451. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  452. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  453. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  454. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  455. mindspore/profiler/analysis/task_manager.py +131 -0
  456. mindspore/profiler/analysis/time_converter.py +84 -0
  457. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  458. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  459. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  460. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  461. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  462. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  463. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  464. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  465. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  466. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  467. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  468. mindspore/profiler/analysis/work_flow.py +73 -0
  469. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  470. mindspore/profiler/common/command_executor.py +90 -0
  471. mindspore/profiler/common/constant.py +174 -3
  472. mindspore/profiler/common/file_manager.py +208 -0
  473. mindspore/profiler/common/log.py +130 -0
  474. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  475. mindspore/profiler/common/path_manager.py +371 -0
  476. mindspore/profiler/common/process_bar.py +168 -0
  477. mindspore/profiler/common/process_pool.py +9 -3
  478. mindspore/profiler/common/profiler_context.py +476 -0
  479. mindspore/profiler/common/profiler_info.py +304 -0
  480. mindspore/profiler/common/profiler_output_path.py +284 -0
  481. mindspore/profiler/common/profiler_parameters.py +210 -0
  482. mindspore/profiler/common/profiler_path_manager.py +120 -0
  483. mindspore/profiler/common/record_function.py +76 -0
  484. mindspore/profiler/common/tlv_decoder.py +76 -0
  485. mindspore/profiler/common/util.py +75 -2
  486. mindspore/profiler/dynamic_profiler.py +270 -37
  487. mindspore/profiler/envprofiler.py +138 -0
  488. mindspore/profiler/mstx.py +199 -0
  489. mindspore/profiler/platform/__init__.py +21 -0
  490. mindspore/profiler/platform/base_profiler.py +40 -0
  491. mindspore/profiler/platform/cpu_profiler.py +124 -0
  492. mindspore/profiler/platform/gpu_profiler.py +74 -0
  493. mindspore/profiler/platform/npu_profiler.py +309 -0
  494. mindspore/profiler/profiler.py +580 -93
  495. mindspore/profiler/profiler_action_controller.py +187 -0
  496. mindspore/profiler/profiler_interface.py +114 -0
  497. mindspore/profiler/schedule.py +208 -0
  498. mindspore/rewrite/api/symbol_tree.py +1 -2
  499. mindspore/run_check/_check_version.py +2 -6
  500. mindspore/runtime/__init__.py +37 -0
  501. mindspore/runtime/device.py +27 -0
  502. mindspore/runtime/event.py +209 -0
  503. mindspore/runtime/executor.py +148 -0
  504. mindspore/runtime/memory.py +392 -0
  505. mindspore/runtime/stream.py +460 -0
  506. mindspore/runtime/thread_bind_core.py +401 -0
  507. mindspore/train/__init__.py +2 -2
  508. mindspore/train/_utils.py +53 -18
  509. mindspore/train/amp.py +8 -4
  510. mindspore/train/callback/_checkpoint.py +32 -18
  511. mindspore/train/callback/_early_stop.py +1 -1
  512. mindspore/train/callback/_flops_collector.py +105 -69
  513. mindspore/train/callback/_history.py +1 -1
  514. mindspore/train/callback/_summary_collector.py +44 -6
  515. mindspore/train/callback/_tft_register.py +31 -10
  516. mindspore/train/dataset_helper.py +11 -11
  517. mindspore/train/metrics/precision.py +4 -5
  518. mindspore/train/mind_ir_pb2.py +167 -46
  519. mindspore/train/model.py +13 -15
  520. mindspore/train/serialization.py +462 -76
  521. mindspore/train/summary/summary_record.py +1 -2
  522. mindspore/train/train_thor/model_thor.py +1 -1
  523. mindspore/utils/__init__.py +4 -2
  524. mindspore/utils/bin/dataset-cache +0 -0
  525. mindspore/utils/bin/dataset-cache-server +0 -0
  526. mindspore/utils/dryrun.py +138 -0
  527. mindspore/utils/runtime_execution_order_check.py +550 -0
  528. mindspore/version.py +1 -1
  529. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  530. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +533 -467
  531. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  532. mindspore/_data_dump.cpython-39-x86_64-linux-gnu.so +0 -0
  533. mindspore/bin/cache_admin +0 -0
  534. mindspore/bin/cache_server +0 -0
  535. mindspore/common/_tensor_overload.py +0 -139
  536. mindspore/lib/libmindspore_np_dtype.so +0 -0
  537. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  538. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  539. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  540. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  541. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  542. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  543. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  544. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  545. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  546. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  547. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  548. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  549. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  550. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  551. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  552. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  553. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  554. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -97
  555. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  556. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  557. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  558. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  559. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  560. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  561. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  562. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  563. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  564. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  565. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  566. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  567. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  568. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  569. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  570. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  571. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  572. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  573. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  574. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  575. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  576. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  577. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  578. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  579. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  580. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  581. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  582. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  583. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  584. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  585. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  586. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  587. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  588. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  589. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  590. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  591. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  592. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  593. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  594. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  595. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  596. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  597. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  598. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  599. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  600. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  601. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  602. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  603. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  604. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  605. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  606. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  607. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  608. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  609. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  610. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  611. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  612. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  613. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  614. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  615. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  616. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  617. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  618. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  619. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  620. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  621. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  622. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  623. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  624. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  625. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  626. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  627. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  628. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  629. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  630. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  631. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  632. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  633. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  634. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  635. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  636. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  637. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  638. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  639. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  640. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  641. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  642. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  643. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  644. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  645. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  646. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  647. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  648. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  649. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  650. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  651. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  652. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  653. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  654. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  655. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  656. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  657. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  658. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  659. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  660. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  661. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  662. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  663. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  664. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  665. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  666. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  667. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  668. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  669. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  670. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  671. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_impl.so +0 -0
  672. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  673. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  674. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  685. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  686. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  687. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  688. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  689. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  690. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  691. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  692. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  693. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  694. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  695. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  696. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  697. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  698. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  699. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  700. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  701. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  702. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  703. mindspore/profiler/envprofiling.py +0 -254
  704. mindspore/profiler/profiling.py +0 -1926
  705. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  706. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
mindspore/numpy/utils.py CHANGED
@@ -19,8 +19,8 @@ import types
19
19
 
20
20
  from mindspore.common import Tensor
21
21
  from mindspore._c_expression import Tensor as Tensor_
22
- from mindspore.ops import functional as F
23
22
  from mindspore.common import dtype as mstype
23
+ from mindspore import ops
24
24
 
25
25
  from mindspore.numpy.utils_const import _tile_size, _add_unit_axes, _raise_type_error, _type_convert, \
26
26
  _tuple_setitem, _callable_const, _check_is_float, _get_device
@@ -65,7 +65,7 @@ def _check_input_for_asarray(array_like):
65
65
 
66
66
  def _is_scalar(shape):
67
67
  """check whether input shape is a scalar"""
68
- return F.shape_mul(shape) == 1
68
+ return ops.shape_mul(shape) == 1
69
69
 
70
70
 
71
71
  def _convert_list_tensor_to_tuple_tensor(list_of_tensor):
@@ -80,27 +80,27 @@ def _convert_list_tensor_to_tuple_tensor(list_of_tensor):
80
80
 
81
81
  def _expand(x, ndim, axis=0):
82
82
  """Expand x to ndim from axis, which can be 0 or -1."""
83
- shape = _add_unit_axes(F.shape(x), ndim, axis == -1)
84
- return F.reshape(x, shape)
83
+ shape = _add_unit_axes(ops.shape(x), ndim, axis == -1)
84
+ return ops.reshape(x, shape)
85
85
 
86
86
 
87
87
  def _broadcast_to(x, shape_cur, shape_to, ndim_to):
88
88
  """Broadcasts x from shape_cur to shape_to."""
89
89
  size = _tile_size(shape_cur, shape_to, ndim_to)
90
- return F.tile(x, size)
90
+ return ops.tile(x, size)
91
91
 
92
92
 
93
93
  def _broadcast_to_shape(x, shape):
94
94
  """Broadcasts x from current shape to shape"""
95
95
  ndim_to = len(shape)
96
96
  x = _expand(x, ndim_to)
97
- return _broadcast_to(x, F.shape(x), shape, ndim_to)
97
+ return _broadcast_to(x, ops.shape(x), shape, ndim_to)
98
98
 
99
99
 
100
100
  def _get_size(x, axis=None):
101
101
  """Get the number of elements along the given axis of tensor x."""
102
- if axis is None or F.tuple_len(axis) == 0:
103
- axis = F.make_range(x.ndim)
102
+ if axis is None or ops.tuple_len(axis) == 0:
103
+ axis = ops.make_range(x.ndim)
104
104
  nums = 1
105
105
  for ax in axis:
106
106
  nums *= x.shape[ax]
@@ -110,7 +110,7 @@ def _get_size(x, axis=None):
110
110
  def _check_input_tensor(*tensors):
111
111
  for tensor in tensors:
112
112
  if not isinstance(tensor, Tensor):
113
- _raise_type_error('expect Tensor, but got ', F.typeof(tensor))
113
+ _raise_type_error('expect Tensor, but got ', ops.typeof(tensor))
114
114
  return True
115
115
 
116
116
 
@@ -141,7 +141,7 @@ def _to_tensor(*args):
141
141
 
142
142
  def _get_dtype_from_scalar(*input_numbers):
143
143
  """
144
- Get the final dtype from series of input numbers, compared with F.typeof, we
144
+ Get the final dtype from series of input numbers, compared with ops.typeof, we
145
145
  return int32/float32 for python int/float instead.
146
146
  """
147
147
  bool_flag = True
@@ -184,7 +184,7 @@ def _slice_along_axis(f, axis, slice_start, slice_end):
184
184
  slice_size = slice_end - slice_start
185
185
  index_start = _tuple_setitem(index_start, axis, slice_start)
186
186
  index_end = _tuple_setitem(index_end, axis, slice_size)
187
- return F.tensor_slice(f, index_start, index_end)
187
+ return ops.tensor_slice(f, index_start, index_end)
188
188
 
189
189
 
190
190
  def _to_tensor_origin_dtype(*args):
@@ -203,12 +203,12 @@ def _to_tensor_origin_dtype(*args):
203
203
 
204
204
  def _callable(tensor, obj):
205
205
  """Returns True if `obj` is a function."""
206
- if F.isconstant(tensor):
206
+ if ops.isconstant(tensor):
207
207
  return isinstance(obj, types.FunctionType)
208
- return _callable_const(F.typeof(obj))
208
+ return _callable_const(ops.typeof(obj))
209
209
 
210
210
 
211
211
  def _isnan(x):
212
- if _get_device() == 'Ascend' and not _check_is_float(F.dtype(x)):
213
- return F.fill(mstype.bool_, F.shape(x), False)
214
- return F.isnan(x)
212
+ if _get_device() == 'Ascend' and not _check_is_float(ops.dtype(x)):
213
+ return ops.fill(mstype.bool_, ops.shape(x), False)
214
+ return ops.isnan(x)
@@ -20,7 +20,6 @@ from itertools import accumulate
20
20
  import operator
21
21
 
22
22
  import mindspore.context as context
23
- from mindspore.ops import functional as F
24
23
  from mindspore.ops.primitive import constexpr
25
24
  from mindspore.ops.primitive import _primexpr
26
25
  from mindspore.common import dtype as mstype
@@ -28,6 +27,7 @@ from mindspore.common import Tensor
28
27
  from mindspore._c_expression import Tensor as Tensor_
29
28
  from mindspore._c_expression import typing
30
29
  from mindspore import _checkparam as validator
30
+ from mindspore import ops
31
31
 
32
32
  from mindspore.numpy.dtypes import promotion_rule, dtype_tuple, all_types, dtype_map, rule_for_trigonometric
33
33
 
@@ -80,13 +80,13 @@ def _check_dtype(dtype):
80
80
  @_primexpr
81
81
  def _is_shape_empty(shp):
82
82
  """Check whether shape contains zero"""
83
- if F.is_sequence_shape_unknown(shp):
83
+ if ops.is_sequence_shape_unknown(shp):
84
84
  return False
85
85
  if isinstance(shp, int):
86
86
  return shp == 0
87
87
  if isinstance(shp, (tuple, list)):
88
88
  return 0 in shp
89
- return F.shape_mul(shp) == 0
89
+ return ops.shape_mul(shp) == 0
90
90
 
91
91
 
92
92
  @_primexpr
@@ -189,7 +189,7 @@ def _check_axis_valid(axes, ndim):
189
189
  raise ValueError('duplicate value in "axis"')
190
190
 
191
191
  if axes is None:
192
- axes = F.make_range(ndim)
192
+ axes = ops.make_range(ndim)
193
193
  return axes
194
194
  if isinstance(axes, (tuple, list)):
195
195
  axes = tuple(map(lambda x: _check_axis_in_range(x, ndim), axes))
mindspore/ops/__init__.py CHANGED
@@ -33,6 +33,7 @@ from mindspore.ops import composite, operations, functional, function
33
33
  from mindspore.ops import signature
34
34
  from mindspore.ops.auto_generate import cpp_create_prim_instance_helper, gen_arg_dtype_cast, gen_arg_handler, \
35
35
  gen_extend_func, gen_ops_def, gen_ops_prim, pyboost_inner_prim
36
+ from mindspore.ops.functional_overload import all_gather_matmul, matmul_reduce_scatter
36
37
  from mindspore.ops.composite import *
37
38
  from mindspore.ops.operations import *
38
39
  from mindspore.ops.function import *
@@ -47,7 +48,7 @@ __all__ = ["get_vm_impl_fn", "vm_impl_registry",
47
48
  "CpuRegOp", "CustomRegOp", "DataType",
48
49
  "constexpr", "reshard",
49
50
  "cpp_create_prim_instance_helper", "gen_arg_dtype_cast", "gen_arg_handler", "gen_extend_func", "gen_ops_def",
50
- "gen_ops_prim", "pyboost_inner_prim"]
51
+ "gen_ops_prim", "pyboost_inner_prim", "all_gather_matmul", "matmul_reduce_scatter"]
51
52
  __all__.extend(__primitive__)
52
53
  __all__.extend(composite.__all__)
53
54
  __all__.extend(operations.__all__)
@@ -37,9 +37,24 @@ from mindspore.ops._grad_experimental.grad_base import bprop_getters
37
37
  from mindspore.ops.operations import _grad_ops as G
38
38
  import mindspore as ms
39
39
 
40
- _device_local_norm = None
41
- if ms.get_auto_parallel_context("dump_device_local_norm"):
42
- _device_local_norm = Parameter(Tensor(0.0, mstype.float32), name="_device_local_norm", requires_grad=False)
40
+ _squared_device_local_norm = None
41
+
42
+
43
+ def get_squared_device_local_norm_param():
44
+ """
45
+ Get Parameter `_squared_device_local_norm`.
46
+ `_squared_device_local_norm` will accumulate squared local norm of each grad in bprop under GRAPH_MODE.
47
+ Users need to reset it to zero after each step of network propagation.
48
+ """
49
+ global _squared_device_local_norm
50
+ if _squared_device_local_norm is None:
51
+ if ms.get_auto_parallel_context("dump_device_local_norm"):
52
+ _squared_device_local_norm = Parameter(Tensor(0.0, mstype.float32), name="_squared_device_local_norm",
53
+ requires_grad=False)
54
+ else:
55
+ raise ValueError("The parallel config 'dump_device_local_norm' is False.")
56
+ return _squared_device_local_norm
57
+
43
58
 
44
59
  @bprop_getters.register(AllReduce)
45
60
  def get_bprop_all_reduce(self):
@@ -195,7 +210,7 @@ def get_bprop_virtual_assign_kv_cache(self):
195
210
  dout_update = dout + y
196
211
  kv_equal = F.equal(seq_chunk, 0)
197
212
  update_kv = F.select(kv_equal, F.broadcast_to(cast(out_tensor, dtype(y)), F.shape(y)), dout_update)
198
- return F.depend((dout_update, cast(out_tensor, dtype(y)),
213
+ return F.depend((cast(dout_update, dtype(dout)), cast(out_tensor, dtype(y)),
199
214
  cast(out_tensor, dtype(seq_chunk))), assign(y, update_kv))
200
215
 
201
216
  return bprop
@@ -221,6 +236,7 @@ def get_bprop_mirror_micro_step_operator(self):
221
236
  allgather for sparse feature.
222
237
  """
223
238
  group = self.group
239
+ global_rank = get_rank()
224
240
  dev_num = self.dev_num
225
241
  mean_flag = self.mean_flag
226
242
  param_name = " "
@@ -247,18 +263,29 @@ def get_bprop_mirror_micro_step_operator(self):
247
263
  out_tensor = Tensor(1.0, mstype.float16)
248
264
  opt_shard = _get_enable_parallel_optimizer()
249
265
  ln_print = P.Print()
266
+ tensor_dump = P.TensorDump()
250
267
  reduce_sum = P.ReduceSum(keep_dims=False)
251
268
  square = P.Square()
269
+ sqrt = P.Sqrt()
252
270
  dump_local_norm = ms.get_auto_parallel_context("dump_local_norm")
271
+ dump_local_norm_path = ms.get_auto_parallel_context("dump_local_norm_path")
253
272
  dump_device_local_norm = ms.get_auto_parallel_context("dump_device_local_norm")
273
+ if dump_device_local_norm:
274
+ # init _squared_device_local_norm
275
+ squared_device_local_norm = get_squared_device_local_norm_param()
254
276
 
255
277
  def bprop(x, z, out, dout):
256
278
  if dump_local_norm or dump_device_local_norm:
257
- _norm = reduce_sum(square((z)))
279
+ squared_norm = reduce_sum(square((z)))
258
280
  if dump_local_norm:
259
- z = F.depend(z, ln_print("dump local norm: ", param_name, _norm))
281
+ if dump_local_norm_path:
282
+ z = F.depend(z, tensor_dump(dump_local_norm_path + "/rank_" + str(global_rank) +
283
+ "/local_norm__" + param_name, sqrt(squared_norm)))
284
+ else:
285
+ z = F.depend(z, ln_print("dump local norm: ", param_name, sqrt(squared_norm)))
260
286
  if dump_device_local_norm:
261
- z = F.depend(z, F.assign_add(_device_local_norm, cast(_norm, _device_local_norm.dtype)))
287
+ z = F.depend(z, F.assign_add(squared_device_local_norm,
288
+ cast(squared_norm, squared_device_local_norm.dtype)))
262
289
  real_grad = z
263
290
  assign_out = dout
264
291
  if issubclass_(F.typeof(dout), mstype.tensor_type):
@@ -301,8 +328,38 @@ def get_bprop_all_gather(self):
301
328
  if self.rank_size == 0:
302
329
  raise ValueError(f"The 'rank_size' can not be zero, but got {self.rank_size}.")
303
330
  scale = 1.0 / self.rank_size
331
+ param_name = ""
332
+ if 'mirror_user_id' in self.get_attr_dict():
333
+ param_name = self.get_attr_dict()['mirror_user_id']
334
+ # monitor local norm
335
+ dump_local_norm = ms.get_auto_parallel_context("dump_local_norm")
336
+ dump_local_norm_path = ms.get_auto_parallel_context("dump_local_norm_path")
337
+ dump_device_local_norm = ms.get_auto_parallel_context("dump_device_local_norm")
338
+ if param_name and (dump_local_norm or dump_device_local_norm):
339
+ global_rank = get_rank()
340
+ cast = P.Cast()
341
+ ln_print = P.Print()
342
+ tensor_dump = P.TensorDump()
343
+ reduce_sum = P.ReduceSum(keep_dims=False)
344
+ square = P.Square()
345
+ sqrt = P.Sqrt()
346
+ if dump_device_local_norm:
347
+ # init _squared_device_local_norm
348
+ squared_device_local_norm = get_squared_device_local_norm_param()
304
349
 
305
350
  def bprop(x, out, dout):
351
+ if param_name and (dump_local_norm or dump_device_local_norm):
352
+ squared_norm = reduce_sum(square((dout)))
353
+ if dump_local_norm:
354
+ if dump_local_norm_path:
355
+ dout = F.depend(dout, tensor_dump(dump_local_norm_path + "/rank_" + str(global_rank) +
356
+ "/local_norm__" + param_name, sqrt(squared_norm)))
357
+ else:
358
+ dout = F.depend(dout, ln_print("dump local norm: ", param_name, sqrt(squared_norm)))
359
+ if dump_device_local_norm:
360
+ dout = F.depend(dout, F.assign_add(squared_device_local_norm,
361
+ cast(squared_norm, squared_device_local_norm.dtype)))
362
+
306
363
  dx = reduce_scatter(dout)
307
364
  if mean_flag:
308
365
  dx = F.tensor_mul(dx, scale)
@@ -373,15 +430,22 @@ def get_bprop_micro_step_all_gather(self):
373
430
  if self.instance_name:
374
431
  instance_name = "grad_" + self.instance_name
375
432
  reduce_scatter.set_prim_instance_name(instance_name)
433
+ global_rank = get_rank()
376
434
  cast = P.Cast()
377
435
  dtype = P.DType()
378
436
  out_tensor = Tensor(1.0, mstype.float16)
379
437
  with_mirror_operator = self.get_attr_dict()["with_mirror_operator"]
380
438
  ln_print = P.Print()
439
+ tensor_dump = P.TensorDump()
381
440
  reduce_sum = P.ReduceSum(keep_dims=False)
382
441
  square = P.Square()
442
+ sqrt = P.Sqrt()
383
443
  dump_local_norm = ms.get_auto_parallel_context("dump_local_norm")
444
+ dump_local_norm_path = ms.get_auto_parallel_context("dump_local_norm_path")
384
445
  dump_device_local_norm = ms.get_auto_parallel_context("dump_device_local_norm")
446
+ if dump_device_local_norm:
447
+ # init _squared_device_local_norm
448
+ squared_device_local_norm = get_squared_device_local_norm_param()
385
449
 
386
450
  def bprop(x, z, out, dout):
387
451
  if with_mirror_operator:
@@ -393,11 +457,16 @@ def get_bprop_micro_step_all_gather(self):
393
457
  return (real_grad, cast(out_tensor, dtype(z)))
394
458
  z = F.depend(z, dout)
395
459
  if dump_local_norm or dump_device_local_norm:
396
- _norm = reduce_sum(square((z)))
460
+ squared_norm = reduce_sum(square((z)))
397
461
  if dump_local_norm:
398
- z = F.depend(z, ln_print("dump local norm: ", param_name, _norm))
462
+ if dump_local_norm_path:
463
+ z = F.depend(z, tensor_dump(dump_local_norm_path + "/rank_" + str(global_rank) +
464
+ "/local_norm__" + param_name, sqrt(squared_norm)))
465
+ else:
466
+ z = F.depend(z, ln_print("dump local norm: ", param_name, sqrt(squared_norm)))
399
467
  if dump_device_local_norm:
400
- z = F.depend(z, F.assign_add(_device_local_norm, cast(_norm, _device_local_norm.dtype)))
468
+ z = F.depend(z, F.assign_add(squared_device_local_norm,
469
+ cast(squared_norm, squared_device_local_norm.dtype)))
401
470
  if not do_mirror:
402
471
  return (z, cast(out_tensor, dtype(z)))
403
472
  real_grad = reduce_scatter(z)
@@ -599,16 +668,23 @@ def get_bprop_mirror_operator(self):
599
668
 
600
669
  dev_num_r = 1.0
601
670
  dump_local_norm = ms.get_auto_parallel_context("dump_local_norm")
671
+ dump_local_norm_path = ms.get_auto_parallel_context("dump_local_norm_path")
602
672
  dump_device_local_norm = ms.get_auto_parallel_context("dump_device_local_norm")
673
+ if dump_device_local_norm:
674
+ # init _squared_device_local_norm
675
+ squared_device_local_norm = get_squared_device_local_norm_param()
603
676
  if dev_num > 1:
677
+ global_rank = get_rank()
604
678
  dev_num_r = 1.0 / dev_num
605
679
  all_reduce = AllReduce(group=group)
606
680
  all_gather = AllGather(group=group)
607
681
  mul = P.Mul()
608
682
  cast = P.Cast()
609
683
  ln_print = P.Print()
684
+ tensor_dump = P.TensorDump()
610
685
  reduce_sum = P.ReduceSum(keep_dims=False)
611
686
  square = P.Square()
687
+ sqrt = P.Sqrt()
612
688
 
613
689
  fusion = self.get_attr_dict()["fusion"]
614
690
  all_reduce.add_prim_attr("fusion", fusion)
@@ -623,11 +699,16 @@ def get_bprop_mirror_operator(self):
623
699
 
624
700
  def bprop(x, out, dout):
625
701
  if dump_local_norm or dump_device_local_norm:
626
- _norm = reduce_sum(square((dout)))
702
+ squared_norm = reduce_sum(square((dout)))
627
703
  if dump_local_norm:
628
- dout = F.depend(dout, ln_print("dump local norm: ", param_name, _norm))
704
+ if dump_local_norm_path:
705
+ dout = F.depend(dout, tensor_dump(dump_local_norm_path + "/rank_" + str(global_rank) +
706
+ "/local_norm__" + param_name, sqrt(squared_norm)))
707
+ else:
708
+ dout = F.depend(dout, ln_print("dump local norm: ", param_name, sqrt(squared_norm)))
629
709
  if dump_device_local_norm:
630
- dout = F.depend(dout, F.assign_add(_device_local_norm, cast(_norm, _device_local_norm.dtype)))
710
+ dout = F.depend(dout, F.assign_add(squared_device_local_norm,
711
+ cast(squared_norm, squared_device_local_norm.dtype)))
631
712
 
632
713
  if dev_num == 1:
633
714
  return (dout,)
@@ -15,6 +15,7 @@
15
15
 
16
16
  """Generate bprop for debug ops"""
17
17
 
18
+ import mindspore.ops.functional as F
18
19
  from mindspore.ops import operations as P
19
20
  from mindspore.ops._grad_experimental.grad_base import bprop_getters
20
21
 
@@ -27,5 +28,9 @@ def get_bprop_insert_gradient_of(self):
27
28
  f = self.f
28
29
 
29
30
  def bprop(x, out, dout):
30
- return (f(dout),)
31
+ fdout = f(dout)
32
+ if fdout is None:
33
+ dout = F.depend(dout, fdout)
34
+ return (dout,)
35
+ return (fdout,)
31
36
  return bprop
@@ -23,6 +23,15 @@ from mindspore.ops.composite.multitype_ops.zeros_like_impl import zeros_like
23
23
  from mindspore.ops._grad_experimental.grad_base import bprop_getters
24
24
 
25
25
 
26
+ @bprop_getters.register("raise")
27
+ def get_bprop_raise(self):
28
+ """Grad definition for `raise` operation."""
29
+ def bprop(x, y, z, out, dout):
30
+ return x, y, z
31
+
32
+ return bprop
33
+
34
+
26
35
  @bprop_getters.register(inner.ParallelResizeBilinear)
27
36
  def get_bprop_parallel_resize_bilinear(self):
28
37
  """Grad definition for `ParallelResizeBilinear` operation."""
@@ -657,7 +657,8 @@ def get_bprop_fft_with_size(self):
657
657
  dx = rfft_fn(dout)
658
658
  dx = reverse_branch(dx, onesided, dout_shape, offset_shape,
659
659
  output_type, dout, norm, inverse, signal_ndim, offset_size)
660
- return (dx,)
660
+ return dx, zeros_like(signal_ndim), zeros_like(inverse), zeros_like(real), zeros_like(norm_enum), \
661
+ zeros_like(onesided), zeros_like(signal_sizes)
661
662
 
662
663
  return bprop
663
664
 
@@ -71,6 +71,7 @@ from .pyexecute import _pyexecute_cpu
71
71
  from .pyfunc import _pyfunc_cpu
72
72
  from .buffer_append import _buffer_append_cpu
73
73
  from .buffer_get import _buffer_get_cpu
74
+ from .raise_op import _raise_cpu
74
75
  from .buffer_sample import _buffer_sample_cpu
75
76
  from .priority_replay_buffer import _prb_push_op_cpu
76
77
  from .priority_replay_buffer import _prb_sample_op_cpu
@@ -0,0 +1,28 @@
1
+ # Copyright 2024 Huawei Technologies Co., Ltd
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+ # ============================================================================
15
+ """raise op"""
16
+ from mindspore.ops.op_info_register import op_info_register, CpuRegOp, DataType
17
+
18
+ raise_op_info = CpuRegOp("raise") \
19
+ .input(0, "x", "dynamic") \
20
+ .output(0, "y", "dynamic") \
21
+ .dtype_format(DataType.I32_Default, DataType.I32_Default) \
22
+ .get_op_info()
23
+
24
+
25
+ @op_info_register(raise_op_info)
26
+ def _raise_cpu():
27
+ """_raise_cpu cpu register"""
28
+ return
@@ -15,6 +15,7 @@
15
15
 
16
16
  """array_ops vmap impl."""
17
17
  from __future__ import absolute_import
18
+ from enum import Enum
18
19
 
19
20
  import mindspore
20
21
  import mindspore.numpy as mnp
@@ -1488,16 +1489,19 @@ def get_meshgrid_vmap_rule(prim, axis_size):
1488
1489
  """VmapRule for `P.Meshgrid` operation."""
1489
1490
  if isinstance(prim, str):
1490
1491
  prim = Primitive(prim)
1491
- indexing = prim.indexing
1492
1492
 
1493
- def vmap_rule(*inputs_bdim):
1494
- is_all_none, result = vmap_general_preprocess(prim, *inputs_bdim)
1493
+ class Indexing(Enum):
1494
+ ij = 0
1495
+ xy = 1
1496
+
1497
+ def vmap_rule(inputs_bdim, indexing_bdim):
1498
+ is_all_none, result = vmap_general_preprocess(prim, inputs_bdim, indexing_bdim)
1495
1499
  if is_all_none:
1496
1500
  return result
1497
1501
 
1498
1502
  if not isinstance(inputs_bdim, (tuple)):
1499
1503
  _raise_value_error("The inputs of P.Meshgrid is not tuple.")
1500
- args = inputs_bdim[0]
1504
+ args = inputs_bdim
1501
1505
  if len(args) <= 1:
1502
1506
  _raise_value_error(
1503
1507
  "The input number of P.Meshgrid must be greater than 1.")
@@ -1518,7 +1522,9 @@ def get_meshgrid_vmap_rule(prim, axis_size):
1518
1522
  output_shape.insert(0, axis_size)
1519
1523
  ones_shape.insert(0, axis_size)
1520
1524
 
1521
- if indexing == "xy":
1525
+ indexing, _ = indexing_bdim
1526
+
1527
+ if indexing == Indexing.xy.value:
1522
1528
  output_shape[1], output_shape[2] = output_shape[2], output_shape[1]
1523
1529
  shape = tuple(output_shape)
1524
1530
 
@@ -1531,7 +1537,7 @@ def get_meshgrid_vmap_rule(prim, axis_size):
1531
1537
  for each_arg in args:
1532
1538
  x, bdim = each_arg
1533
1539
  x = _bdim_at_front(x, bdim, axis_size)
1534
- shape_index = (1 - index) if (index <= 1 and indexing == "xy") else index
1540
+ shape_index = (1 - index) if (index <= 1 and indexing == Indexing.xy.value) else index
1535
1541
  ones_shape[shape_index + 1] = output_shape[shape_index + 1]
1536
1542
  x = P.Reshape()(x, tuple(ones_shape))
1537
1543
  output = P.Mul()(x, ones_tensor)
@@ -1889,10 +1895,6 @@ def get_slice_vmap_rule(prim, axis_size):
1889
1895
  @vmap_rules_getters.register(P.Squeeze)
1890
1896
  def get_squeeze_vmap_rule(prim, axis_size):
1891
1897
  """VmapRule for `Squeeze`."""
1892
- if hasattr(prim, 'axis'):
1893
- prim_axis = prim.axis
1894
- else:
1895
- prim_axis = None
1896
1898
 
1897
1899
  @_primexpr
1898
1900
  def move_axis(axes):
@@ -1911,27 +1913,26 @@ def get_squeeze_vmap_rule(prim, axis_size):
1911
1913
  new_axis += (i,)
1912
1914
  return new_axis
1913
1915
 
1914
- def vmap_rule(x_bdim):
1915
- is_all_none, result = vmap_general_preprocess(prim, x_bdim)
1916
+ def vmap_rule(x_bdim, axis_bdim):
1917
+ is_all_none, result = vmap_general_preprocess(prim, x_bdim, axis_bdim)
1916
1918
  if is_all_none:
1917
1919
  return result
1918
1920
 
1919
1921
  x, x_dim = x_bdim
1922
+ axis, _ = axis_bdim
1920
1923
  x = _bdim_at_front(x, x_dim, axis_size)
1921
1924
 
1922
- if prim_axis is None:
1925
+ if axis is None:
1923
1926
  if axis_size == 1:
1924
1927
  new_axis = generate_all_axis_except_first(F.rank(x))
1925
- batch_squeeze = P.Squeeze(axis=new_axis)
1926
- out = batch_squeeze(x)
1928
+ out = prim(x, new_axis)
1927
1929
  return out, 0
1928
1930
 
1929
- out = prim(x)
1931
+ out = prim(x, axis)
1930
1932
  return out, 0
1931
1933
 
1932
- new_axis = move_axis(prim_axis)
1933
- batch_squeeze = P.Squeeze(axis=new_axis)
1934
- out = batch_squeeze(x)
1934
+ new_axis = move_axis(axis)
1935
+ out = prim(x, new_axis)
1935
1936
  return out, 0
1936
1937
 
1937
1938
  return vmap_rule
@@ -512,8 +512,6 @@ _ops_vmap_clone_prim_dict = {
512
512
  "ApplyAdagradV2": P.ApplyAdagradV2,
513
513
  "UniformCandidateSampler": UniformCandidateSampler,
514
514
  "UniqueWithPad": P.UniqueWithPad,
515
- "CdistGrad": G.CdistGrad,
516
- "Cdist": P.Cdist,
517
515
  "STFT": math_ops.STFT,
518
516
  "Conv2D": P.Conv2D,
519
517
  "Conv3D": P.Conv3D,
@@ -26,6 +26,7 @@ from mindspore.ops.function import _VmapGeneralRule
26
26
  from mindspore.ops._vmap.vmap_base import vmap_rules_getters, vmap_general_preprocess, _raise_value_error, \
27
27
  _bdim_at_front, _vmap_clone_prim, _bdim_at_any, _handle_broadcasting
28
28
  from mindspore.ops.auto_generate.gen_arg_handler import Format, Reduction
29
+ from mindspore.ops import auto_generate as gen
29
30
 
30
31
 
31
32
  @vmap_rules_getters.register(G.NLLLossGrad)
@@ -225,33 +226,35 @@ def get_max_pool3d_grad_with_argmax_vmap_rule(prim, axis_size):
225
226
  return vmap_rule
226
227
 
227
228
 
228
- @vmap_rules_getters.register(G.CdistGrad)
229
+ @vmap_rules_getters.register(gen.CdistGrad)
229
230
  def get_cdist_grad_vmap_rule(prim, axis_size):
230
231
  """VmapRule for `cdist grad` operation."""
231
- if hasattr(prim, 'batch_rank'):
232
- batch_rank = prim.batch_rank + 1
232
+ if prim.has_label("batch_rank"):
233
+ batch_rank = prim.get_label("batch_rank") + 1
233
234
  else:
234
235
  batch_rank = 1
235
236
 
236
- batch_prim = _vmap_clone_prim(prim)
237
- batch_prim.add_prim_attr("batch_rank", batch_rank)
237
+ prim = prim.clone()
238
+ prim.set_label('batch_rank', batch_rank)
238
239
 
239
- def vmap_rule(grad_bdim, x_bdim, y_bdim, cdist_bdim):
240
- is_all_none, result = vmap_general_preprocess(prim,
241
- grad_bdim, x_bdim, y_bdim, cdist_bdim)
240
+ def vmap_rule(grad_bdim, x_bdim, y_bdim, cdist_bdim, p_bdim):
241
+ is_all_none, result = vmap_general_preprocess(
242
+ prim, grad_bdim, x_bdim, y_bdim, cdist_bdim, p_bdim
243
+ )
242
244
  if is_all_none:
243
245
  return result
244
246
  grad, grad_dim = grad_bdim
245
247
  x, x_dim = x_bdim
246
248
  y, y_dim = y_bdim
247
249
  cdist, cdist_dim = cdist_bdim
250
+ p, _ = p_bdim
248
251
 
249
252
  grad = _bdim_at_front(grad, grad_dim, axis_size)
250
253
  x = _bdim_at_front(x, x_dim, axis_size)
251
254
  y = _bdim_at_front(y, y_dim, axis_size)
252
255
  cdist = _bdim_at_front(cdist, cdist_dim, axis_size)
253
256
 
254
- out = batch_prim(grad, x, y, cdist)
257
+ out = prim(grad, x, y, cdist, p)
255
258
  return out, 0
256
259
 
257
260
  return vmap_rule
@@ -673,10 +676,11 @@ def get_grid_sampler_grad_vmap_rule(prim, axis_size):
673
676
  else:
674
677
  _raise_value_error("The prim name must be `GridSampler2D` or `GridSampler3D`, but got {}.".format(prim_name))
675
678
 
676
-
677
- def vmap_rule(grad_bdim, input_x_bdim, grid_bdim, interpolation_mode_bdim, padding_mode_bdim, align_corners_bdim):
679
+ def vmap_rule(grad_bdim, input_x_bdim, grid_bdim, interpolation_mode_bdim, padding_mode_bdim, align_corners_bdim,
680
+ output_mask_bdim):
678
681
  is_all_none, result = vmap_general_preprocess(
679
- prim, grad_bdim, input_x_bdim, grid_bdim, interpolation_mode_bdim, padding_mode_bdim, align_corners_bdim)
682
+ prim, grad_bdim, input_x_bdim, grid_bdim, interpolation_mode_bdim, padding_mode_bdim, align_corners_bdim,
683
+ output_mask_bdim)
680
684
  if is_all_none:
681
685
  return result
682
686
 
@@ -686,6 +690,7 @@ def get_grid_sampler_grad_vmap_rule(prim, axis_size):
686
690
  interpolation_mode, _ = interpolation_mode_bdim
687
691
  padding_mode, _ = padding_mode_bdim
688
692
  align_corners, _ = align_corners_bdim
693
+ output_mask, _ = output_mask_bdim
689
694
 
690
695
  grad = _bdim_at_front(grad, grad_dim, axis_size)
691
696
  grad_shape = F.shape(grad)
@@ -699,7 +704,8 @@ def get_grid_sampler_grad_vmap_rule(prim, axis_size):
699
704
  grid_shape = F.shape(grid)
700
705
  grid = F.reshape(grid, (-1,) + grid_shape[non_batch_dim_index:])
701
706
 
702
- dx, dgrid = prim(grad, input_x, grid, interpolation_mode, padding_mode, align_corners)
707
+ dx, dgrid = prim(grad, input_x, grid, interpolation_mode,
708
+ padding_mode, align_corners, output_mask)
703
709
  dx_shape = F.shape(dx)
704
710
  dx_return_shape = input_x_shape[:non_batch_dim_index] + dx_shape[non_batch_dim_index:]
705
711
  dx = F.reshape(dx, dx_return_shape)