mindspore 2.4.10__cp310-none-any.whl → 2.5.0__cp310-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (688)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-310-aarch64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-310-aarch64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-310-aarch64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +98 -21
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -3
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +31 -15
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +5 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +285 -191
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +1 -0
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  80. mindspore/experimental/llm_boost/register.py +1 -0
  81. mindspore/experimental/optim/adadelta.py +26 -22
  82. mindspore/experimental/optim/adam.py +3 -0
  83. mindspore/experimental/optim/lr_scheduler.py +33 -24
  84. mindspore/experimental/optim/radam.py +33 -30
  85. mindspore/hal/device.py +28 -0
  86. mindspore/hal/event.py +17 -0
  87. mindspore/hal/memory.py +94 -3
  88. mindspore/hal/stream.py +91 -6
  89. mindspore/include/api/context.h +0 -1
  90. mindspore/lib/libavcodec.so.59 +0 -0
  91. mindspore/lib/libavdevice.so.59 +0 -0
  92. mindspore/lib/libavfilter.so.8 +0 -0
  93. mindspore/lib/libavformat.so.59 +0 -0
  94. mindspore/lib/libavutil.so.57 +0 -0
  95. mindspore/lib/libdnnl.so.2 +0 -0
  96. mindspore/lib/libmindspore_backend.so +0 -0
  97. mindspore/lib/libmindspore_common.so +0 -0
  98. mindspore/lib/libmindspore_core.so +0 -0
  99. mindspore/lib/libmindspore_glog.so.0 +0 -0
  100. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  101. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  102. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  103. mindspore/lib/libmindspore_ops.so +0 -0
  104. mindspore/lib/libmpi_adapter.so +0 -0
  105. mindspore/lib/libmpi_collective.so +0 -0
  106. mindspore/lib/libnnacl.so +0 -0
  107. mindspore/lib/libopencv_core.so.4.5 +0 -0
  108. mindspore/lib/libps_cache.so +0 -0
  109. mindspore/lib/libswresample.so.4 +0 -0
  110. mindspore/lib/libswscale.so.6 +0 -0
  111. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  112. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  113. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  114. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  115. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/decoder_kv_cache.py +1 -1
  116. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/prompt_kv_cache.py +1 -1
  117. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -1
  121. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/lib/libcust_opapi.so +0 -0
  122. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +224 -0
  123. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/all_finite.py +1 -1
  124. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +1 -1
  125. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +1 -1
  126. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  127. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  128. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  166. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  167. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -1
  172. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  173. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  174. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  175. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  176. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  177. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  178. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  179. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  180. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +957 -955
  181. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops_static.a +0 -0
  182. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/liblcal_static.a +0 -0
  183. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  184. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  185. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  186. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  187. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  188. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  189. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  190. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  191. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  192. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  193. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  194. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  195. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  196. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  197. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  198. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  199. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  200. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  201. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  202. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  203. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  204. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  205. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  206. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  207. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  208. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  209. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  210. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  211. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  212. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  213. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  214. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  215. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  216. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  217. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  218. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  219. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  220. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  221. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  222. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  223. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  224. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  225. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  226. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  227. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  228. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  229. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  230. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  231. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  232. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  233. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  234. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  235. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  236. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  237. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  238. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  239. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  240. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  241. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  242. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  243. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  244. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  245. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  246. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  247. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  248. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  249. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  250. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_layer_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so} +0 -0
  251. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  252. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  253. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  254. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  255. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  256. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  257. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  258. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  259. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  260. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  261. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  262. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  263. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  264. mindspore/log.py +12 -0
  265. mindspore/mindrecord/__init__.py +1 -1
  266. mindspore/mindrecord/config.py +17 -316
  267. mindspore/mindrecord/filereader.py +1 -9
  268. mindspore/mindrecord/filewriter.py +5 -15
  269. mindspore/mindrecord/mindpage.py +1 -9
  270. mindspore/mint/__init__.py +824 -218
  271. mindspore/mint/distributed/__init__.py +66 -4
  272. mindspore/mint/distributed/distributed.py +2594 -44
  273. mindspore/mint/linalg/__init__.py +6 -0
  274. mindspore/mint/nn/__init__.py +473 -14
  275. mindspore/mint/nn/functional.py +486 -11
  276. mindspore/mint/nn/layer/__init__.py +17 -4
  277. mindspore/mint/nn/layer/_functions.py +330 -0
  278. mindspore/mint/nn/layer/activation.py +169 -1
  279. mindspore/mint/nn/layer/basic.py +123 -0
  280. mindspore/mint/nn/layer/conv.py +727 -0
  281. mindspore/mint/nn/layer/normalization.py +215 -19
  282. mindspore/mint/nn/layer/padding.py +797 -0
  283. mindspore/mint/nn/layer/pooling.py +170 -0
  284. mindspore/mint/optim/__init__.py +2 -1
  285. mindspore/mint/optim/adam.py +223 -0
  286. mindspore/mint/optim/adamw.py +26 -19
  287. mindspore/mint/special/__init__.py +2 -1
  288. mindspore/multiprocessing/__init__.py +5 -0
  289. mindspore/nn/cell.py +126 -19
  290. mindspore/nn/dynamic_lr.py +2 -1
  291. mindspore/nn/layer/activation.py +6 -6
  292. mindspore/nn/layer/basic.py +35 -25
  293. mindspore/nn/layer/channel_shuffle.py +3 -3
  294. mindspore/nn/layer/embedding.py +3 -3
  295. mindspore/nn/layer/normalization.py +8 -7
  296. mindspore/nn/layer/padding.py +4 -3
  297. mindspore/nn/layer/pooling.py +47 -13
  298. mindspore/nn/layer/rnn_cells.py +1 -1
  299. mindspore/nn/layer/rnns.py +2 -1
  300. mindspore/nn/layer/timedistributed.py +5 -5
  301. mindspore/nn/layer/transformer.py +48 -26
  302. mindspore/nn/learning_rate_schedule.py +5 -3
  303. mindspore/nn/loss/loss.py +31 -36
  304. mindspore/nn/optim/ada_grad.py +1 -0
  305. mindspore/nn/optim/adadelta.py +2 -2
  306. mindspore/nn/optim/adam.py +1 -1
  307. mindspore/nn/optim/lars.py +1 -4
  308. mindspore/nn/optim/optimizer.py +1 -1
  309. mindspore/nn/optim/rprop.py +2 -2
  310. mindspore/nn/optim/thor.py +2 -1
  311. mindspore/nn/utils/init.py +13 -11
  312. mindspore/nn/wrap/cell_wrapper.py +4 -6
  313. mindspore/nn/wrap/loss_scale.py +3 -4
  314. mindspore/numpy/array_creations.py +60 -62
  315. mindspore/numpy/array_ops.py +148 -143
  316. mindspore/numpy/logic_ops.py +41 -42
  317. mindspore/numpy/math_ops.py +361 -359
  318. mindspore/numpy/utils.py +16 -16
  319. mindspore/numpy/utils_const.py +4 -4
  320. mindspore/ops/__init__.py +2 -1
  321. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  322. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  323. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  324. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  325. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  326. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  327. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  328. mindspore/ops/_vmap/vmap_base.py +0 -2
  329. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  330. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  331. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  332. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  333. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  334. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  335. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  336. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  337. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  338. mindspore/ops/composite/base.py +1 -1
  339. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  340. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  341. mindspore/ops/function/__init__.py +12 -0
  342. mindspore/ops/function/array_func.py +561 -159
  343. mindspore/ops/function/clip_func.py +64 -0
  344. mindspore/ops/function/debug_func.py +28 -20
  345. mindspore/ops/function/image_func.py +1 -1
  346. mindspore/ops/function/linalg_func.py +5 -4
  347. mindspore/ops/function/math_func.py +1659 -290
  348. mindspore/ops/function/nn_func.py +988 -317
  349. mindspore/ops/function/parameter_func.py +3 -56
  350. mindspore/ops/function/random_func.py +243 -33
  351. mindspore/ops/function/sparse_unary_func.py +1 -1
  352. mindspore/ops/functional.py +18 -5
  353. mindspore/ops/functional_overload.py +897 -0
  354. mindspore/ops/operations/__init__.py +3 -2
  355. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  356. mindspore/ops/operations/_grad_ops.py +2 -34
  357. mindspore/ops/operations/_infer_ops.py +2 -1
  358. mindspore/ops/operations/_inner_ops.py +38 -8
  359. mindspore/ops/operations/array_ops.py +45 -303
  360. mindspore/ops/operations/comm_ops.py +19 -16
  361. mindspore/ops/operations/custom_ops.py +11 -55
  362. mindspore/ops/operations/debug_ops.py +42 -47
  363. mindspore/ops/operations/inner_ops.py +6 -4
  364. mindspore/ops/operations/linalg_ops.py +3 -2
  365. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  366. mindspore/ops/operations/math_ops.py +11 -216
  367. mindspore/ops/operations/nn_ops.py +146 -308
  368. mindspore/ops/primitive.py +23 -21
  369. mindspore/ops/tensor_method.py +1669 -0
  370. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  371. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  372. mindspore/ops_generate/arg_handler.py +0 -61
  373. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  374. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  375. mindspore/ops_generate/base_generator.py +11 -0
  376. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  377. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  378. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  379. mindspore/ops_generate/functions_cc_generator.py +233 -0
  380. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  381. mindspore/ops_generate/gen_constants.py +157 -3
  382. mindspore/ops_generate/gen_ops.py +245 -990
  383. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  384. mindspore/ops_generate/gen_utils.py +119 -33
  385. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  386. mindspore/ops_generate/op_api_proto.py +206 -0
  387. mindspore/ops_generate/op_def_py_generator.py +131 -0
  388. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  389. mindspore/ops_generate/op_proto.py +373 -108
  390. mindspore/ops_generate/op_template_parser.py +436 -0
  391. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  392. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  393. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  394. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  395. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  396. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  397. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  398. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  399. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  400. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  401. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  402. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  403. mindspore/ops_generate/pyboost_utils.py +92 -33
  404. mindspore/ops_generate/template.py +294 -44
  405. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  406. mindspore/parallel/__init__.py +3 -3
  407. mindspore/parallel/_auto_parallel_context.py +24 -33
  408. mindspore/parallel/_parallel_serialization.py +13 -2
  409. mindspore/parallel/_utils.py +4 -1
  410. mindspore/parallel/algo_parameter_config.py +1 -1
  411. mindspore/parallel/checkpoint_transform.py +44 -0
  412. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  413. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  414. mindspore/parallel/cluster/run.py +20 -3
  415. mindspore/parallel/parameter_broadcast.py +1 -1
  416. mindspore/parallel/shard.py +3 -0
  417. mindspore/parallel/transform_safetensors.py +119 -253
  418. mindspore/profiler/__init__.py +17 -4
  419. mindspore/profiler/analysis/__init__.py +0 -0
  420. mindspore/profiler/analysis/parser/__init__.py +0 -0
  421. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  422. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  423. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  424. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  425. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  426. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  427. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  428. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  429. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  430. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  431. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  432. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  433. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  434. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  435. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  436. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  437. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  438. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  439. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  440. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  441. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  442. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  443. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  444. mindspore/profiler/analysis/task_manager.py +131 -0
  445. mindspore/profiler/analysis/time_converter.py +84 -0
  446. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  447. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  448. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  449. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  450. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  451. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  452. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  453. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  454. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  455. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  456. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  457. mindspore/profiler/analysis/work_flow.py +73 -0
  458. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  459. mindspore/profiler/common/command_executor.py +90 -0
  460. mindspore/profiler/common/constant.py +174 -3
  461. mindspore/profiler/common/file_manager.py +208 -0
  462. mindspore/profiler/common/log.py +130 -0
  463. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  464. mindspore/profiler/common/path_manager.py +371 -0
  465. mindspore/profiler/common/process_bar.py +168 -0
  466. mindspore/profiler/common/process_pool.py +9 -3
  467. mindspore/profiler/common/profiler_context.py +476 -0
  468. mindspore/profiler/common/profiler_info.py +304 -0
  469. mindspore/profiler/common/profiler_output_path.py +284 -0
  470. mindspore/profiler/common/profiler_parameters.py +210 -0
  471. mindspore/profiler/common/profiler_path_manager.py +120 -0
  472. mindspore/profiler/common/record_function.py +76 -0
  473. mindspore/profiler/common/tlv_decoder.py +76 -0
  474. mindspore/profiler/common/util.py +75 -2
  475. mindspore/profiler/dynamic_profiler.py +270 -37
  476. mindspore/profiler/envprofiler.py +138 -0
  477. mindspore/profiler/mstx.py +199 -0
  478. mindspore/profiler/platform/__init__.py +21 -0
  479. mindspore/profiler/platform/base_profiler.py +40 -0
  480. mindspore/profiler/platform/cpu_profiler.py +124 -0
  481. mindspore/profiler/platform/gpu_profiler.py +74 -0
  482. mindspore/profiler/platform/npu_profiler.py +309 -0
  483. mindspore/profiler/profiler.py +580 -93
  484. mindspore/profiler/profiler_action_controller.py +187 -0
  485. mindspore/profiler/profiler_interface.py +114 -0
  486. mindspore/profiler/schedule.py +208 -0
  487. mindspore/rewrite/api/symbol_tree.py +1 -2
  488. mindspore/run_check/_check_version.py +2 -6
  489. mindspore/runtime/__init__.py +37 -0
  490. mindspore/runtime/device.py +27 -0
  491. mindspore/runtime/event.py +209 -0
  492. mindspore/runtime/executor.py +148 -0
  493. mindspore/runtime/memory.py +392 -0
  494. mindspore/runtime/stream.py +460 -0
  495. mindspore/runtime/thread_bind_core.py +401 -0
  496. mindspore/train/__init__.py +2 -2
  497. mindspore/train/_utils.py +53 -18
  498. mindspore/train/amp.py +8 -4
  499. mindspore/train/callback/_checkpoint.py +32 -18
  500. mindspore/train/callback/_early_stop.py +1 -1
  501. mindspore/train/callback/_flops_collector.py +105 -69
  502. mindspore/train/callback/_history.py +1 -1
  503. mindspore/train/callback/_summary_collector.py +44 -6
  504. mindspore/train/callback/_tft_register.py +31 -10
  505. mindspore/train/dataset_helper.py +11 -11
  506. mindspore/train/metrics/precision.py +4 -5
  507. mindspore/train/mind_ir_pb2.py +167 -46
  508. mindspore/train/model.py +13 -15
  509. mindspore/train/serialization.py +462 -76
  510. mindspore/train/summary/summary_record.py +1 -2
  511. mindspore/train/train_thor/model_thor.py +1 -1
  512. mindspore/utils/__init__.py +4 -2
  513. mindspore/utils/bin/dataset-cache +0 -0
  514. mindspore/utils/bin/dataset-cache-server +0 -0
  515. mindspore/utils/dryrun.py +138 -0
  516. mindspore/utils/runtime_execution_order_check.py +550 -0
  517. mindspore/version.py +1 -1
  518. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  519. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +522 -456
  520. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  521. mindspore/_data_dump.cpython-310-aarch64-linux-gnu.so +0 -0
  522. mindspore/bin/cache_admin +0 -0
  523. mindspore/bin/cache_server +0 -0
  524. mindspore/common/_tensor_overload.py +0 -139
  525. mindspore/lib/libmindspore_np_dtype.so +0 -0
  526. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  527. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  528. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  529. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  530. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  531. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  532. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  533. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  534. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  535. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  536. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  537. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  538. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  539. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  540. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  541. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  542. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  543. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -97
  544. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  545. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  546. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  547. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  548. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  549. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  550. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  551. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  552. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  553. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  554. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  555. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  556. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  557. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  558. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  559. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  560. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  561. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  562. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  563. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  564. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  565. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  566. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  567. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  568. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  569. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  570. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  571. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  572. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  573. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  574. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  575. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  576. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  577. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  578. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  579. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  580. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  581. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  582. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  583. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  584. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  585. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  586. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  587. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  588. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  589. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  590. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  591. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  592. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  593. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  594. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  595. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  596. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  597. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  598. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  599. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  600. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  601. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  602. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  603. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  604. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  605. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  606. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  607. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  608. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  609. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  610. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  611. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  612. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  613. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  614. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  615. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  616. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  617. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  618. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  619. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  620. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  621. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  622. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  623. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  624. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  625. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  626. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  627. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  628. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  629. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  630. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  631. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  632. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  633. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  634. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  635. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  636. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  637. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  638. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  639. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  640. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  641. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  642. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  643. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  644. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  645. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  646. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  647. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  648. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  649. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  650. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  651. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  652. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  653. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  654. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  655. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  656. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  657. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  658. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  659. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  660. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  661. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  662. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  663. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  664. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  665. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  666. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  667. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  668. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  669. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  670. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  671. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  672. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  673. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  674. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  685. mindspore/profiler/envprofiling.py +0 -254
  686. mindspore/profiler/profiling.py +0 -1926
  687. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  688. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -1,29 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_DIV_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_DIV_IMPL_H_
18
- #include "elewise_binary_impl.h"
19
- namespace mindspore {
20
- namespace internal {
21
- class DivImpl : public ElewiseBinaryImpl {
22
- public:
23
- DivImpl(const OpParamPtr &param) : ElewiseBinaryImpl(param) {}
24
- virtual ~DivImpl() {}
25
- int Launch() override;
26
- };
27
- } // namespace internal
28
- } // namespace mindspore
29
- #endif // MS_KERNELS_INTERNAL_KERNEL_DIV_IMPL_H_
@@ -1,48 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ELEWISE_BINARY_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_ELEWISE_BINARY_IMPL_H_
18
-
19
- #include <vector>
20
- #include "include/internal_kernel.h"
21
- #include "include/param/elewise_param.h"
22
-
23
- namespace mindspore {
24
- namespace internal {
25
- class ElewiseBinaryImpl : public InternelKernelImpl {
26
- public:
27
- ElewiseBinaryImpl(const OpParamPtr &param) : InternelKernelImpl(param) {}
28
- virtual ~ElewiseBinaryImpl() {}
29
- bool Init(const ValidateInfo &info) override;
30
- int Launch() { return -1; };
31
- int Tiling(HostRawBuf &tilingBuf) override;
32
- void SetStream(const void *stream_ptr) override;
33
- void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) override;
34
- uint64_t GetTilingBufSize() override;
35
- std::vector<uint64_t> GetWorkSpaceSize() override;
36
- int InferShape(const std::vector<DIMS> &input_shapes, std::vector<DIMS> &output_shapes) override;
37
- virtual int32_t GetMaxUbCount(uint32_t op_dtype);
38
- bool IsSupported() override;
39
-
40
- protected:
41
- void *stream_ptr_ = nullptr;
42
- uint8_t *device_tiling_ = nullptr;
43
- uint32_t aligned_factor_ = 128;
44
- uint32_t ub_dtype = 0;
45
- };
46
- } // namespace internal
47
- } // namespace mindspore
48
- #endif // MS_KERNELS_INTERNAL_KERNEL_ELEWISE_BINARY_IMPL_H_
@@ -1,25 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_ASCENDC_ELEWISE_BINARY_TILING_H_
17
- #define MS_KERNELS_INTERNAL_ASCENDC_ELEWISE_BINARY_TILING_H_
18
- #include "utils/elewise_tiling.h"
19
- namespace mindspore::internal {
20
- struct ElewiseBinaryTilingData : public ElewiseTailTilingData {
21
- uint32_t broadcast_mode_{0};
22
- uint32_t op_dtype_{0};
23
- };
24
- } // namespace mindspore::internal
25
- #endif // MS_KERNELS_INTERNAL_ASCENDC_ELEWISE_BINARY_TILING_H_
@@ -1,46 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_AND_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_AND_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = int16_t>
23
- class AndI16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline AndI16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::And); }
26
- };
27
-
28
- template <typename T = uint16_t>
29
- class AndU16 : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline AndU16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::And); }
32
- };
33
-
34
- extern "C" __global__ __aicore__ void and_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
35
- if (dtype == 6) { // int16
36
- AndI16<int16_t> op;
37
- op.InitBinary(x1, x2, y, tiling);
38
- op.ProcessBinary();
39
- } else if (dtype == 7) { // uint16
40
- AndU16<uint16_t> op;
41
- op.InitBinary(x1, x2, y, tiling);
42
- op.ProcessBinary();
43
- }
44
- }
45
-
46
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_AND_KERNEL_H_
@@ -1,46 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_DIV_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_DIV_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = half>
23
- class DivFp16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline DivFp16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Div); }
26
- };
27
-
28
- template <typename T = float>
29
- class DivFp32 : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline DivFp32() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Div); }
32
- };
33
-
34
- extern "C" __global__ __aicore__ void div_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
35
- if (dtype == 1) { // fp16
36
- DivFp16<half> op;
37
- op.InitBinary(x1, x2, y, tiling);
38
- op.ProcessBinary();
39
- } else if (dtype == 0) { // fp32
40
- DivFp32<float> op;
41
- op.InitBinary(x1, x2, y, tiling);
42
- op.ProcessBinary();
43
- }
44
- }
45
-
46
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_DIV_KERNEL_H_
@@ -1,260 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_BASE_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_BASE_H_
19
-
20
- #include "kernel_operator.h"
21
-
22
- using namespace AscendC;
23
-
24
- template <typename IN_TYPE>
25
- class ElewiseBaseWide {
26
- public:
27
- __aicore__ inline ElewiseBaseWide(){};
28
- __aicore__ inline void InitBinary(GM_ADDR in1, GM_ADDR in2, GM_ADDR out, GM_ADDR tiling) {
29
- gm_in1 = reinterpret_cast<__gm__ IN_TYPE *>(in1);
30
- gm_in2 = reinterpret_cast<__gm__ IN_TYPE *>(in2);
31
- gm_out = reinterpret_cast<__gm__ IN_TYPE *>(out);
32
- SetTilingInfo(tiling);
33
- }
34
-
35
- __aicore__ inline void ProcessBinary() {
36
- if (broadcast_mode == 0) {
37
- return BroadcastNone();
38
- } else if (broadcast_mode == 3) {
39
- return ScalarLeft();
40
- } else if (broadcast_mode == 4) {
41
- return ScalarRight();
42
- }
43
- }
44
- __aicore__ inline void SetBinaryFunc(void (*func)(const LocalTensor<IN_TYPE> &dstLocal,
45
- const LocalTensor<IN_TYPE> &src0Local,
46
- const LocalTensor<IN_TYPE> &src1Local, const int &calCount)) {
47
- elewise_binary_func_ = func;
48
- }
49
-
50
- private:
51
- __aicore__ inline void SetTilingInfo(GM_ADDR tiling) {
52
- core_idx = get_block_idx();
53
- core_num = get_block_num();
54
-
55
- avg_block_count = (uint32_t)(*((__gm__ uint32_t *)tiling + 0));
56
- avg_block_ub_num = (uint32_t)(*((__gm__ uint32_t *)tiling + 1));
57
- avg_block_ub_tail = (uint32_t)(*((__gm__ uint32_t *)tiling + 2));
58
- avg_block_ub_loop = (uint32_t)(*((__gm__ uint32_t *)tiling + 3));
59
- tail_block_count = (uint32_t)(*((__gm__ uint32_t *)tiling + 4));
60
- tail_block_ub_num = (uint32_t)(*((__gm__ uint32_t *)tiling + 5));
61
- tail_block_ub_tail = (uint32_t)(*((__gm__ uint32_t *)tiling + 6));
62
- tail_block_ub_loop = (uint32_t)(*((__gm__ uint32_t *)tiling + 7));
63
-
64
- buffer_num = (uint32_t)(*((__gm__ uint32_t *)tiling + 8));
65
- broadcast_mode = (uint32_t)(*((__gm__ uint32_t *)tiling + 10));
66
- }
67
- __aicore__ inline void SetUbParam(uint32_t &ub_count, uint32_t &ub_loop, uint32_t &ub_tail) {
68
- ub_count = avg_block_ub_num;
69
- ub_loop = avg_block_ub_loop;
70
- ub_tail = avg_block_ub_tail;
71
-
72
- if (core_idx == core_num - 1) {
73
- ub_count = tail_block_ub_num;
74
- ub_loop = tail_block_ub_loop;
75
- ub_tail = tail_block_ub_tail;
76
- }
77
- }
78
- __aicore__ inline void InitInOut(uint32_t count) {
79
- pipe.InitBuffer(in1Que, buffer_num, count * sizeof(IN_TYPE));
80
- pipe.InitBuffer(in2Que, buffer_num, count * sizeof(IN_TYPE));
81
- pipe.InitBuffer(outQue, buffer_num, count * sizeof(IN_TYPE));
82
- }
83
-
84
- __aicore__ inline void CopyOut(uint32_t idx, uint32_t stride, uint32_t count) {
85
- LocalTensor<IN_TYPE> out = outQue.DeQue<IN_TYPE>();
86
- DataCopy(outGm[idx * stride], out, count);
87
- outQue.FreeTensor(out);
88
- }
89
-
90
- __aicore__ inline void CopyIn1(uint32_t idx, uint32_t stride, uint32_t count) {
91
- LocalTensor<IN_TYPE> in1 = in1Que.AllocTensor<IN_TYPE>();
92
- DataCopy(in1, in1Gm[idx * stride], count);
93
- in1Que.EnQue(in1);
94
- }
95
-
96
- __aicore__ inline void CopyIn2(uint32_t idx, uint32_t stride, uint32_t count) {
97
- LocalTensor<IN_TYPE> in2 = in2Que.AllocTensor<IN_TYPE>();
98
- DataCopy(in2, in2Gm[idx * stride], count);
99
- in2Que.EnQue(in2);
100
- }
101
-
102
- __aicore__ inline void BroadcastNone() {
103
- uint32_t ub_count, ub_loop, ub_tail;
104
- SetUbParam(ub_count, ub_loop, ub_tail);
105
-
106
- in1Gm.SetGlobalBuffer(gm_in1 + core_idx * avg_block_count);
107
- in2Gm.SetGlobalBuffer(gm_in2 + core_idx * avg_block_count);
108
- outGm.SetGlobalBuffer(gm_out + core_idx * avg_block_count);
109
-
110
- InitInOut(ub_count);
111
-
112
- uint32_t loop = 0;
113
- for (; loop < ub_loop - 1; loop++) {
114
- CopyIn1(loop, ub_count, ub_count);
115
- CopyIn2(loop, ub_count, ub_count);
116
- ComputeNone(ub_count);
117
- CopyOut(loop, ub_count, ub_count);
118
- }
119
-
120
- /* for ub tail */
121
- if (ub_tail <= 0) {
122
- return;
123
- }
124
- CopyIn1(loop, ub_count, ub_count);
125
- CopyIn2(loop, ub_count, ub_tail);
126
- ComputeNone(ub_tail);
127
- CopyOut(loop, ub_count, ub_tail);
128
- }
129
- __aicore__ inline void ScalarLeft() {
130
- uint32_t ub_count, ub_loop, ub_tail;
131
- SetUbParam(ub_count, ub_loop, ub_tail);
132
-
133
- in1Gm.SetGlobalBuffer(gm_in1);
134
- in2Gm.SetGlobalBuffer(gm_in2 + core_idx * avg_block_count);
135
- outGm.SetGlobalBuffer(gm_out + core_idx * avg_block_count);
136
-
137
- InitInOut(ub_count);
138
-
139
- /* input tensor init once */
140
- LocalTensor<IN_TYPE> scalar_t = in1Que.AllocTensor<IN_TYPE>();
141
- IN_TYPE scalar_value = in1Gm.GetValue(0);
142
- Duplicate(scalar_t, scalar_value, ub_count);
143
- pipe_barrier(PIPE_ALL);
144
-
145
- uint32_t loop = 0;
146
- for (; loop < ub_loop - 1; loop++) {
147
- CopyIn2(loop, ub_count, ub_count);
148
- ComputeLeft(ub_count, scalar_t);
149
- CopyOut(loop, ub_count, ub_count);
150
- }
151
-
152
- /* for ub tail */
153
- if (ub_tail <= 0) {
154
- return;
155
- }
156
- CopyIn2(loop, ub_count, ub_tail);
157
- ComputeLeft(ub_tail, scalar_t);
158
- CopyOut(loop, ub_count, ub_tail);
159
-
160
- /* free*/
161
- in1Que.FreeTensor(scalar_t);
162
- }
163
- __aicore__ inline void ScalarRight() {
164
- uint32_t ub_count, ub_loop, ub_tail;
165
- SetUbParam(ub_count, ub_loop, ub_tail);
166
-
167
- in1Gm.SetGlobalBuffer(gm_in1 + core_idx * avg_block_count);
168
- in2Gm.SetGlobalBuffer(gm_in2);
169
- outGm.SetGlobalBuffer(gm_out + core_idx * avg_block_count);
170
-
171
- InitInOut(ub_count);
172
-
173
- /* input tensor init once */
174
- LocalTensor<IN_TYPE> scalar_t = in2Que.AllocTensor<IN_TYPE>();
175
- IN_TYPE scalar_value = in2Gm.GetValue(0);
176
- Duplicate(scalar_t, scalar_value, ub_count);
177
- pipe_barrier(PIPE_ALL);
178
-
179
- uint32_t loop = 0;
180
- for (; loop < ub_loop - 1; loop++) {
181
- CopyIn1(loop, ub_count, ub_count);
182
- ComputeRight(ub_count, scalar_t);
183
- CopyOut(loop, ub_count, ub_count);
184
- }
185
-
186
- /* for ub tail */
187
- if (ub_tail <= 0) {
188
- return;
189
- }
190
- CopyIn1(loop, ub_count, ub_tail);
191
- ComputeRight(ub_tail, scalar_t);
192
- CopyOut(loop, ub_count, ub_tail);
193
-
194
- /* free*/
195
- in2Que.FreeTensor(scalar_t);
196
- }
197
-
198
- __aicore__ inline void ComputeLeft(uint32_t count, LocalTensor<IN_TYPE> &scalar_t) {
199
- LocalTensor<IN_TYPE> in2 = in2Que.DeQue<IN_TYPE>();
200
- LocalTensor<IN_TYPE> out = outQue.AllocTensor<IN_TYPE>();
201
- elewise_binary_func_(out, scalar_t, in2, count);
202
- in2Que.FreeTensor(in2);
203
- pipe_barrier(PIPE_ALL);
204
- outQue.EnQue(out);
205
- }
206
-
207
- __aicore__ inline void ComputeRight(uint32_t count, LocalTensor<IN_TYPE> &scalar_t) {
208
- LocalTensor<IN_TYPE> in1 = in1Que.DeQue<IN_TYPE>();
209
- LocalTensor<IN_TYPE> out = outQue.AllocTensor<IN_TYPE>();
210
- elewise_binary_func_(out, in1, scalar_t, count);
211
- in1Que.FreeTensor(in1);
212
- pipe_barrier(PIPE_ALL);
213
- outQue.EnQue(out);
214
- }
215
-
216
- __aicore__ inline void ComputeNone(uint32_t count) {
217
- LocalTensor<IN_TYPE> in1 = in1Que.DeQue<IN_TYPE>();
218
- LocalTensor<IN_TYPE> in2 = in2Que.DeQue<IN_TYPE>();
219
- LocalTensor<IN_TYPE> out = outQue.AllocTensor<IN_TYPE>();
220
- elewise_binary_func_(out, in1, in2, count);
221
- in1Que.FreeTensor(in1);
222
- in2Que.FreeTensor(in2);
223
- pipe_barrier(PIPE_ALL);
224
- outQue.EnQue(out);
225
- }
226
-
227
- private:
228
- void (*elewise_binary_func_)(const LocalTensor<IN_TYPE> &dstLocal, const LocalTensor<IN_TYPE> &src0Local,
229
- const LocalTensor<IN_TYPE> &src1Local, const int &calCount);
230
-
231
- TPipe pipe;
232
- TQue<AscendC::QuePosition::VECIN, 1> in1Que;
233
- TQue<AscendC::QuePosition::VECIN, 1> in2Que;
234
- TQue<AscendC::QuePosition::VECOUT, 1> outQue;
235
-
236
- __gm__ IN_TYPE *__restrict__ gm_in1{nullptr};
237
- __gm__ IN_TYPE *__restrict__ gm_in2{nullptr};
238
- __gm__ IN_TYPE *__restrict__ gm_out{nullptr};
239
-
240
- GlobalTensor<IN_TYPE> in1Gm;
241
- GlobalTensor<IN_TYPE> in2Gm;
242
- GlobalTensor<IN_TYPE> outGm;
243
-
244
- uint32_t core_idx{0};
245
- uint32_t core_num{0};
246
- uint32_t buffer_num{0};
247
- uint32_t broadcast_mode{0};
248
-
249
- uint32_t avg_block_count{0};
250
- uint32_t avg_block_ub_num{0};
251
- uint32_t avg_block_ub_tail{0};
252
- uint32_t avg_block_ub_loop{0};
253
-
254
- uint32_t tail_block_count{0};
255
- uint32_t tail_block_ub_num{0};
256
- uint32_t tail_block_ub_tail{0};
257
- uint32_t tail_block_ub_loop{0};
258
- };
259
-
260
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_BASE_H_
@@ -1,35 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_ELEWISE_BINARY_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_ELEWISE_BINARY_KERNEL_H_
19
-
20
// Launch functions for the element-wise binary kernels. All seven share one
// signature and are defined outside this header.
// NOTE(review): judging by the parameter names these are host-side launchers
// taking a block count, an L2 control handle, a stream, three data buffers,
// a tiling buffer and a numeric dtype code - confirm against the definitions.

void elewise_sub(uint32_t blockDim, void *l2ctrl, void *stream,
                 uint8_t *in1, uint8_t *in2, uint8_t *out,
                 uint8_t *tiling, int dtype);

void elewise_mul(uint32_t blockDim, void *l2ctrl, void *stream,
                 uint8_t *in1, uint8_t *in2, uint8_t *out,
                 uint8_t *tiling, int dtype);

void elewise_div(uint32_t blockDim, void *l2ctrl, void *stream,
                 uint8_t *in1, uint8_t *in2, uint8_t *out,
                 uint8_t *tiling, int dtype);

void elewise_min(uint32_t blockDim, void *l2ctrl, void *stream,
                 uint8_t *in1, uint8_t *in2, uint8_t *out,
                 uint8_t *tiling, int dtype);

void elewise_max(uint32_t blockDim, void *l2ctrl, void *stream,
                 uint8_t *in1, uint8_t *in2, uint8_t *out,
                 uint8_t *tiling, int dtype);

void elewise_and(uint32_t blockDim, void *l2ctrl, void *stream,
                 uint8_t *in1, uint8_t *in2, uint8_t *out,
                 uint8_t *tiling, int dtype);

void elewise_or(uint32_t blockDim, void *l2ctrl, void *stream,
                uint8_t *in1, uint8_t *in2, uint8_t *out,
                uint8_t *tiling, int dtype);
34
-
35
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_ELEWISE_BINARY_KERNEL_H_
@@ -1,66 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MAX_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MAX_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = int16_t>
23
- class MaxI16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline MaxI16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
26
- };
27
-
28
- template <typename T = int32_t>
29
- class MaxInt : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline MaxInt() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
32
- };
33
-
34
- template <typename T = half>
35
- class MaxFp16 : public ElewiseBaseWide<T> {
36
- public:
37
- __aicore__ inline MaxFp16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
38
- };
39
-
40
- template <typename T = float>
41
- class MaxFp32 : public ElewiseBaseWide<T> {
42
- public:
43
- __aicore__ inline MaxFp32() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
44
- };
45
-
46
- extern "C" __global__ __aicore__ void max_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
47
- if (dtype == 3) { // int32
48
- MaxInt<int32_t> op;
49
- op.InitBinary(x1, x2, y, tiling);
50
- op.ProcessBinary();
51
- } else if (dtype == 1) { // fp16
52
- MaxFp16<half> op;
53
- op.InitBinary(x1, x2, y, tiling);
54
- op.ProcessBinary();
55
- } else if (dtype == 0) { // fp32
56
- MaxFp32<float> op;
57
- op.InitBinary(x1, x2, y, tiling);
58
- op.ProcessBinary();
59
- } else if (dtype == 6) { // int16
60
- MaxI16<int16_t> op;
61
- op.InitBinary(x1, x2, y, tiling);
62
- op.ProcessBinary();
63
- }
64
- }
65
-
66
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MAX_KERNEL_H_
@@ -1,66 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MIN_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MIN_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = int16_t>
23
- class MinI16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline MinI16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
26
- };
27
-
28
- template <typename T = int32_t>
29
- class MinInt : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline MinInt() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
32
- };
33
-
34
- template <typename T = half>
35
- class MinFp16 : public ElewiseBaseWide<T> {
36
- public:
37
- __aicore__ inline MinFp16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
38
- };
39
-
40
- template <typename T = float>
41
- class MinFp32 : public ElewiseBaseWide<T> {
42
- public:
43
- __aicore__ inline MinFp32() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
44
- };
45
-
46
- extern "C" __global__ __aicore__ void min_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
47
- if (dtype == 3) { // int32
48
- MinInt<int32_t> op;
49
- op.InitBinary(x1, x2, y, tiling);
50
- op.ProcessBinary();
51
- } else if (dtype == 1) { // fp16
52
- MinFp16<half> op;
53
- op.InitBinary(x1, x2, y, tiling);
54
- op.ProcessBinary();
55
- } else if (dtype == 0) { // fp32
56
- MinFp32<float> op;
57
- op.InitBinary(x1, x2, y, tiling);
58
- op.ProcessBinary();
59
- } else if (dtype == 6) { // int16
60
- MinI16<int16_t> op;
61
- op.InitBinary(x1, x2, y, tiling);
62
- op.ProcessBinary();
63
- }
64
- }
65
-
66
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MIN_KERNEL_H_