mindspore 2.4.10__cp311-none-any.whl → 2.5.0__cp311-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (690)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-311-aarch64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-311-aarch64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-311-aarch64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +98 -21
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -3
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +31 -15
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +5 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +285 -191
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +1 -0
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  80. mindspore/experimental/llm_boost/register.py +1 -0
  81. mindspore/experimental/optim/adadelta.py +26 -22
  82. mindspore/experimental/optim/adam.py +3 -0
  83. mindspore/experimental/optim/lr_scheduler.py +33 -24
  84. mindspore/experimental/optim/radam.py +33 -30
  85. mindspore/hal/device.py +28 -0
  86. mindspore/hal/event.py +17 -0
  87. mindspore/hal/memory.py +94 -3
  88. mindspore/hal/stream.py +91 -6
  89. mindspore/include/api/context.h +0 -1
  90. mindspore/lib/libavcodec.so.59 +0 -0
  91. mindspore/lib/libavdevice.so.59 +0 -0
  92. mindspore/lib/libavfilter.so.8 +0 -0
  93. mindspore/lib/libavformat.so.59 +0 -0
  94. mindspore/lib/libavutil.so.57 +0 -0
  95. mindspore/lib/libdnnl.so.2 +0 -0
  96. mindspore/lib/libmindspore_backend.so +0 -0
  97. mindspore/lib/libmindspore_common.so +0 -0
  98. mindspore/lib/libmindspore_core.so +0 -0
  99. mindspore/lib/libmindspore_glog.so.0 +0 -0
  100. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  101. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  102. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  103. mindspore/lib/libmindspore_ops.so +0 -0
  104. mindspore/lib/libmpi_adapter.so +0 -0
  105. mindspore/lib/libmpi_collective.so +0 -0
  106. mindspore/lib/libnnacl.so +0 -0
  107. mindspore/lib/libopencv_core.so.4.5 +0 -0
  108. mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
  109. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  110. mindspore/lib/libps_cache.so +0 -0
  111. mindspore/lib/libswresample.so.4 +0 -0
  112. mindspore/lib/libswscale.so.6 +0 -0
  113. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  114. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  115. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  116. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  117. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/decoder_kv_cache.py +1 -1
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/prompt_kv_cache.py +1 -1
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  121. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  122. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -1
  123. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/lib/libcust_opapi.so +0 -0
  124. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +224 -0
  125. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/all_finite.py +1 -1
  126. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +1 -1
  127. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +1 -1
  128. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  166. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  167. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  172. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  173. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -1
  174. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  175. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  176. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  177. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  178. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  179. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  180. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  181. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  182. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +957 -955
  183. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops_static.a +0 -0
  184. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/liblcal_static.a +0 -0
  185. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  186. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  187. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  188. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  189. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  190. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  191. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  192. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  193. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  194. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  195. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  196. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  197. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  198. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  199. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  200. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  201. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  202. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  203. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  204. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  205. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  206. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  207. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  208. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  209. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  210. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  211. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  212. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  213. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  214. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  215. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  216. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  217. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  218. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  219. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  220. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  221. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  222. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  223. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  224. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  225. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  226. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  227. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  228. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  229. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  230. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  231. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  232. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  233. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  234. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  235. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  236. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  237. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  238. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  239. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  240. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  241. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  242. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  243. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  244. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  245. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  246. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  247. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  248. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  249. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  250. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  251. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  252. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_layer_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so} +0 -0
  253. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  254. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  255. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  256. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  257. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  258. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  259. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  260. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  261. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  262. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  263. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  264. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  265. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  266. mindspore/log.py +12 -0
  267. mindspore/mindrecord/__init__.py +1 -1
  268. mindspore/mindrecord/config.py +17 -316
  269. mindspore/mindrecord/filereader.py +1 -9
  270. mindspore/mindrecord/filewriter.py +5 -15
  271. mindspore/mindrecord/mindpage.py +1 -9
  272. mindspore/mint/__init__.py +824 -218
  273. mindspore/mint/distributed/__init__.py +66 -4
  274. mindspore/mint/distributed/distributed.py +2594 -44
  275. mindspore/mint/linalg/__init__.py +6 -0
  276. mindspore/mint/nn/__init__.py +473 -14
  277. mindspore/mint/nn/functional.py +486 -11
  278. mindspore/mint/nn/layer/__init__.py +17 -4
  279. mindspore/mint/nn/layer/_functions.py +330 -0
  280. mindspore/mint/nn/layer/activation.py +169 -1
  281. mindspore/mint/nn/layer/basic.py +123 -0
  282. mindspore/mint/nn/layer/conv.py +727 -0
  283. mindspore/mint/nn/layer/normalization.py +215 -19
  284. mindspore/mint/nn/layer/padding.py +797 -0
  285. mindspore/mint/nn/layer/pooling.py +170 -0
  286. mindspore/mint/optim/__init__.py +2 -1
  287. mindspore/mint/optim/adam.py +223 -0
  288. mindspore/mint/optim/adamw.py +26 -19
  289. mindspore/mint/special/__init__.py +2 -1
  290. mindspore/multiprocessing/__init__.py +5 -0
  291. mindspore/nn/cell.py +126 -19
  292. mindspore/nn/dynamic_lr.py +2 -1
  293. mindspore/nn/layer/activation.py +6 -6
  294. mindspore/nn/layer/basic.py +35 -25
  295. mindspore/nn/layer/channel_shuffle.py +3 -3
  296. mindspore/nn/layer/embedding.py +3 -3
  297. mindspore/nn/layer/normalization.py +8 -7
  298. mindspore/nn/layer/padding.py +4 -3
  299. mindspore/nn/layer/pooling.py +47 -13
  300. mindspore/nn/layer/rnn_cells.py +1 -1
  301. mindspore/nn/layer/rnns.py +2 -1
  302. mindspore/nn/layer/timedistributed.py +5 -5
  303. mindspore/nn/layer/transformer.py +48 -26
  304. mindspore/nn/learning_rate_schedule.py +5 -3
  305. mindspore/nn/loss/loss.py +31 -36
  306. mindspore/nn/optim/ada_grad.py +1 -0
  307. mindspore/nn/optim/adadelta.py +2 -2
  308. mindspore/nn/optim/adam.py +1 -1
  309. mindspore/nn/optim/lars.py +1 -4
  310. mindspore/nn/optim/optimizer.py +1 -1
  311. mindspore/nn/optim/rprop.py +2 -2
  312. mindspore/nn/optim/thor.py +2 -1
  313. mindspore/nn/utils/init.py +13 -11
  314. mindspore/nn/wrap/cell_wrapper.py +4 -6
  315. mindspore/nn/wrap/loss_scale.py +3 -4
  316. mindspore/numpy/array_creations.py +60 -62
  317. mindspore/numpy/array_ops.py +148 -143
  318. mindspore/numpy/logic_ops.py +41 -42
  319. mindspore/numpy/math_ops.py +361 -359
  320. mindspore/numpy/utils.py +16 -16
  321. mindspore/numpy/utils_const.py +4 -4
  322. mindspore/ops/__init__.py +2 -1
  323. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  324. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  325. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  326. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  327. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  328. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  329. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  330. mindspore/ops/_vmap/vmap_base.py +0 -2
  331. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  332. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  333. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  334. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  335. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  336. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  337. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  338. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  339. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  340. mindspore/ops/composite/base.py +1 -1
  341. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  342. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  343. mindspore/ops/function/__init__.py +12 -0
  344. mindspore/ops/function/array_func.py +561 -159
  345. mindspore/ops/function/clip_func.py +64 -0
  346. mindspore/ops/function/debug_func.py +28 -20
  347. mindspore/ops/function/image_func.py +1 -1
  348. mindspore/ops/function/linalg_func.py +5 -4
  349. mindspore/ops/function/math_func.py +1659 -290
  350. mindspore/ops/function/nn_func.py +988 -317
  351. mindspore/ops/function/parameter_func.py +3 -56
  352. mindspore/ops/function/random_func.py +243 -33
  353. mindspore/ops/function/sparse_unary_func.py +1 -1
  354. mindspore/ops/functional.py +18 -5
  355. mindspore/ops/functional_overload.py +897 -0
  356. mindspore/ops/operations/__init__.py +3 -2
  357. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  358. mindspore/ops/operations/_grad_ops.py +2 -34
  359. mindspore/ops/operations/_infer_ops.py +2 -1
  360. mindspore/ops/operations/_inner_ops.py +38 -8
  361. mindspore/ops/operations/array_ops.py +45 -303
  362. mindspore/ops/operations/comm_ops.py +19 -16
  363. mindspore/ops/operations/custom_ops.py +11 -55
  364. mindspore/ops/operations/debug_ops.py +42 -47
  365. mindspore/ops/operations/inner_ops.py +6 -4
  366. mindspore/ops/operations/linalg_ops.py +3 -2
  367. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  368. mindspore/ops/operations/math_ops.py +11 -216
  369. mindspore/ops/operations/nn_ops.py +146 -308
  370. mindspore/ops/primitive.py +23 -21
  371. mindspore/ops/tensor_method.py +1669 -0
  372. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  373. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  374. mindspore/ops_generate/arg_handler.py +0 -61
  375. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  376. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  377. mindspore/ops_generate/base_generator.py +11 -0
  378. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  379. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  380. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  381. mindspore/ops_generate/functions_cc_generator.py +233 -0
  382. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  383. mindspore/ops_generate/gen_constants.py +157 -3
  384. mindspore/ops_generate/gen_ops.py +245 -990
  385. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  386. mindspore/ops_generate/gen_utils.py +119 -33
  387. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  388. mindspore/ops_generate/op_api_proto.py +206 -0
  389. mindspore/ops_generate/op_def_py_generator.py +131 -0
  390. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  391. mindspore/ops_generate/op_proto.py +373 -108
  392. mindspore/ops_generate/op_template_parser.py +436 -0
  393. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  394. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  395. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  396. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  397. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  398. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  399. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  400. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  401. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  402. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  403. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  404. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  405. mindspore/ops_generate/pyboost_utils.py +92 -33
  406. mindspore/ops_generate/template.py +294 -44
  407. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  408. mindspore/parallel/__init__.py +3 -3
  409. mindspore/parallel/_auto_parallel_context.py +24 -33
  410. mindspore/parallel/_parallel_serialization.py +13 -2
  411. mindspore/parallel/_utils.py +4 -1
  412. mindspore/parallel/algo_parameter_config.py +1 -1
  413. mindspore/parallel/checkpoint_transform.py +44 -0
  414. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  415. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  416. mindspore/parallel/cluster/run.py +20 -3
  417. mindspore/parallel/parameter_broadcast.py +1 -1
  418. mindspore/parallel/shard.py +3 -0
  419. mindspore/parallel/transform_safetensors.py +119 -253
  420. mindspore/profiler/__init__.py +17 -4
  421. mindspore/profiler/analysis/__init__.py +0 -0
  422. mindspore/profiler/analysis/parser/__init__.py +0 -0
  423. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  424. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  425. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  426. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  427. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  428. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  429. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  430. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  431. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  432. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  433. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  434. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  435. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  436. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  437. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  438. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  439. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  440. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  441. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  442. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  443. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  444. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  445. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  446. mindspore/profiler/analysis/task_manager.py +131 -0
  447. mindspore/profiler/analysis/time_converter.py +84 -0
  448. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  449. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  450. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  451. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  452. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  453. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  454. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  455. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  456. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  457. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  458. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  459. mindspore/profiler/analysis/work_flow.py +73 -0
  460. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  461. mindspore/profiler/common/command_executor.py +90 -0
  462. mindspore/profiler/common/constant.py +174 -3
  463. mindspore/profiler/common/file_manager.py +208 -0
  464. mindspore/profiler/common/log.py +130 -0
  465. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  466. mindspore/profiler/common/path_manager.py +371 -0
  467. mindspore/profiler/common/process_bar.py +168 -0
  468. mindspore/profiler/common/process_pool.py +9 -3
  469. mindspore/profiler/common/profiler_context.py +476 -0
  470. mindspore/profiler/common/profiler_info.py +304 -0
  471. mindspore/profiler/common/profiler_output_path.py +284 -0
  472. mindspore/profiler/common/profiler_parameters.py +210 -0
  473. mindspore/profiler/common/profiler_path_manager.py +120 -0
  474. mindspore/profiler/common/record_function.py +76 -0
  475. mindspore/profiler/common/tlv_decoder.py +76 -0
  476. mindspore/profiler/common/util.py +75 -2
  477. mindspore/profiler/dynamic_profiler.py +270 -37
  478. mindspore/profiler/envprofiler.py +138 -0
  479. mindspore/profiler/mstx.py +199 -0
  480. mindspore/profiler/platform/__init__.py +21 -0
  481. mindspore/profiler/platform/base_profiler.py +40 -0
  482. mindspore/profiler/platform/cpu_profiler.py +124 -0
  483. mindspore/profiler/platform/gpu_profiler.py +74 -0
  484. mindspore/profiler/platform/npu_profiler.py +309 -0
  485. mindspore/profiler/profiler.py +580 -93
  486. mindspore/profiler/profiler_action_controller.py +187 -0
  487. mindspore/profiler/profiler_interface.py +114 -0
  488. mindspore/profiler/schedule.py +208 -0
  489. mindspore/rewrite/api/symbol_tree.py +1 -2
  490. mindspore/run_check/_check_version.py +2 -6
  491. mindspore/runtime/__init__.py +37 -0
  492. mindspore/runtime/device.py +27 -0
  493. mindspore/runtime/event.py +209 -0
  494. mindspore/runtime/executor.py +148 -0
  495. mindspore/runtime/memory.py +392 -0
  496. mindspore/runtime/stream.py +460 -0
  497. mindspore/runtime/thread_bind_core.py +401 -0
  498. mindspore/train/__init__.py +2 -2
  499. mindspore/train/_utils.py +53 -18
  500. mindspore/train/amp.py +8 -4
  501. mindspore/train/callback/_checkpoint.py +32 -18
  502. mindspore/train/callback/_early_stop.py +1 -1
  503. mindspore/train/callback/_flops_collector.py +105 -69
  504. mindspore/train/callback/_history.py +1 -1
  505. mindspore/train/callback/_summary_collector.py +44 -6
  506. mindspore/train/callback/_tft_register.py +31 -10
  507. mindspore/train/dataset_helper.py +11 -11
  508. mindspore/train/metrics/precision.py +4 -5
  509. mindspore/train/mind_ir_pb2.py +167 -46
  510. mindspore/train/model.py +13 -15
  511. mindspore/train/serialization.py +462 -76
  512. mindspore/train/summary/summary_record.py +1 -2
  513. mindspore/train/train_thor/model_thor.py +1 -1
  514. mindspore/utils/__init__.py +4 -2
  515. mindspore/utils/bin/dataset-cache +0 -0
  516. mindspore/utils/bin/dataset-cache-server +0 -0
  517. mindspore/utils/dryrun.py +138 -0
  518. mindspore/utils/runtime_execution_order_check.py +550 -0
  519. mindspore/version.py +1 -1
  520. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  521. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +524 -458
  522. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  523. mindspore/_data_dump.cpython-311-aarch64-linux-gnu.so +0 -0
  524. mindspore/bin/cache_admin +0 -0
  525. mindspore/bin/cache_server +0 -0
  526. mindspore/common/_tensor_overload.py +0 -139
  527. mindspore/lib/libmindspore_np_dtype.so +0 -0
  528. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  529. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  530. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  531. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  532. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  533. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  534. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  535. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  536. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  537. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  538. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  539. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  540. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  541. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  542. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  543. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  544. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  545. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -97
  546. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  547. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  548. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  549. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  550. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  551. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  552. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  553. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  554. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  555. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  556. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  557. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  558. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  559. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  560. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  561. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  562. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  563. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  564. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  565. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  566. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  567. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  568. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  569. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  570. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  571. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  572. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  573. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  574. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  575. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  576. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  577. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  578. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  579. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  580. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  581. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  582. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  583. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  584. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  585. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  586. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  587. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  588. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  589. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  590. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  591. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  592. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  593. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  594. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  595. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  596. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  597. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  598. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  599. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  600. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  601. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  602. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  603. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  604. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  605. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  606. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  607. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  608. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  609. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  610. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  611. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  612. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  613. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  614. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  615. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  616. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  617. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  618. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  619. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  620. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  621. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  622. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  623. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  624. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  625. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  626. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  627. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  628. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  629. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  630. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  631. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  632. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  633. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  634. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  635. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  636. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  637. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  638. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  639. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  640. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  641. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  642. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  643. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  644. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  645. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  646. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  647. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  648. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  649. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  650. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  651. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  652. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  653. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  654. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  655. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  656. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  657. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  658. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  659. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  660. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  661. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  662. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  663. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  664. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  665. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  666. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  667. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  668. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  669. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  670. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  671. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  672. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  673. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  674. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  685. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  686. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  687. mindspore/profiler/envprofiling.py +0 -254
  688. mindspore/profiler/profiling.py +0 -1926
  689. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  690. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -1,29 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_DIV_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_DIV_IMPL_H_
18
- #include "elewise_binary_impl.h"
19
- namespace mindspore {
20
- namespace internal {
21
- class DivImpl : public ElewiseBinaryImpl {
22
- public:
23
- DivImpl(const OpParamPtr &param) : ElewiseBinaryImpl(param) {}
24
- virtual ~DivImpl() {}
25
- int Launch() override;
26
- };
27
- } // namespace internal
28
- } // namespace mindspore
29
- #endif // MS_KERNELS_INTERNAL_KERNEL_DIV_IMPL_H_
@@ -1,48 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ELEWISE_BINARY_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_ELEWISE_BINARY_IMPL_H_
18
-
19
- #include <vector>
20
- #include "include/internal_kernel.h"
21
- #include "include/param/elewise_param.h"
22
-
23
- namespace mindspore {
24
- namespace internal {
25
- class ElewiseBinaryImpl : public InternelKernelImpl {
26
- public:
27
- ElewiseBinaryImpl(const OpParamPtr &param) : InternelKernelImpl(param) {}
28
- virtual ~ElewiseBinaryImpl() {}
29
- bool Init(const ValidateInfo &info) override;
30
- int Launch() { return -1; };
31
- int Tiling(HostRawBuf &tilingBuf) override;
32
- void SetStream(const void *stream_ptr) override;
33
- void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) override;
34
- uint64_t GetTilingBufSize() override;
35
- std::vector<uint64_t> GetWorkSpaceSize() override;
36
- int InferShape(const std::vector<DIMS> &input_shapes, std::vector<DIMS> &output_shapes) override;
37
- virtual int32_t GetMaxUbCount(uint32_t op_dtype);
38
- bool IsSupported() override;
39
-
40
- protected:
41
- void *stream_ptr_ = nullptr;
42
- uint8_t *device_tiling_ = nullptr;
43
- uint32_t aligned_factor_ = 128;
44
- uint32_t ub_dtype = 0;
45
- };
46
- } // namespace internal
47
- } // namespace mindspore
48
- #endif // MS_KERNELS_INTERNAL_KERNEL_ELEWISE_BINARY_IMPL_H_
@@ -1,25 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_ASCENDC_ELEWISE_BINARY_TILING_H_
17
- #define MS_KERNELS_INTERNAL_ASCENDC_ELEWISE_BINARY_TILING_H_
18
- #include "utils/elewise_tiling.h"
19
- namespace mindspore::internal {
20
- struct ElewiseBinaryTilingData : public ElewiseTailTilingData {
21
- uint32_t broadcast_mode_{0};
22
- uint32_t op_dtype_{0};
23
- };
24
- } // namespace mindspore::internal
25
- #endif // MS_KERNELS_INTERNAL_ASCENDC_ELEWISE_BINARY_TILING_H_
@@ -1,46 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_AND_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_AND_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = int16_t>
23
- class AndI16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline AndI16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::And); }
26
- };
27
-
28
- template <typename T = uint16_t>
29
- class AndU16 : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline AndU16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::And); }
32
- };
33
-
34
- extern "C" __global__ __aicore__ void and_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
35
- if (dtype == 6) { // int16
36
- AndI16<int16_t> op;
37
- op.InitBinary(x1, x2, y, tiling);
38
- op.ProcessBinary();
39
- } else if (dtype == 7) { // uint16
40
- AndU16<uint16_t> op;
41
- op.InitBinary(x1, x2, y, tiling);
42
- op.ProcessBinary();
43
- }
44
- }
45
-
46
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_AND_KERNEL_H_
@@ -1,46 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_DIV_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_DIV_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = half>
23
- class DivFp16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline DivFp16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Div); }
26
- };
27
-
28
- template <typename T = float>
29
- class DivFp32 : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline DivFp32() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Div); }
32
- };
33
-
34
- extern "C" __global__ __aicore__ void div_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
35
- if (dtype == 1) { // fp16
36
- DivFp16<half> op;
37
- op.InitBinary(x1, x2, y, tiling);
38
- op.ProcessBinary();
39
- } else if (dtype == 0) { // fp32
40
- DivFp32<float> op;
41
- op.InitBinary(x1, x2, y, tiling);
42
- op.ProcessBinary();
43
- }
44
- }
45
-
46
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_DIV_KERNEL_H_
@@ -1,260 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_BASE_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_BASE_H_
19
-
20
- #include "kernel_operator.h"
21
-
22
- using namespace AscendC;
23
-
24
- template <typename IN_TYPE>
25
- class ElewiseBaseWide {
26
- public:
27
- __aicore__ inline ElewiseBaseWide(){};
28
- __aicore__ inline void InitBinary(GM_ADDR in1, GM_ADDR in2, GM_ADDR out, GM_ADDR tiling) {
29
- gm_in1 = reinterpret_cast<__gm__ IN_TYPE *>(in1);
30
- gm_in2 = reinterpret_cast<__gm__ IN_TYPE *>(in2);
31
- gm_out = reinterpret_cast<__gm__ IN_TYPE *>(out);
32
- SetTilingInfo(tiling);
33
- }
34
-
35
- __aicore__ inline void ProcessBinary() {
36
- if (broadcast_mode == 0) {
37
- return BroadcastNone();
38
- } else if (broadcast_mode == 3) {
39
- return ScalarLeft();
40
- } else if (broadcast_mode == 4) {
41
- return ScalarRight();
42
- }
43
- }
44
- __aicore__ inline void SetBinaryFunc(void (*func)(const LocalTensor<IN_TYPE> &dstLocal,
45
- const LocalTensor<IN_TYPE> &src0Local,
46
- const LocalTensor<IN_TYPE> &src1Local, const int &calCount)) {
47
- elewise_binary_func_ = func;
48
- }
49
-
50
- private:
51
- __aicore__ inline void SetTilingInfo(GM_ADDR tiling) {
52
- core_idx = get_block_idx();
53
- core_num = get_block_num();
54
-
55
- avg_block_count = (uint32_t)(*((__gm__ uint32_t *)tiling + 0));
56
- avg_block_ub_num = (uint32_t)(*((__gm__ uint32_t *)tiling + 1));
57
- avg_block_ub_tail = (uint32_t)(*((__gm__ uint32_t *)tiling + 2));
58
- avg_block_ub_loop = (uint32_t)(*((__gm__ uint32_t *)tiling + 3));
59
- tail_block_count = (uint32_t)(*((__gm__ uint32_t *)tiling + 4));
60
- tail_block_ub_num = (uint32_t)(*((__gm__ uint32_t *)tiling + 5));
61
- tail_block_ub_tail = (uint32_t)(*((__gm__ uint32_t *)tiling + 6));
62
- tail_block_ub_loop = (uint32_t)(*((__gm__ uint32_t *)tiling + 7));
63
-
64
- buffer_num = (uint32_t)(*((__gm__ uint32_t *)tiling + 8));
65
- broadcast_mode = (uint32_t)(*((__gm__ uint32_t *)tiling + 10));
66
- }
67
- __aicore__ inline void SetUbParam(uint32_t &ub_count, uint32_t &ub_loop, uint32_t &ub_tail) {
68
- ub_count = avg_block_ub_num;
69
- ub_loop = avg_block_ub_loop;
70
- ub_tail = avg_block_ub_tail;
71
-
72
- if (core_idx == core_num - 1) {
73
- ub_count = tail_block_ub_num;
74
- ub_loop = tail_block_ub_loop;
75
- ub_tail = tail_block_ub_tail;
76
- }
77
- }
78
- __aicore__ inline void InitInOut(uint32_t count) {
79
- pipe.InitBuffer(in1Que, buffer_num, count * sizeof(IN_TYPE));
80
- pipe.InitBuffer(in2Que, buffer_num, count * sizeof(IN_TYPE));
81
- pipe.InitBuffer(outQue, buffer_num, count * sizeof(IN_TYPE));
82
- }
83
-
84
- __aicore__ inline void CopyOut(uint32_t idx, uint32_t stride, uint32_t count) {
85
- LocalTensor<IN_TYPE> out = outQue.DeQue<IN_TYPE>();
86
- DataCopy(outGm[idx * stride], out, count);
87
- outQue.FreeTensor(out);
88
- }
89
-
90
- __aicore__ inline void CopyIn1(uint32_t idx, uint32_t stride, uint32_t count) {
91
- LocalTensor<IN_TYPE> in1 = in1Que.AllocTensor<IN_TYPE>();
92
- DataCopy(in1, in1Gm[idx * stride], count);
93
- in1Que.EnQue(in1);
94
- }
95
-
96
- __aicore__ inline void CopyIn2(uint32_t idx, uint32_t stride, uint32_t count) {
97
- LocalTensor<IN_TYPE> in2 = in2Que.AllocTensor<IN_TYPE>();
98
- DataCopy(in2, in2Gm[idx * stride], count);
99
- in2Que.EnQue(in2);
100
- }
101
-
102
- __aicore__ inline void BroadcastNone() {
103
- uint32_t ub_count, ub_loop, ub_tail;
104
- SetUbParam(ub_count, ub_loop, ub_tail);
105
-
106
- in1Gm.SetGlobalBuffer(gm_in1 + core_idx * avg_block_count);
107
- in2Gm.SetGlobalBuffer(gm_in2 + core_idx * avg_block_count);
108
- outGm.SetGlobalBuffer(gm_out + core_idx * avg_block_count);
109
-
110
- InitInOut(ub_count);
111
-
112
- uint32_t loop = 0;
113
- for (; loop < ub_loop - 1; loop++) {
114
- CopyIn1(loop, ub_count, ub_count);
115
- CopyIn2(loop, ub_count, ub_count);
116
- ComputeNone(ub_count);
117
- CopyOut(loop, ub_count, ub_count);
118
- }
119
-
120
- /* for ub tail */
121
- if (ub_tail <= 0) {
122
- return;
123
- }
124
- CopyIn1(loop, ub_count, ub_count);
125
- CopyIn2(loop, ub_count, ub_tail);
126
- ComputeNone(ub_tail);
127
- CopyOut(loop, ub_count, ub_tail);
128
- }
129
- __aicore__ inline void ScalarLeft() {
130
- uint32_t ub_count, ub_loop, ub_tail;
131
- SetUbParam(ub_count, ub_loop, ub_tail);
132
-
133
- in1Gm.SetGlobalBuffer(gm_in1);
134
- in2Gm.SetGlobalBuffer(gm_in2 + core_idx * avg_block_count);
135
- outGm.SetGlobalBuffer(gm_out + core_idx * avg_block_count);
136
-
137
- InitInOut(ub_count);
138
-
139
- /* input tensor init once */
140
- LocalTensor<IN_TYPE> scalar_t = in1Que.AllocTensor<IN_TYPE>();
141
- IN_TYPE scalar_value = in1Gm.GetValue(0);
142
- Duplicate(scalar_t, scalar_value, ub_count);
143
- pipe_barrier(PIPE_ALL);
144
-
145
- uint32_t loop = 0;
146
- for (; loop < ub_loop - 1; loop++) {
147
- CopyIn2(loop, ub_count, ub_count);
148
- ComputeLeft(ub_count, scalar_t);
149
- CopyOut(loop, ub_count, ub_count);
150
- }
151
-
152
- /* for ub tail */
153
- if (ub_tail <= 0) {
154
- return;
155
- }
156
- CopyIn2(loop, ub_count, ub_tail);
157
- ComputeLeft(ub_tail, scalar_t);
158
- CopyOut(loop, ub_count, ub_tail);
159
-
160
- /* free*/
161
- in1Que.FreeTensor(scalar_t);
162
- }
163
- __aicore__ inline void ScalarRight() {
164
- uint32_t ub_count, ub_loop, ub_tail;
165
- SetUbParam(ub_count, ub_loop, ub_tail);
166
-
167
- in1Gm.SetGlobalBuffer(gm_in1 + core_idx * avg_block_count);
168
- in2Gm.SetGlobalBuffer(gm_in2);
169
- outGm.SetGlobalBuffer(gm_out + core_idx * avg_block_count);
170
-
171
- InitInOut(ub_count);
172
-
173
- /* input tensor init once */
174
- LocalTensor<IN_TYPE> scalar_t = in2Que.AllocTensor<IN_TYPE>();
175
- IN_TYPE scalar_value = in2Gm.GetValue(0);
176
- Duplicate(scalar_t, scalar_value, ub_count);
177
- pipe_barrier(PIPE_ALL);
178
-
179
- uint32_t loop = 0;
180
- for (; loop < ub_loop - 1; loop++) {
181
- CopyIn1(loop, ub_count, ub_count);
182
- ComputeRight(ub_count, scalar_t);
183
- CopyOut(loop, ub_count, ub_count);
184
- }
185
-
186
- /* for ub tail */
187
- if (ub_tail <= 0) {
188
- return;
189
- }
190
- CopyIn1(loop, ub_count, ub_tail);
191
- ComputeRight(ub_tail, scalar_t);
192
- CopyOut(loop, ub_count, ub_tail);
193
-
194
- /* free*/
195
- in2Que.FreeTensor(scalar_t);
196
- }
197
-
198
- __aicore__ inline void ComputeLeft(uint32_t count, LocalTensor<IN_TYPE> &scalar_t) {
199
- LocalTensor<IN_TYPE> in2 = in2Que.DeQue<IN_TYPE>();
200
- LocalTensor<IN_TYPE> out = outQue.AllocTensor<IN_TYPE>();
201
- elewise_binary_func_(out, scalar_t, in2, count);
202
- in2Que.FreeTensor(in2);
203
- pipe_barrier(PIPE_ALL);
204
- outQue.EnQue(out);
205
- }
206
-
207
- __aicore__ inline void ComputeRight(uint32_t count, LocalTensor<IN_TYPE> &scalar_t) {
208
- LocalTensor<IN_TYPE> in1 = in1Que.DeQue<IN_TYPE>();
209
- LocalTensor<IN_TYPE> out = outQue.AllocTensor<IN_TYPE>();
210
- elewise_binary_func_(out, in1, scalar_t, count);
211
- in1Que.FreeTensor(in1);
212
- pipe_barrier(PIPE_ALL);
213
- outQue.EnQue(out);
214
- }
215
-
216
- __aicore__ inline void ComputeNone(uint32_t count) {
217
- LocalTensor<IN_TYPE> in1 = in1Que.DeQue<IN_TYPE>();
218
- LocalTensor<IN_TYPE> in2 = in2Que.DeQue<IN_TYPE>();
219
- LocalTensor<IN_TYPE> out = outQue.AllocTensor<IN_TYPE>();
220
- elewise_binary_func_(out, in1, in2, count);
221
- in1Que.FreeTensor(in1);
222
- in2Que.FreeTensor(in2);
223
- pipe_barrier(PIPE_ALL);
224
- outQue.EnQue(out);
225
- }
226
-
227
- private:
228
- void (*elewise_binary_func_)(const LocalTensor<IN_TYPE> &dstLocal, const LocalTensor<IN_TYPE> &src0Local,
229
- const LocalTensor<IN_TYPE> &src1Local, const int &calCount);
230
-
231
- TPipe pipe;
232
- TQue<AscendC::QuePosition::VECIN, 1> in1Que;
233
- TQue<AscendC::QuePosition::VECIN, 1> in2Que;
234
- TQue<AscendC::QuePosition::VECOUT, 1> outQue;
235
-
236
- __gm__ IN_TYPE *__restrict__ gm_in1{nullptr};
237
- __gm__ IN_TYPE *__restrict__ gm_in2{nullptr};
238
- __gm__ IN_TYPE *__restrict__ gm_out{nullptr};
239
-
240
- GlobalTensor<IN_TYPE> in1Gm;
241
- GlobalTensor<IN_TYPE> in2Gm;
242
- GlobalTensor<IN_TYPE> outGm;
243
-
244
- uint32_t core_idx{0};
245
- uint32_t core_num{0};
246
- uint32_t buffer_num{0};
247
- uint32_t broadcast_mode{0};
248
-
249
- uint32_t avg_block_count{0};
250
- uint32_t avg_block_ub_num{0};
251
- uint32_t avg_block_ub_tail{0};
252
- uint32_t avg_block_ub_loop{0};
253
-
254
- uint32_t tail_block_count{0};
255
- uint32_t tail_block_ub_num{0};
256
- uint32_t tail_block_ub_tail{0};
257
- uint32_t tail_block_ub_loop{0};
258
- };
259
-
260
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_BASE_H_
@@ -1,35 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_ELEWISE_BINARY_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_ELEWISE_BINARY_KERNEL_H_
19
-
20
- void elewise_sub(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
21
- uint8_t *tiling, int dtype);
22
- void elewise_mul(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
23
- uint8_t *tiling, int dtype);
24
- void elewise_div(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
25
- uint8_t *tiling, int dtype);
26
- void elewise_min(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
27
- uint8_t *tiling, int dtype);
28
- void elewise_max(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
29
- uint8_t *tiling, int dtype);
30
- void elewise_and(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
31
- uint8_t *tiling, int dtype);
32
- void elewise_or(uint32_t blockDim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out,
33
- uint8_t *tiling, int dtype);
34
-
35
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_ELEWISE_BINARY_KERNEL_H_
@@ -1,66 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MAX_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MAX_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = int16_t>
23
- class MaxI16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline MaxI16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
26
- };
27
-
28
- template <typename T = int32_t>
29
- class MaxInt : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline MaxInt() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
32
- };
33
-
34
- template <typename T = half>
35
- class MaxFp16 : public ElewiseBaseWide<T> {
36
- public:
37
- __aicore__ inline MaxFp16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
38
- };
39
-
40
- template <typename T = float>
41
- class MaxFp32 : public ElewiseBaseWide<T> {
42
- public:
43
- __aicore__ inline MaxFp32() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Max); }
44
- };
45
-
46
- extern "C" __global__ __aicore__ void max_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
47
- if (dtype == 3) { // int32
48
- MaxInt<int32_t> op;
49
- op.InitBinary(x1, x2, y, tiling);
50
- op.ProcessBinary();
51
- } else if (dtype == 1) { // fp16
52
- MaxFp16<half> op;
53
- op.InitBinary(x1, x2, y, tiling);
54
- op.ProcessBinary();
55
- } else if (dtype == 0) { // fp32
56
- MaxFp32<float> op;
57
- op.InitBinary(x1, x2, y, tiling);
58
- op.ProcessBinary();
59
- } else if (dtype == 6) { // int16
60
- MaxI16<int16_t> op;
61
- op.InitBinary(x1, x2, y, tiling);
62
- op.ProcessBinary();
63
- }
64
- }
65
-
66
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MAX_KERNEL_H_
@@ -1,66 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MIN_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MIN_KERNEL_H_
19
-
20
- #include "elewise_binary_base.h"
21
-
22
- template <typename T = int16_t>
23
- class MinI16 : public ElewiseBaseWide<T> {
24
- public:
25
- __aicore__ inline MinI16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
26
- };
27
-
28
- template <typename T = int32_t>
29
- class MinInt : public ElewiseBaseWide<T> {
30
- public:
31
- __aicore__ inline MinInt() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
32
- };
33
-
34
- template <typename T = half>
35
- class MinFp16 : public ElewiseBaseWide<T> {
36
- public:
37
- __aicore__ inline MinFp16() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
38
- };
39
-
40
- template <typename T = float>
41
- class MinFp32 : public ElewiseBaseWide<T> {
42
- public:
43
- __aicore__ inline MinFp32() { ElewiseBaseWide<T>::SetBinaryFunc(AscendC::Min); }
44
- };
45
-
46
- extern "C" __global__ __aicore__ void min_device_legacy(GM_ADDR x1, GM_ADDR x2, GM_ADDR y, GM_ADDR tiling, int32_t dtype) {
47
- if (dtype == 3) { // int32
48
- MinInt<int32_t> op;
49
- op.InitBinary(x1, x2, y, tiling);
50
- op.ProcessBinary();
51
- } else if (dtype == 1) { // fp16
52
- MinFp16<half> op;
53
- op.InitBinary(x1, x2, y, tiling);
54
- op.ProcessBinary();
55
- } else if (dtype == 0) { // fp32
56
- MinFp32<float> op;
57
- op.InitBinary(x1, x2, y, tiling);
58
- op.ProcessBinary();
59
- } else if (dtype == 6) { // int16
60
- MinI16<int16_t> op;
61
- op.InitBinary(x1, x2, y, tiling);
62
- op.ProcessBinary();
63
- }
64
- }
65
-
66
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ELEWISE_BINARY_MIN_KERNEL_H_