mindspore 2.4.10__cp311-cp311-manylinux1_x86_64.whl → 2.5.0__cp311-cp311-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (706):
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-311-x86_64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-311-x86_64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-311-x86_64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +98 -21
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -3
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +31 -15
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +5 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +285 -191
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +1 -0
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  80. mindspore/experimental/llm_boost/register.py +1 -0
  81. mindspore/experimental/optim/adadelta.py +26 -22
  82. mindspore/experimental/optim/adam.py +3 -0
  83. mindspore/experimental/optim/lr_scheduler.py +33 -24
  84. mindspore/experimental/optim/radam.py +33 -30
  85. mindspore/hal/device.py +28 -0
  86. mindspore/hal/event.py +17 -0
  87. mindspore/hal/memory.py +94 -3
  88. mindspore/hal/stream.py +91 -6
  89. mindspore/include/api/context.h +0 -1
  90. mindspore/lib/libavcodec.so.59 +0 -0
  91. mindspore/lib/libavdevice.so.59 +0 -0
  92. mindspore/lib/libavfilter.so.8 +0 -0
  93. mindspore/lib/libavformat.so.59 +0 -0
  94. mindspore/lib/libavutil.so.57 +0 -0
  95. mindspore/lib/libdnnl.so.2 +0 -0
  96. mindspore/lib/libicuuc.so.69 +0 -0
  97. mindspore/lib/libmindspore_backend.so +0 -0
  98. mindspore/lib/libmindspore_common.so +0 -0
  99. mindspore/lib/libmindspore_core.so +0 -0
  100. mindspore/lib/libmindspore_glog.so.0 +0 -0
  101. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  102. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  103. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  104. mindspore/lib/libmindspore_ops.so +0 -0
  105. mindspore/lib/libmpi_adapter.so +0 -0
  106. mindspore/lib/libmpi_collective.so +0 -0
  107. mindspore/lib/libnnacl.so +0 -0
  108. mindspore/lib/libopencv_core.so.4.5 +0 -0
  109. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  110. mindspore/lib/libps_cache.so +0 -0
  111. mindspore/lib/libswresample.so.4 +0 -0
  112. mindspore/lib/libswscale.so.6 +0 -0
  113. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  114. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  115. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  116. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  117. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/decoder_kv_cache.py +1 -1
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/prompt_kv_cache.py +1 -1
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/libcust_opmaster_rt2.0.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  121. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/x86_64/libcust_opsproto_rt2.0.so +0 -0
  122. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -1
  123. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/lib/libcust_opapi.so +0 -0
  124. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +224 -0
  125. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/all_finite.py +1 -1
  126. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +1 -1
  127. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +1 -1
  128. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  166. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  167. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/libcust_opmaster_rt2.0.so +0 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  172. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/x86_64/libcust_opsproto_rt2.0.so +0 -0
  173. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -1
  174. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  175. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  176. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  177. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  178. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  179. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  180. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  181. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  182. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +960 -958
  183. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  184. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  185. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  186. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  187. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  188. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  189. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  190. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  191. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  192. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  193. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  194. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  195. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  196. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  197. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  198. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  199. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  200. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  201. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  202. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  203. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  204. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  205. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  206. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  207. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  208. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  209. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  210. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  211. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  212. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  213. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  214. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  215. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  216. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  217. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  218. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  219. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  220. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  221. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  222. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  223. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  224. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  225. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  226. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  227. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  228. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  229. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  230. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  231. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  232. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  233. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  234. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  235. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  236. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  237. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  238. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  239. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  240. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  241. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  242. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  243. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  244. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  245. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  246. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  247. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  248. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  249. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  250. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so +0 -0
  251. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  252. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  253. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  254. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  255. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  256. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  257. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  258. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  259. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  260. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  261. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  262. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  263. mindspore/lib/plugin/gpu/libcuda_ops.so.10 +0 -0
  264. mindspore/lib/plugin/gpu/libcuda_ops.so.11 +0 -0
  265. mindspore/lib/plugin/gpu10.1/libnccl.so.2 +0 -0
  266. mindspore/lib/plugin/gpu10.1/libnvidia_collective.so +0 -0
  267. mindspore/lib/plugin/gpu11.1/libnccl.so.2 +0 -0
  268. mindspore/lib/plugin/gpu11.1/libnvidia_collective.so +0 -0
  269. mindspore/lib/plugin/gpu11.6/libnccl.so.2 +0 -0
  270. mindspore/lib/plugin/gpu11.6/libnvidia_collective.so +0 -0
  271. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  272. mindspore/lib/plugin/libmindspore_gpu.so.10.1 +0 -0
  273. mindspore/lib/plugin/libmindspore_gpu.so.11.1 +0 -0
  274. mindspore/lib/plugin/libmindspore_gpu.so.11.6 +0 -0
  275. mindspore/log.py +12 -0
  276. mindspore/mindrecord/__init__.py +1 -1
  277. mindspore/mindrecord/config.py +17 -316
  278. mindspore/mindrecord/filereader.py +1 -9
  279. mindspore/mindrecord/filewriter.py +5 -15
  280. mindspore/mindrecord/mindpage.py +1 -9
  281. mindspore/mint/__init__.py +824 -218
  282. mindspore/mint/distributed/__init__.py +66 -4
  283. mindspore/mint/distributed/distributed.py +2594 -44
  284. mindspore/mint/linalg/__init__.py +6 -0
  285. mindspore/mint/nn/__init__.py +473 -14
  286. mindspore/mint/nn/functional.py +486 -11
  287. mindspore/mint/nn/layer/__init__.py +17 -4
  288. mindspore/mint/nn/layer/_functions.py +330 -0
  289. mindspore/mint/nn/layer/activation.py +169 -1
  290. mindspore/mint/nn/layer/basic.py +123 -0
  291. mindspore/mint/nn/layer/conv.py +727 -0
  292. mindspore/mint/nn/layer/normalization.py +215 -19
  293. mindspore/mint/nn/layer/padding.py +797 -0
  294. mindspore/mint/nn/layer/pooling.py +170 -0
  295. mindspore/mint/optim/__init__.py +2 -1
  296. mindspore/mint/optim/adam.py +223 -0
  297. mindspore/mint/optim/adamw.py +26 -19
  298. mindspore/mint/special/__init__.py +2 -1
  299. mindspore/multiprocessing/__init__.py +5 -0
  300. mindspore/nn/cell.py +126 -19
  301. mindspore/nn/dynamic_lr.py +2 -1
  302. mindspore/nn/layer/activation.py +6 -6
  303. mindspore/nn/layer/basic.py +35 -25
  304. mindspore/nn/layer/channel_shuffle.py +3 -3
  305. mindspore/nn/layer/embedding.py +3 -3
  306. mindspore/nn/layer/normalization.py +8 -7
  307. mindspore/nn/layer/padding.py +4 -3
  308. mindspore/nn/layer/pooling.py +47 -13
  309. mindspore/nn/layer/rnn_cells.py +1 -1
  310. mindspore/nn/layer/rnns.py +2 -1
  311. mindspore/nn/layer/timedistributed.py +5 -5
  312. mindspore/nn/layer/transformer.py +48 -26
  313. mindspore/nn/learning_rate_schedule.py +5 -3
  314. mindspore/nn/loss/loss.py +31 -36
  315. mindspore/nn/optim/ada_grad.py +1 -0
  316. mindspore/nn/optim/adadelta.py +2 -2
  317. mindspore/nn/optim/adam.py +1 -1
  318. mindspore/nn/optim/lars.py +1 -4
  319. mindspore/nn/optim/optimizer.py +1 -1
  320. mindspore/nn/optim/rprop.py +2 -2
  321. mindspore/nn/optim/thor.py +2 -1
  322. mindspore/nn/utils/init.py +13 -11
  323. mindspore/nn/wrap/cell_wrapper.py +4 -6
  324. mindspore/nn/wrap/loss_scale.py +3 -4
  325. mindspore/numpy/array_creations.py +60 -62
  326. mindspore/numpy/array_ops.py +148 -143
  327. mindspore/numpy/logic_ops.py +41 -42
  328. mindspore/numpy/math_ops.py +361 -359
  329. mindspore/numpy/utils.py +16 -16
  330. mindspore/numpy/utils_const.py +4 -4
  331. mindspore/ops/__init__.py +2 -1
  332. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  333. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  334. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  335. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  336. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  337. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  338. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  339. mindspore/ops/_vmap/vmap_base.py +0 -2
  340. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  341. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  342. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  343. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  344. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  345. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  346. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  347. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  348. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  349. mindspore/ops/composite/base.py +1 -1
  350. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  351. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  352. mindspore/ops/function/__init__.py +12 -0
  353. mindspore/ops/function/array_func.py +561 -159
  354. mindspore/ops/function/clip_func.py +64 -0
  355. mindspore/ops/function/debug_func.py +28 -20
  356. mindspore/ops/function/image_func.py +1 -1
  357. mindspore/ops/function/linalg_func.py +5 -4
  358. mindspore/ops/function/math_func.py +1659 -290
  359. mindspore/ops/function/nn_func.py +988 -317
  360. mindspore/ops/function/parameter_func.py +3 -56
  361. mindspore/ops/function/random_func.py +243 -33
  362. mindspore/ops/function/sparse_unary_func.py +1 -1
  363. mindspore/ops/functional.py +18 -5
  364. mindspore/ops/functional_overload.py +897 -0
  365. mindspore/ops/operations/__init__.py +3 -2
  366. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  367. mindspore/ops/operations/_grad_ops.py +2 -34
  368. mindspore/ops/operations/_infer_ops.py +2 -1
  369. mindspore/ops/operations/_inner_ops.py +38 -8
  370. mindspore/ops/operations/array_ops.py +45 -303
  371. mindspore/ops/operations/comm_ops.py +19 -16
  372. mindspore/ops/operations/custom_ops.py +11 -55
  373. mindspore/ops/operations/debug_ops.py +42 -47
  374. mindspore/ops/operations/inner_ops.py +6 -4
  375. mindspore/ops/operations/linalg_ops.py +3 -2
  376. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  377. mindspore/ops/operations/math_ops.py +11 -216
  378. mindspore/ops/operations/nn_ops.py +146 -308
  379. mindspore/ops/primitive.py +23 -21
  380. mindspore/ops/tensor_method.py +1669 -0
  381. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  382. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  383. mindspore/ops_generate/arg_handler.py +0 -61
  384. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  385. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  386. mindspore/ops_generate/base_generator.py +11 -0
  387. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  388. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  389. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  390. mindspore/ops_generate/functions_cc_generator.py +233 -0
  391. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  392. mindspore/ops_generate/gen_constants.py +157 -3
  393. mindspore/ops_generate/gen_ops.py +245 -990
  394. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  395. mindspore/ops_generate/gen_utils.py +119 -33
  396. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  397. mindspore/ops_generate/op_api_proto.py +206 -0
  398. mindspore/ops_generate/op_def_py_generator.py +131 -0
  399. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  400. mindspore/ops_generate/op_proto.py +373 -108
  401. mindspore/ops_generate/op_template_parser.py +436 -0
  402. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  403. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  404. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  405. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  406. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  407. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  408. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  409. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  410. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  411. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  412. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  413. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  414. mindspore/ops_generate/pyboost_utils.py +92 -33
  415. mindspore/ops_generate/template.py +294 -44
  416. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  417. mindspore/parallel/__init__.py +3 -3
  418. mindspore/parallel/_auto_parallel_context.py +24 -33
  419. mindspore/parallel/_parallel_serialization.py +13 -2
  420. mindspore/parallel/_utils.py +4 -1
  421. mindspore/parallel/algo_parameter_config.py +1 -1
  422. mindspore/parallel/checkpoint_transform.py +44 -0
  423. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  424. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  425. mindspore/parallel/cluster/run.py +20 -3
  426. mindspore/parallel/parameter_broadcast.py +1 -1
  427. mindspore/parallel/shard.py +3 -0
  428. mindspore/parallel/transform_safetensors.py +119 -253
  429. mindspore/profiler/__init__.py +17 -4
  430. mindspore/profiler/analysis/__init__.py +0 -0
  431. mindspore/profiler/analysis/parser/__init__.py +0 -0
  432. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  433. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  434. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  435. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  436. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  437. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  438. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  439. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  440. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  441. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  442. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  443. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  444. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  445. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  446. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  447. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  448. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  449. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  450. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  451. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  452. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  453. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  454. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  455. mindspore/profiler/analysis/task_manager.py +131 -0
  456. mindspore/profiler/analysis/time_converter.py +84 -0
  457. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  458. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  459. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  460. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  461. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  462. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  463. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  464. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  465. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  466. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  467. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  468. mindspore/profiler/analysis/work_flow.py +73 -0
  469. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  470. mindspore/profiler/common/command_executor.py +90 -0
  471. mindspore/profiler/common/constant.py +174 -3
  472. mindspore/profiler/common/file_manager.py +208 -0
  473. mindspore/profiler/common/log.py +130 -0
  474. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  475. mindspore/profiler/common/path_manager.py +371 -0
  476. mindspore/profiler/common/process_bar.py +168 -0
  477. mindspore/profiler/common/process_pool.py +9 -3
  478. mindspore/profiler/common/profiler_context.py +476 -0
  479. mindspore/profiler/common/profiler_info.py +304 -0
  480. mindspore/profiler/common/profiler_output_path.py +284 -0
  481. mindspore/profiler/common/profiler_parameters.py +210 -0
  482. mindspore/profiler/common/profiler_path_manager.py +120 -0
  483. mindspore/profiler/common/record_function.py +76 -0
  484. mindspore/profiler/common/tlv_decoder.py +76 -0
  485. mindspore/profiler/common/util.py +75 -2
  486. mindspore/profiler/dynamic_profiler.py +270 -37
  487. mindspore/profiler/envprofiler.py +138 -0
  488. mindspore/profiler/mstx.py +199 -0
  489. mindspore/profiler/platform/__init__.py +21 -0
  490. mindspore/profiler/platform/base_profiler.py +40 -0
  491. mindspore/profiler/platform/cpu_profiler.py +124 -0
  492. mindspore/profiler/platform/gpu_profiler.py +74 -0
  493. mindspore/profiler/platform/npu_profiler.py +309 -0
  494. mindspore/profiler/profiler.py +580 -93
  495. mindspore/profiler/profiler_action_controller.py +187 -0
  496. mindspore/profiler/profiler_interface.py +114 -0
  497. mindspore/profiler/schedule.py +208 -0
  498. mindspore/rewrite/api/symbol_tree.py +1 -2
  499. mindspore/run_check/_check_version.py +2 -6
  500. mindspore/runtime/__init__.py +37 -0
  501. mindspore/runtime/device.py +27 -0
  502. mindspore/runtime/event.py +209 -0
  503. mindspore/runtime/executor.py +148 -0
  504. mindspore/runtime/memory.py +392 -0
  505. mindspore/runtime/stream.py +460 -0
  506. mindspore/runtime/thread_bind_core.py +401 -0
  507. mindspore/train/__init__.py +2 -2
  508. mindspore/train/_utils.py +53 -18
  509. mindspore/train/amp.py +8 -4
  510. mindspore/train/callback/_checkpoint.py +32 -18
  511. mindspore/train/callback/_early_stop.py +1 -1
  512. mindspore/train/callback/_flops_collector.py +105 -69
  513. mindspore/train/callback/_history.py +1 -1
  514. mindspore/train/callback/_summary_collector.py +44 -6
  515. mindspore/train/callback/_tft_register.py +31 -10
  516. mindspore/train/dataset_helper.py +11 -11
  517. mindspore/train/metrics/precision.py +4 -5
  518. mindspore/train/mind_ir_pb2.py +167 -46
  519. mindspore/train/model.py +13 -15
  520. mindspore/train/serialization.py +462 -76
  521. mindspore/train/summary/summary_record.py +1 -2
  522. mindspore/train/train_thor/model_thor.py +1 -1
  523. mindspore/utils/__init__.py +4 -2
  524. mindspore/utils/bin/dataset-cache +0 -0
  525. mindspore/utils/bin/dataset-cache-server +0 -0
  526. mindspore/utils/dryrun.py +138 -0
  527. mindspore/utils/runtime_execution_order_check.py +550 -0
  528. mindspore/version.py +1 -1
  529. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  530. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +533 -467
  531. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  532. mindspore/_data_dump.cpython-311-x86_64-linux-gnu.so +0 -0
  533. mindspore/bin/cache_admin +0 -0
  534. mindspore/bin/cache_server +0 -0
  535. mindspore/common/_tensor_overload.py +0 -139
  536. mindspore/lib/libmindspore_np_dtype.so +0 -0
  537. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  538. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  539. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  540. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  541. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  542. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  543. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  544. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  545. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  546. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  547. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  548. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  549. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  550. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  551. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  552. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  553. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  554. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -97
  555. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  556. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  557. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  558. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  559. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  560. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  561. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  562. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  563. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  564. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  565. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  566. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  567. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  568. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  569. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  570. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  571. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  572. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  573. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  574. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  575. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  576. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  577. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  578. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  579. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  580. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  581. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  582. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  583. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  584. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  585. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  586. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  587. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  588. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  589. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  590. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  591. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  592. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  593. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  594. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  595. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  596. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  597. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  598. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  599. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  600. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  601. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  602. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  603. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  604. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  605. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  606. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  607. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  608. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  609. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  610. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  611. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  612. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  613. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  614. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  615. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  616. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  617. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  618. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  619. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  620. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  621. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  622. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  623. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  624. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  625. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  626. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  627. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  628. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  629. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  630. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  631. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  632. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  633. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  634. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  635. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  636. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  637. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  638. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  639. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  640. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  641. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  642. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  643. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  644. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  645. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  646. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  647. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  648. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  649. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  650. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  651. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  652. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  653. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  654. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  655. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  656. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  657. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  658. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  659. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  660. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  661. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  662. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  663. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  664. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  665. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  666. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  667. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  668. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  669. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  670. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  671. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_impl.so +0 -0
  672. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  673. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  674. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  685. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  686. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  687. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  688. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  689. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  690. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  691. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  692. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  693. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  694. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  695. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  696. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  697. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  698. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  699. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  700. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  701. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  702. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  703. mindspore/profiler/envprofiling.py +0 -254
  704. mindspore/profiler/profiling.py +0 -1926
  705. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  706. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -1,5 +1,5 @@
1
1
  /**
2
- * Copyright 2023-2024 Huawei Technologies Co., Ltd
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
3
  *
4
4
  * Licensed under the Apache License, Version 2.0 (the "License");
5
5
  * you may not use this file except in compliance with the License.
@@ -13,127 +13,172 @@
13
13
  * See the License for the specific language governing permissions and
14
14
  * limitations under the License.
15
15
  */
16
- #ifndef MS_KERNELS_INTERNAL_OP_PARAM_H_
17
- #define MS_KERNELS_INTERNAL_OP_PARAM_H_
18
- #include "asdops/op_desc.h"
19
- #include "asdops/params/matmul.h"
20
- #include "asdops/params/mix.h"
21
- #include "asdops/params/slice.h"
22
- #include "asdops/params/gather.h"
23
- #include "asdops/params/elewise.h"
24
- #include "asdops/params/activation.h"
25
- #include "asdops/params/concat.h"
26
- #include "asdops/params/transpose.h"
27
- #include "asdops/params/norm.h"
28
- #include "asdops/params/softmax.h"
29
- #include "asdops/params/split.h"
30
- #include "asdops/params/expand.h"
31
- #include "asdops/params/fill.h"
32
- #include "asdops/params/reduce.h"
33
- #include "asdops/params/sort.h"
34
- #include "asdops/params/transdata.h"
35
- #include <memory>
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_OP_PARAM_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_OP_PARAM_H_
19
+
20
+ #include <stdint.h>
36
21
  #include <vector>
37
- #include "ms_int_types.h"
22
+
38
23
  namespace mindspore {
39
24
  namespace internal {
40
- struct DtypesParam {
41
- int op_id_ = 0;
42
- std::vector<int64_t> in_dtypes_;
43
- std::vector<int64_t> out_dtypes_;
25
+ // matmul fused op
26
+ constexpr auto kInternalMatMulOpName = "MatMul";
27
+ constexpr auto kInternalMultiWeightMatmulOpName = "MultiWeightMatmul";
28
+ constexpr auto kInternalMatMulAddRmsNormOpName = "MatMulAddRmsNorm";
29
+ // attention fused op
30
+ constexpr auto kInternalFlashAttentionScoreOpName = "FlashAttentionScore";
31
+ constexpr auto kInternalPagedAttentionOpName = "PagedAttention";
32
+ constexpr auto kInternalReshapeAndCacheOpName = "ReshapeAndCache";
33
+ constexpr auto kInternalReshapeAndCacheNzOpName = "ReshapeAndCacheNz";
34
+ constexpr auto kInternalApplyRotaryPosEmbOpName = "ApplyRotaryPosEmb";
35
+ constexpr auto kInternalApplyRotaryPosEmbNzOpName = "ApplyRotaryPosEmbNz";
36
+ // norm fused op
37
+ constexpr auto kInternalAddLayerNormOpName = "AddLayerNorm";
38
+ constexpr auto kInternalRmsNormOpName = "RmsNorm";
39
+ constexpr auto kInternalAddRmsNormOpName = "AddRmsNorm";
40
+ constexpr auto kInternalRmsNormQuantOpName = "RmsNormQuant";
41
+ constexpr auto kInternalAddRmsNormQuantOpName = "AddRmsNormQuantV2";
42
+ constexpr auto kInternalAddRmsNormDynamicQuantOpName = "AddRmsNormDynamicQuant";
43
+ // activation
44
+ constexpr auto kInternalReluOpName = "Relu";
45
+ constexpr auto kInternalGeLUOpName = "GeLU";
46
+ constexpr auto kInternalFastGeLUOpName = "FastGeLU";
47
+ constexpr auto kInternalSwishOpName = "Swish";
48
+ constexpr auto kInternalSwiGLUOpName = "SwiGLU";
49
+ // elewise unary
50
+ constexpr auto kInternalCastOpName = "Cast";
51
+ constexpr auto kInternalExpOpName = "Exp";
52
+ constexpr auto kInternalLnOpName = "Ln";
53
+ constexpr auto kInternalRsqrtOpName = "Rsqrt";
54
+ constexpr auto kInternalSqrtOpName = "Sqrt";
55
+ constexpr auto kInternalAbsOpName = "Abs";
56
+ constexpr auto kInternalReciprocalOpName = "Reciprocal";
57
+ // elewise binary
58
+ constexpr auto kInternalAddOpName = "Add";
59
+ constexpr auto kInternalSubOpName = "Sub";
60
+ constexpr auto kInternalMulOpName = "Mul";
61
+ constexpr auto kInternalDivOpName = "Div";
62
+ constexpr auto kInternalRealDivOpName = "RealDiv";
63
+ constexpr auto kInternalMaxOpName = "Max";
64
+ constexpr auto kInternalMinOpName = "Min";
65
+ constexpr auto kInternalNotOpName = "Not";
66
+ constexpr auto kInternalOrOpName = "Or";
67
+ constexpr auto kInternalAndOpName = "And";
68
+ constexpr auto kInternalEqualOpName = "Equal";
69
+ constexpr auto kInternalNotEqualOpName = "NotEqual";
70
+ constexpr auto kInternalLessOpName = "Less";
71
+ constexpr auto kInternalLessEqualOpName = "LessEqual";
72
+ constexpr auto kInternalGreaterOpName = "Greater";
73
+ constexpr auto kInternalGreaterEqualOpName = "GreaterEqual";
74
+ constexpr auto kInternalLogicalNotOpName = "LogicalNot";
75
+ // others
76
+ constexpr auto kInternalGatherOpName = "Gather";
77
+ constexpr auto kInternalTransposeOpName = "Transpose";
78
+ constexpr auto kInternalTransDataOpName = "TransData";
79
+ constexpr auto kInternalQuantPerChannelOpName = "QuantPerChannel";
80
+ constexpr auto kInternalSoftmaxOpName = "Softmax";
81
+ constexpr auto kInternalReduceSumOpName = "ReduceSum";
82
+ constexpr auto kInternalQuantLinearSparseOpName = "QuantLinearSparse";
83
+
84
+ struct AxesParam {
85
+ std::vector<int64_t> axes;
86
+ };
87
+
88
+ using TransposeParam = AxesParam;
89
+ using SoftmaxParam = AxesParam;
90
+ using ReduceSumParam = AxesParam;
91
+
92
+ struct GatherParam {
93
+ int64_t batch_dims;
94
+ std::vector<int64_t> axes;
95
+ };
96
+
97
+ struct SwiGLUParam {
98
+ int64_t axis;
99
+ };
100
+
101
+ struct MatmulParam {
102
+ bool transpose_a{false};
103
+ bool transpose_b{false};
104
+ bool enable_dequant{false};
105
+ bool with_relu{false};
106
+ bool with_gelu{false};
107
+ bool with_fastgelu{false};
108
+ bool with_bias{false};
109
+ bool with_bias_fastgelu{false};
110
+ bool enable_shuffle{false};
111
+ uint32_t tilingN = 0; // 压缩算法透传参数, 单压缩块 n 方向的基块数
112
+ uint32_t tilingK = 0; // 压缩算法透传参数, 单压缩块 k 方向的基块数
44
113
  };
45
- struct OpParam : public AsdOps::OpDesc {
46
- int dtype_ = 0;
47
- std::vector<int64_t> in_dtypes_;
48
- std::vector<int64_t> out_dtypes_;
49
- std::string op_fullname_;
114
+
115
+ struct MatmulAddRmsNormParam {
116
+ bool transpose_a{false};
117
+ bool transpose_b{false};
118
+ float eps{1e-6};
50
119
  };
51
- enum OpId : int {
52
- MatMul,
53
- ReshapeAndCache,
54
- ReshapeAndCacheNz,
55
- Slice,
56
- Gather,
57
- ApplyRotaryPosEmb,
58
- ApplyRotaryPosEmbNz,
59
- Add,
60
- Sub,
61
- Exp,
62
- Relu,
63
- FlashAttentionScore,
64
- PagedAttention,
65
- Cast,
66
- Gelu,
67
- Transpose,
68
- Equal,
69
- NotEqual,
70
- LogicalNot,
71
- Less,
72
- LessEqual,
73
- Greater,
74
- GreaterEqual,
75
- Mul,
76
- RealDiv,
77
- QuantPerChannel,
78
- LayerNorm,
79
- AddLayerNorm,
80
- RmsNorm,
81
- AddRmsNorm,
82
- RmsNormQuant,
83
- AddRmsNormQuant,
84
- MatmulAddRmsNorm,
85
- Softmax,
86
- Split,
87
- Swish,
88
- SwiGLU,
89
- Concat,
90
- MatmulQkv,
91
- MaskedFill,
92
- BroadcastTo,
93
- ReduceSum,
94
- TopK,
95
- Tile,
96
- GroupedMatmul,
97
- OpId_END,
98
- FastGeLU,
99
- TransData,
100
- QuantLinearSparse,
120
+
121
+ struct MultiWeightMatmulParam {
122
+ uint32_t n0_len{0};
123
+ uint32_t n1_len{0};
124
+ uint32_t n2_len{0};
125
+ bool transpose_a;
126
+ bool transpose_b;
127
+ int32_t silu_position{-1};
128
+ bool with_bias{false};
101
129
  };
102
- using MatMulParam = AsdOps::OpParam::MatMul;
103
- using MixParam = AsdOps::OpParam::Mix;
104
- using GatherParam = AsdOps::OpParam::Gather;
105
- using ElewiseParam = AsdOps::OpParam::Elewise;
106
- using SliceParam = AsdOps::OpParam::Slice;
107
- using ActivationParam = AsdOps::OpParam::Activation;
108
- using TransposeParam = AsdOps::OpParam::Transpose;
109
- using NormParam = AsdOps::OpParam::Norm;
110
- using SoftmaxParam = AsdOps::OpParam::Softmax;
111
- using SplitParam = AsdOps::OpParam::Split;
112
- using ConcatParam = AsdOps::OpParam::Concat;
113
- using MaskedFillParam = AsdOps::OpParam::Fill;
114
- using BroadcastToParam = AsdOps::OpParam::Expand;
115
- using ReduceParam = AsdOps::OpParam::Reduce;
116
- using SortParam = AsdOps::OpParam::Sort;
117
- using ExpandParam = AsdOps::OpParam::Expand;
118
- using TransDataParam = AsdOps::OpParam::Transdata;
119
-
120
- struct AddLayerNormParam {
130
+
131
+ struct NormParam {
121
132
  float eps;
122
- bool operator==(const AddLayerNormParam &other) const { return this->eps == other.eps; }
133
+ bool operator==(const NormParam &other) const { return this->eps == other.eps; }
123
134
  };
124
135
 
125
136
  struct ApplyRotaryPosEmbParam {
126
- // cosFormat=0 shape是[maxSeqLen, headDim], cos/sin不交替
127
- // cosFormat=1 shape是[maxSeqLen, headDim], cos/sin交替
128
- // cosFormat=2 shape是[batch*seqLen, headDim], cos/sin不交替
129
- // cosFormat=3 shape是[batch*seqLen, headDim], cos/sin交替
130
- int32_t cosFormat{0};
137
+ // cos_format=0 shape是[maxSeqLen, headDim], cos/sin不交替
138
+ // cos_format=1 shape是[maxSeqLen, headDim], cos/sin交替
139
+ // cos_format=2 shape是[batch*seqLen, headDim], cos/sin不交替
140
+ // cos_format=3 shape是[batch*seqLen, headDim], cos/sin交替
141
+ int32_t cos_format{0};
142
+ int32_t rotary_coeff{-1};
143
+ std::vector<int32_t> batch_valid_length;
131
144
  };
132
145
 
133
- struct AddRmsNormParam {
134
- float eps;
135
- bool operator==(const AddRmsNormParam &other) const { return this->eps == other.eps; }
146
+ struct TransDataParam {
147
+ enum TransdataType { UNDEFINED = 0, FRACTAL_NZ_TO_ND, ND_TO_FRACTAL_NZ };
148
+ TransdataType transdataType = UNDEFINED;
149
+ enum SpecialType { NORMAL = 0, ATTENTION_INPUT_QKV, ATTENTION_INPUT_MASK };
150
+ int64_t specialTransdata = NORMAL;
151
+ };
152
+
153
+ struct FlashAttentionScoreParam {
154
+ int32_t head_num = 0;
155
+ int32_t inner_precise = 0;
156
+ int32_t pre_tokens = 2147483647;
157
+ int32_t next_tokens = 0;
158
+ int32_t sparse_mode = 0;
159
+ int32_t mask_dtype = 0;
160
+ int32_t input_layout = 0;
161
+ std::vector<int64_t> mask_dims;
162
+ std::vector<int32_t> kv_seq_len;
163
+ std::vector<int32_t> q_seq_len;
164
+ float tor = 0;
165
+
166
+ enum InputLayoutMode : int64_t { BSH = 0, BNSD = 1, SBH = 2, BSND = 3, TND = 4, TH = 5, NSD = 6, SH = 7 };
167
+ };
168
+
169
+ struct PagedAttentionParam {
170
+ int32_t inner_precise = 0;
171
+ int32_t head_num = 0;
172
+ int32_t kv_head_num = 0;
173
+ std::vector<int32_t> kv_seq_len;
174
+ std::vector<int32_t> q_seq_len;
175
+ float tor = 0;
176
+
177
+ enum MaskType : uint32_t { kMaskTypeNone = 0, kMaskTypeAlibi = 1, kMaskTypeLookAhead = 2 };
178
+ MaskType mask_type = kMaskTypeNone;
179
+ int32_t kv_cache_quant_mode = 0;
136
180
  };
137
181
  } // namespace internal
138
182
  } // namespace mindspore
139
- #endif
183
+
184
+ #endif // MS_KERNELS_INTERNAL_KERNEL_OP_PARAM_H_
@@ -14,21 +14,22 @@
14
14
  * limitations under the License.
15
15
  */
16
16
 
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ACME_TILING_INFO_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ACME_TILING_INFO_H_
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_TILING_INFO_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_TILING_INFO_H_
19
19
 
20
20
  #include <sstream>
21
21
 
22
- #include "acme/include/base_type.h"
22
+ #include "include/base_type.h"
23
23
 
24
24
  namespace mindspore {
25
- namespace acme {
25
+ namespace internal {
26
26
  class HostRunInfo {
27
27
  public:
28
28
  HostRunInfo() = default;
29
29
  virtual ~HostRunInfo() = default;
30
30
  void SetWorkSpaceSize(const std::vector<size_t> &workSpaceSize) { this->ws_size_ = workSpaceSize; }
31
31
  std::vector<size_t> GetWorkSpaceSize() const { return this->ws_size_; }
32
+ virtual uint32_t GetBlockDim() const = 0;
32
33
 
33
34
  private:
34
35
  std::vector<size_t> ws_size_;
@@ -37,10 +38,12 @@ using HostRunInfoPtr = std::shared_ptr<HostRunInfo>;
37
38
 
38
39
  class HostRunInfoComm : public HostRunInfo {
39
40
  public:
40
- HostRunInfoComm() = default;
41
- explicit HostRunInfoComm(size_t block_dim) : block_dims_(block_dim) {}
41
+ explicit HostRunInfoComm(uint32_t block_dim);
42
42
  ~HostRunInfoComm() = default;
43
- uint32_t block_dims_{0};
43
+
44
+ uint32_t GetBlockDim() const override;
45
+
46
+ uint32_t block_dim_{0};
44
47
  uint64_t any_value0_{0};
45
48
  uint64_t any_value1_{0};
46
49
  uint64_t any_value2_{0};
@@ -61,7 +64,7 @@ class TilingInfo {
61
64
  HostRunInfoPtr host_run_info_{nullptr};
62
65
  };
63
66
  using TilingInfoPtr = std::shared_ptr<TilingInfo>;
64
- } // namespace acme
67
+ } // namespace internal
65
68
  } // namespace mindspore
66
69
 
67
- #endif // MS_KERNELS_INTERNAL_KERNEL_ACME_TILING_INFO_H_
70
+ #endif // MS_KERNELS_INTERNAL_KERNEL_TILING_INFO_H_
@@ -0,0 +1,178 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_TILING_UTILS_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_TILING_UTILS_H_
19
+
20
+ #include <cstdint>
21
+ #include <functional>
22
+ #include <memory>
23
+ #include <sstream>
24
+ #include <string>
25
+ #include <unordered_map>
26
+ #include <vector>
27
+
28
+ #include "include/internal_op.h"
29
+
30
+ namespace mindspore {
31
+ namespace internal {
32
+ void Encrypt(char **src, size_t str_len, char *dest, bool offset_src = false);
33
+ void Decrypt(char **src, size_t str_len, char *dest, bool offset_src = true);
34
+
35
+ struct ScopeData {
36
+ uint32_t begin;
37
+ uint32_t end;
38
+ uint32_t offset;
39
+ uint32_t num;
40
+ };
41
+
42
+ struct ScopeInfo {
43
+ std::vector<uint16_t> types;
44
+ std::vector<ScopeData> scopes;
45
+ };
46
+
47
+ struct TilingData {
48
+ uint16_t version;
49
+ uint32_t base_offset;
50
+ uint16_t key_len;
51
+ uint16_t value_len;
52
+ uint32_t item_num;
53
+ uint16_t type_len;
54
+ std::vector<ScopeInfo> scope_infos;
55
+ };
56
+
57
+ template <typename T>
58
+ struct ArrayHasher {
59
+ std::size_t operator()(const std::vector<T> &arr) const {
60
+ std::size_t hash = 0;
61
+ for (T num : arr) {
62
+ hash ^= std::hash<T>{}(num) + 0x9e3779b9 + (hash << 6) + (hash >> 2);
63
+ }
64
+ return hash;
65
+ }
66
+ };
67
+
68
+ using Repo = std::unordered_map<std::vector<int>, std::vector<int>, ArrayHasher<int>>;
69
+ using RepoMap = std::unordered_map<std::vector<uint16_t>, Repo, ArrayHasher<uint16_t>>;
70
+
71
+ class TilingLoadUtil {
72
+ public:
73
+ explicit TilingLoadUtil(const std::string &db_file, bool is_full_path = false)
74
+ : db_file_(db_file), is_full_(is_full_path) {}
75
+ ~TilingLoadUtil();
76
+ InternalStatus LoadTilingData(TilingData *tiling_data_out);
77
+ InternalStatus LoadScopeTilings(uint32_t base, uint16_t key_len, uint16_t value_len, const ScopeData &scope, Repo *repo);
78
+
79
+ private:
80
+ std::string GetDataFileFullPath(const std::string &db_name) const;
81
+ InternalStatus InitData();
82
+ InternalStatus ReadTilingData(TilingData *tiling_data);
83
+ InternalStatus ReadScopeData(TilingData *tiling_data);
84
+
85
+ std::string db_file_;
86
+ bool is_full_;
87
+ int f_{-1};
88
+ size_t memory_size_{0};
89
+ char *data_{nullptr};
90
+ };
91
+
92
+ using KeyScope = std::pair<int, int>;
93
+
94
+ class TilingRepo {
95
+ public:
96
+ TilingRepo(const TilingRepo &flags) = delete;
97
+ TilingRepo(TilingRepo &&flags) = delete;
98
+ TilingRepo &operator=(const TilingRepo &flags) = delete;
99
+ TilingRepo &operator=(TilingRepo &&flags) = delete;
100
+ ~TilingRepo() = default;
101
+
102
+ static TilingRepo &Instance();
103
+ void Register(const std::string &name, const std::string &db_name);
104
+ InternalStatus GetTiling(const std::string &name, const std::vector<uint16_t> &types, const std::vector<int> &key,
105
+ std::vector<int> *out,
106
+ const std::function<KeyScope(const std::vector<int> &)> &gen_scope_func = nullptr);
107
+ using LoadRecord = std::unordered_map<std::vector<uint16_t>, std::vector<KeyScope>, ArrayHasher<uint16_t>>;
108
+
109
+ private:
110
+ TilingRepo() = default;
111
+ bool IsRegistered(const std::string &name) const;
112
+ std::vector<int> Get(const std::string &name, const std::vector<uint16_t> &types, const std::vector<int> &key) const;
113
+ InternalStatus LoadScopeData(const std::string &name, const std::vector<uint16_t> &types,
114
+ const KeyScope &scope = std::make_pair(0, 0));
115
+
116
+ std::unordered_map<std::string, size_t> name_idx_map_;
117
+ std::unordered_map<std::string, size_t> db_name_idx_map_;
118
+ std::vector<std::string> db_names_;
119
+ std::vector<TilingData> tiling_datas_;
120
+ std::vector<RepoMap> repo_maps_;
121
+ std::vector<LoadRecord> loaded_;
122
+ };
123
+
124
+ class TilingDBLoad {
125
+ public:
126
+ TilingDBLoad(const std::string &op_name, const std::string &db_name) {
127
+ TilingRepo::Instance().Register(op_name, db_name);
128
+ }
129
+ };
130
+
131
+ struct RuningInfo {
132
+ internal::ShapeInfoList input_shapes;
133
+ internal::InputsImmutableInfoList input_infos;
134
+ internal::ShapeInfoList output_shapes;
135
+ internal::InputsImmutableInfoList output_infos;
136
+ };
137
+
138
+ class Tunable {
139
+ public:
140
+ Tunable() = default;
141
+ virtual ~Tunable() = default;
142
+ virtual InternalOpPtr CreateOpByKey(const std::vector<int64_t> &key) = 0;
143
+ virtual RuningInfo GetRuningInfo(const std::vector<int64_t> &key) const = 0;
144
+ };
145
+ using TunablePtr = std::shared_ptr<Tunable>;
146
+
147
+ using TunableCreator = std::function<TunablePtr()>;
148
+ class TunableBuilder {
149
+ public:
150
+ ~TunableBuilder() = default;
151
+ TunableBuilder(const TunableBuilder &) = delete;
152
+ TunableBuilder &operator=(const TunableBuilder &) = delete;
153
+ static TunableBuilder &Instance();
154
+
155
+ void Register(const std::string &op_name, TunableCreator &&creator);
156
+ TunablePtr Create(const std::string &op_name) const;
157
+
158
+ private:
159
+ TunableBuilder() = default;
160
+ std::unordered_map<std::string, TunableCreator> tunable_creators_;
161
+ };
162
+
163
+ class TuneRegister {
164
+ public:
165
+ TuneRegister(const std::string &op_name, TunableCreator creator) noexcept {
166
+ TunableBuilder::Instance().Register(op_name, std::move(creator));
167
+ }
168
+ ~TuneRegister() = default;
169
+ };
170
+
171
+ #define REG_OP_TUNABLE(op_name, TargetClass) \
172
+ static_assert(std::is_base_of<Tunable, TargetClass>::value, #TargetClass " must be derived from Tunable!"); \
173
+ static const TuneRegister g_##op_name##_tunable_reg(#op_name, \
174
+ []() -> TunablePtr { return std::make_shared<TargetClass>(); })
175
+ } // namespace internal
176
+ } // namespace mindspore
177
+
178
+ #endif // MS_KERNELS_INTERNAL_KERNEL_TILING_UTILS_H_