mindspore 2.4.10__cp310-none-any.whl → 2.5.0__cp310-none-any.whl

This diff shows the changes between publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (688):
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-310-aarch64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-310-aarch64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-310-aarch64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +98 -21
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -3
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +31 -15
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +5 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +285 -191
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +1 -0
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  80. mindspore/experimental/llm_boost/register.py +1 -0
  81. mindspore/experimental/optim/adadelta.py +26 -22
  82. mindspore/experimental/optim/adam.py +3 -0
  83. mindspore/experimental/optim/lr_scheduler.py +33 -24
  84. mindspore/experimental/optim/radam.py +33 -30
  85. mindspore/hal/device.py +28 -0
  86. mindspore/hal/event.py +17 -0
  87. mindspore/hal/memory.py +94 -3
  88. mindspore/hal/stream.py +91 -6
  89. mindspore/include/api/context.h +0 -1
  90. mindspore/lib/libavcodec.so.59 +0 -0
  91. mindspore/lib/libavdevice.so.59 +0 -0
  92. mindspore/lib/libavfilter.so.8 +0 -0
  93. mindspore/lib/libavformat.so.59 +0 -0
  94. mindspore/lib/libavutil.so.57 +0 -0
  95. mindspore/lib/libdnnl.so.2 +0 -0
  96. mindspore/lib/libmindspore_backend.so +0 -0
  97. mindspore/lib/libmindspore_common.so +0 -0
  98. mindspore/lib/libmindspore_core.so +0 -0
  99. mindspore/lib/libmindspore_glog.so.0 +0 -0
  100. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  101. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  102. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  103. mindspore/lib/libmindspore_ops.so +0 -0
  104. mindspore/lib/libmpi_adapter.so +0 -0
  105. mindspore/lib/libmpi_collective.so +0 -0
  106. mindspore/lib/libnnacl.so +0 -0
  107. mindspore/lib/libopencv_core.so.4.5 +0 -0
  108. mindspore/lib/libps_cache.so +0 -0
  109. mindspore/lib/libswresample.so.4 +0 -0
  110. mindspore/lib/libswscale.so.6 +0 -0
  111. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  112. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  113. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  114. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  115. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/decoder_kv_cache.py +1 -1
  116. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/prompt_kv_cache.py +1 -1
  117. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -1
  121. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/lib/libcust_opapi.so +0 -0
  122. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +224 -0
  123. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/all_finite.py +1 -1
  124. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +1 -1
  125. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +1 -1
  126. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  127. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  128. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  166. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  167. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -1
  172. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  173. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  174. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  175. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  176. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  177. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  178. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  179. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  180. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +957 -955
  181. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops_static.a +0 -0
  182. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/liblcal_static.a +0 -0
  183. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  184. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  185. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  186. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  187. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  188. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  189. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  190. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  191. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  192. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  193. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  194. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  195. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  196. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  197. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  198. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  199. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  200. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  201. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  202. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  203. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  204. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  205. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  206. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  207. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  208. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  209. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  210. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  211. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  212. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  213. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  214. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  215. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  216. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  217. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  218. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  219. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  220. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  221. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  222. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  223. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  224. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  225. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  226. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  227. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  228. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  229. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  230. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  231. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  232. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  233. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  234. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  235. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  236. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  237. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  238. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  239. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  240. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  241. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  242. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  243. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  244. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  245. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  246. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  247. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  248. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  249. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  250. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_layer_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so} +0 -0
  251. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  252. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  253. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  254. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  255. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  256. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  257. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  258. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  259. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  260. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  261. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  262. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  263. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  264. mindspore/log.py +12 -0
  265. mindspore/mindrecord/__init__.py +1 -1
  266. mindspore/mindrecord/config.py +17 -316
  267. mindspore/mindrecord/filereader.py +1 -9
  268. mindspore/mindrecord/filewriter.py +5 -15
  269. mindspore/mindrecord/mindpage.py +1 -9
  270. mindspore/mint/__init__.py +824 -218
  271. mindspore/mint/distributed/__init__.py +66 -4
  272. mindspore/mint/distributed/distributed.py +2594 -44
  273. mindspore/mint/linalg/__init__.py +6 -0
  274. mindspore/mint/nn/__init__.py +473 -14
  275. mindspore/mint/nn/functional.py +486 -11
  276. mindspore/mint/nn/layer/__init__.py +17 -4
  277. mindspore/mint/nn/layer/_functions.py +330 -0
  278. mindspore/mint/nn/layer/activation.py +169 -1
  279. mindspore/mint/nn/layer/basic.py +123 -0
  280. mindspore/mint/nn/layer/conv.py +727 -0
  281. mindspore/mint/nn/layer/normalization.py +215 -19
  282. mindspore/mint/nn/layer/padding.py +797 -0
  283. mindspore/mint/nn/layer/pooling.py +170 -0
  284. mindspore/mint/optim/__init__.py +2 -1
  285. mindspore/mint/optim/adam.py +223 -0
  286. mindspore/mint/optim/adamw.py +26 -19
  287. mindspore/mint/special/__init__.py +2 -1
  288. mindspore/multiprocessing/__init__.py +5 -0
  289. mindspore/nn/cell.py +126 -19
  290. mindspore/nn/dynamic_lr.py +2 -1
  291. mindspore/nn/layer/activation.py +6 -6
  292. mindspore/nn/layer/basic.py +35 -25
  293. mindspore/nn/layer/channel_shuffle.py +3 -3
  294. mindspore/nn/layer/embedding.py +3 -3
  295. mindspore/nn/layer/normalization.py +8 -7
  296. mindspore/nn/layer/padding.py +4 -3
  297. mindspore/nn/layer/pooling.py +47 -13
  298. mindspore/nn/layer/rnn_cells.py +1 -1
  299. mindspore/nn/layer/rnns.py +2 -1
  300. mindspore/nn/layer/timedistributed.py +5 -5
  301. mindspore/nn/layer/transformer.py +48 -26
  302. mindspore/nn/learning_rate_schedule.py +5 -3
  303. mindspore/nn/loss/loss.py +31 -36
  304. mindspore/nn/optim/ada_grad.py +1 -0
  305. mindspore/nn/optim/adadelta.py +2 -2
  306. mindspore/nn/optim/adam.py +1 -1
  307. mindspore/nn/optim/lars.py +1 -4
  308. mindspore/nn/optim/optimizer.py +1 -1
  309. mindspore/nn/optim/rprop.py +2 -2
  310. mindspore/nn/optim/thor.py +2 -1
  311. mindspore/nn/utils/init.py +13 -11
  312. mindspore/nn/wrap/cell_wrapper.py +4 -6
  313. mindspore/nn/wrap/loss_scale.py +3 -4
  314. mindspore/numpy/array_creations.py +60 -62
  315. mindspore/numpy/array_ops.py +148 -143
  316. mindspore/numpy/logic_ops.py +41 -42
  317. mindspore/numpy/math_ops.py +361 -359
  318. mindspore/numpy/utils.py +16 -16
  319. mindspore/numpy/utils_const.py +4 -4
  320. mindspore/ops/__init__.py +2 -1
  321. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  322. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  323. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  324. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  325. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  326. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  327. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  328. mindspore/ops/_vmap/vmap_base.py +0 -2
  329. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  330. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  331. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  332. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  333. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  334. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  335. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  336. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  337. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  338. mindspore/ops/composite/base.py +1 -1
  339. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  340. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  341. mindspore/ops/function/__init__.py +12 -0
  342. mindspore/ops/function/array_func.py +561 -159
  343. mindspore/ops/function/clip_func.py +64 -0
  344. mindspore/ops/function/debug_func.py +28 -20
  345. mindspore/ops/function/image_func.py +1 -1
  346. mindspore/ops/function/linalg_func.py +5 -4
  347. mindspore/ops/function/math_func.py +1659 -290
  348. mindspore/ops/function/nn_func.py +988 -317
  349. mindspore/ops/function/parameter_func.py +3 -56
  350. mindspore/ops/function/random_func.py +243 -33
  351. mindspore/ops/function/sparse_unary_func.py +1 -1
  352. mindspore/ops/functional.py +18 -5
  353. mindspore/ops/functional_overload.py +897 -0
  354. mindspore/ops/operations/__init__.py +3 -2
  355. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  356. mindspore/ops/operations/_grad_ops.py +2 -34
  357. mindspore/ops/operations/_infer_ops.py +2 -1
  358. mindspore/ops/operations/_inner_ops.py +38 -8
  359. mindspore/ops/operations/array_ops.py +45 -303
  360. mindspore/ops/operations/comm_ops.py +19 -16
  361. mindspore/ops/operations/custom_ops.py +11 -55
  362. mindspore/ops/operations/debug_ops.py +42 -47
  363. mindspore/ops/operations/inner_ops.py +6 -4
  364. mindspore/ops/operations/linalg_ops.py +3 -2
  365. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  366. mindspore/ops/operations/math_ops.py +11 -216
  367. mindspore/ops/operations/nn_ops.py +146 -308
  368. mindspore/ops/primitive.py +23 -21
  369. mindspore/ops/tensor_method.py +1669 -0
  370. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  371. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  372. mindspore/ops_generate/arg_handler.py +0 -61
  373. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  374. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  375. mindspore/ops_generate/base_generator.py +11 -0
  376. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  377. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  378. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  379. mindspore/ops_generate/functions_cc_generator.py +233 -0
  380. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  381. mindspore/ops_generate/gen_constants.py +157 -3
  382. mindspore/ops_generate/gen_ops.py +245 -990
  383. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  384. mindspore/ops_generate/gen_utils.py +119 -33
  385. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  386. mindspore/ops_generate/op_api_proto.py +206 -0
  387. mindspore/ops_generate/op_def_py_generator.py +131 -0
  388. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  389. mindspore/ops_generate/op_proto.py +373 -108
  390. mindspore/ops_generate/op_template_parser.py +436 -0
  391. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  392. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  393. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  394. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  395. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  396. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  397. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  398. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  399. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  400. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  401. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  402. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  403. mindspore/ops_generate/pyboost_utils.py +92 -33
  404. mindspore/ops_generate/template.py +294 -44
  405. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  406. mindspore/parallel/__init__.py +3 -3
  407. mindspore/parallel/_auto_parallel_context.py +24 -33
  408. mindspore/parallel/_parallel_serialization.py +13 -2
  409. mindspore/parallel/_utils.py +4 -1
  410. mindspore/parallel/algo_parameter_config.py +1 -1
  411. mindspore/parallel/checkpoint_transform.py +44 -0
  412. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  413. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  414. mindspore/parallel/cluster/run.py +20 -3
  415. mindspore/parallel/parameter_broadcast.py +1 -1
  416. mindspore/parallel/shard.py +3 -0
  417. mindspore/parallel/transform_safetensors.py +119 -253
  418. mindspore/profiler/__init__.py +17 -4
  419. mindspore/profiler/analysis/__init__.py +0 -0
  420. mindspore/profiler/analysis/parser/__init__.py +0 -0
  421. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  422. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  423. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  424. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  425. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  426. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  427. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  428. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  429. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  430. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  431. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  432. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  433. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  434. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  435. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  436. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  437. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  438. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  439. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  440. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  441. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  442. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  443. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  444. mindspore/profiler/analysis/task_manager.py +131 -0
  445. mindspore/profiler/analysis/time_converter.py +84 -0
  446. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  447. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  448. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  449. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  450. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  451. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  452. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  453. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  454. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  455. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  456. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  457. mindspore/profiler/analysis/work_flow.py +73 -0
  458. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  459. mindspore/profiler/common/command_executor.py +90 -0
  460. mindspore/profiler/common/constant.py +174 -3
  461. mindspore/profiler/common/file_manager.py +208 -0
  462. mindspore/profiler/common/log.py +130 -0
  463. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  464. mindspore/profiler/common/path_manager.py +371 -0
  465. mindspore/profiler/common/process_bar.py +168 -0
  466. mindspore/profiler/common/process_pool.py +9 -3
  467. mindspore/profiler/common/profiler_context.py +476 -0
  468. mindspore/profiler/common/profiler_info.py +304 -0
  469. mindspore/profiler/common/profiler_output_path.py +284 -0
  470. mindspore/profiler/common/profiler_parameters.py +210 -0
  471. mindspore/profiler/common/profiler_path_manager.py +120 -0
  472. mindspore/profiler/common/record_function.py +76 -0
  473. mindspore/profiler/common/tlv_decoder.py +76 -0
  474. mindspore/profiler/common/util.py +75 -2
  475. mindspore/profiler/dynamic_profiler.py +270 -37
  476. mindspore/profiler/envprofiler.py +138 -0
  477. mindspore/profiler/mstx.py +199 -0
  478. mindspore/profiler/platform/__init__.py +21 -0
  479. mindspore/profiler/platform/base_profiler.py +40 -0
  480. mindspore/profiler/platform/cpu_profiler.py +124 -0
  481. mindspore/profiler/platform/gpu_profiler.py +74 -0
  482. mindspore/profiler/platform/npu_profiler.py +309 -0
  483. mindspore/profiler/profiler.py +580 -93
  484. mindspore/profiler/profiler_action_controller.py +187 -0
  485. mindspore/profiler/profiler_interface.py +114 -0
  486. mindspore/profiler/schedule.py +208 -0
  487. mindspore/rewrite/api/symbol_tree.py +1 -2
  488. mindspore/run_check/_check_version.py +2 -6
  489. mindspore/runtime/__init__.py +37 -0
  490. mindspore/runtime/device.py +27 -0
  491. mindspore/runtime/event.py +209 -0
  492. mindspore/runtime/executor.py +148 -0
  493. mindspore/runtime/memory.py +392 -0
  494. mindspore/runtime/stream.py +460 -0
  495. mindspore/runtime/thread_bind_core.py +401 -0
  496. mindspore/train/__init__.py +2 -2
  497. mindspore/train/_utils.py +53 -18
  498. mindspore/train/amp.py +8 -4
  499. mindspore/train/callback/_checkpoint.py +32 -18
  500. mindspore/train/callback/_early_stop.py +1 -1
  501. mindspore/train/callback/_flops_collector.py +105 -69
  502. mindspore/train/callback/_history.py +1 -1
  503. mindspore/train/callback/_summary_collector.py +44 -6
  504. mindspore/train/callback/_tft_register.py +31 -10
  505. mindspore/train/dataset_helper.py +11 -11
  506. mindspore/train/metrics/precision.py +4 -5
  507. mindspore/train/mind_ir_pb2.py +167 -46
  508. mindspore/train/model.py +13 -15
  509. mindspore/train/serialization.py +462 -76
  510. mindspore/train/summary/summary_record.py +1 -2
  511. mindspore/train/train_thor/model_thor.py +1 -1
  512. mindspore/utils/__init__.py +4 -2
  513. mindspore/utils/bin/dataset-cache +0 -0
  514. mindspore/utils/bin/dataset-cache-server +0 -0
  515. mindspore/utils/dryrun.py +138 -0
  516. mindspore/utils/runtime_execution_order_check.py +550 -0
  517. mindspore/version.py +1 -1
  518. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  519. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +522 -456
  520. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  521. mindspore/_data_dump.cpython-310-aarch64-linux-gnu.so +0 -0
  522. mindspore/bin/cache_admin +0 -0
  523. mindspore/bin/cache_server +0 -0
  524. mindspore/common/_tensor_overload.py +0 -139
  525. mindspore/lib/libmindspore_np_dtype.so +0 -0
  526. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  527. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  528. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  529. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  530. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  531. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  532. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  533. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  534. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  535. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  536. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  537. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  538. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  539. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  540. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  541. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  542. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  543. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -97
  544. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  545. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  546. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  547. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  548. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  549. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  550. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  551. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  552. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  553. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  554. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  555. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  556. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  557. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  558. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  559. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  560. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  561. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  562. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  563. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  564. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  565. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  566. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  567. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  568. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  569. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  570. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  571. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  572. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  573. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  574. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  575. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  576. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  577. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  578. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  579. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  580. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  581. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  582. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  583. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  584. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  585. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  586. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  587. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  588. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  589. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  590. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  591. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  592. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  593. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  594. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  595. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  596. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  597. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  598. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  599. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  600. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  601. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  602. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  603. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  604. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  605. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  606. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  607. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  608. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  609. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  610. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  611. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  612. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  613. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  614. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  615. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  616. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  617. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  618. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  619. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  620. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  621. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  622. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  623. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  624. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  625. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  626. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  627. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  628. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  629. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  630. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  631. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  632. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  633. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  634. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  635. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  636. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  637. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  638. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  639. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  640. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  641. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  642. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  643. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  644. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  645. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  646. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  647. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  648. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  649. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  650. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  651. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  652. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  653. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  654. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  655. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  656. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  657. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  658. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  659. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  660. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  661. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  662. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  663. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  664. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  665. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  666. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  667. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  668. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  669. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  670. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  671. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  672. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  673. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  674. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  685. mindspore/profiler/envprofiling.py +0 -254
  686. mindspore/profiler/profiling.py +0 -1926
  687. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  688. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -1,5 +1,5 @@
1
1
  /**
2
- * Copyright 2023-2024 Huawei Technologies Co., Ltd
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
3
  *
4
4
  * Licensed under the Apache License, Version 2.0 (the "License");
5
5
  * you may not use this file except in compliance with the License.
@@ -13,127 +13,172 @@
13
13
  * See the License for the specific language governing permissions and
14
14
  * limitations under the License.
15
15
  */
16
- #ifndef MS_KERNELS_INTERNAL_OP_PARAM_H_
17
- #define MS_KERNELS_INTERNAL_OP_PARAM_H_
18
- #include "asdops/op_desc.h"
19
- #include "asdops/params/matmul.h"
20
- #include "asdops/params/mix.h"
21
- #include "asdops/params/slice.h"
22
- #include "asdops/params/gather.h"
23
- #include "asdops/params/elewise.h"
24
- #include "asdops/params/activation.h"
25
- #include "asdops/params/concat.h"
26
- #include "asdops/params/transpose.h"
27
- #include "asdops/params/norm.h"
28
- #include "asdops/params/softmax.h"
29
- #include "asdops/params/split.h"
30
- #include "asdops/params/expand.h"
31
- #include "asdops/params/fill.h"
32
- #include "asdops/params/reduce.h"
33
- #include "asdops/params/sort.h"
34
- #include "asdops/params/transdata.h"
35
- #include <memory>
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_OP_PARAM_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_OP_PARAM_H_
19
+
20
+ #include <stdint.h>
36
21
  #include <vector>
37
- #include "ms_int_types.h"
22
+
38
23
  namespace mindspore {
39
24
  namespace internal {
40
- struct DtypesParam {
41
- int op_id_ = 0;
42
- std::vector<int64_t> in_dtypes_;
43
- std::vector<int64_t> out_dtypes_;
25
+ // matmul fused op
26
+ constexpr auto kInternalMatMulOpName = "MatMul";
27
+ constexpr auto kInternalMultiWeightMatmulOpName = "MultiWeightMatmul";
28
+ constexpr auto kInternalMatMulAddRmsNormOpName = "MatMulAddRmsNorm";
29
+ // attention fused op
30
+ constexpr auto kInternalFlashAttentionScoreOpName = "FlashAttentionScore";
31
+ constexpr auto kInternalPagedAttentionOpName = "PagedAttention";
32
+ constexpr auto kInternalReshapeAndCacheOpName = "ReshapeAndCache";
33
+ constexpr auto kInternalReshapeAndCacheNzOpName = "ReshapeAndCacheNz";
34
+ constexpr auto kInternalApplyRotaryPosEmbOpName = "ApplyRotaryPosEmb";
35
+ constexpr auto kInternalApplyRotaryPosEmbNzOpName = "ApplyRotaryPosEmbNz";
36
+ // norm fused op
37
+ constexpr auto kInternalAddLayerNormOpName = "AddLayerNorm";
38
+ constexpr auto kInternalRmsNormOpName = "RmsNorm";
39
+ constexpr auto kInternalAddRmsNormOpName = "AddRmsNorm";
40
+ constexpr auto kInternalRmsNormQuantOpName = "RmsNormQuant";
41
+ constexpr auto kInternalAddRmsNormQuantOpName = "AddRmsNormQuantV2";
42
+ constexpr auto kInternalAddRmsNormDynamicQuantOpName = "AddRmsNormDynamicQuant";
43
+ // activation
44
+ constexpr auto kInternalReluOpName = "Relu";
45
+ constexpr auto kInternalGeLUOpName = "GeLU";
46
+ constexpr auto kInternalFastGeLUOpName = "FastGeLU";
47
+ constexpr auto kInternalSwishOpName = "Swish";
48
+ constexpr auto kInternalSwiGLUOpName = "SwiGLU";
49
+ // elewise unary
50
+ constexpr auto kInternalCastOpName = "Cast";
51
+ constexpr auto kInternalExpOpName = "Exp";
52
+ constexpr auto kInternalLnOpName = "Ln";
53
+ constexpr auto kInternalRsqrtOpName = "Rsqrt";
54
+ constexpr auto kInternalSqrtOpName = "Sqrt";
55
+ constexpr auto kInternalAbsOpName = "Abs";
56
+ constexpr auto kInternalReciprocalOpName = "Reciprocal";
57
+ // elewise binary
58
+ constexpr auto kInternalAddOpName = "Add";
59
+ constexpr auto kInternalSubOpName = "Sub";
60
+ constexpr auto kInternalMulOpName = "Mul";
61
+ constexpr auto kInternalDivOpName = "Div";
62
+ constexpr auto kInternalRealDivOpName = "RealDiv";
63
+ constexpr auto kInternalMaxOpName = "Max";
64
+ constexpr auto kInternalMinOpName = "Min";
65
+ constexpr auto kInternalNotOpName = "Not";
66
+ constexpr auto kInternalOrOpName = "Or";
67
+ constexpr auto kInternalAndOpName = "And";
68
+ constexpr auto kInternalEqualOpName = "Equal";
69
+ constexpr auto kInternalNotEqualOpName = "NotEqual";
70
+ constexpr auto kInternalLessOpName = "Less";
71
+ constexpr auto kInternalLessEqualOpName = "LessEqual";
72
+ constexpr auto kInternalGreaterOpName = "Greater";
73
+ constexpr auto kInternalGreaterEqualOpName = "GreaterEqual";
74
+ constexpr auto kInternalLogicalNotOpName = "LogicalNot";
75
+ // others
76
+ constexpr auto kInternalGatherOpName = "Gather";
77
+ constexpr auto kInternalTransposeOpName = "Transpose";
78
+ constexpr auto kInternalTransDataOpName = "TransData";
79
+ constexpr auto kInternalQuantPerChannelOpName = "QuantPerChannel";
80
+ constexpr auto kInternalSoftmaxOpName = "Softmax";
81
+ constexpr auto kInternalReduceSumOpName = "ReduceSum";
82
+ constexpr auto kInternalQuantLinearSparseOpName = "QuantLinearSparse";
83
+
84
+ struct AxesParam {
85
+ std::vector<int64_t> axes;
86
+ };
87
+
88
+ using TransposeParam = AxesParam;
89
+ using SoftmaxParam = AxesParam;
90
+ using ReduceSumParam = AxesParam;
91
+
92
+ struct GatherParam {
93
+ int64_t batch_dims;
94
+ std::vector<int64_t> axes;
95
+ };
96
+
97
+ struct SwiGLUParam {
98
+ int64_t axis;
99
+ };
100
+
101
+ struct MatmulParam {
102
+ bool transpose_a{false};
103
+ bool transpose_b{false};
104
+ bool enable_dequant{false};
105
+ bool with_relu{false};
106
+ bool with_gelu{false};
107
+ bool with_fastgelu{false};
108
+ bool with_bias{false};
109
+ bool with_bias_fastgelu{false};
110
+ bool enable_shuffle{false};
111
+ uint32_t tilingN = 0; // 压缩算法透传参数, 单压缩块 n 方向的基块数
112
+ uint32_t tilingK = 0; // 压缩算法透传参数, 单压缩块 k 方向的基块数
44
113
  };
45
- struct OpParam : public AsdOps::OpDesc {
46
- int dtype_ = 0;
47
- std::vector<int64_t> in_dtypes_;
48
- std::vector<int64_t> out_dtypes_;
49
- std::string op_fullname_;
114
+
115
+ struct MatmulAddRmsNormParam {
116
+ bool transpose_a{false};
117
+ bool transpose_b{false};
118
+ float eps{1e-6};
50
119
  };
51
- enum OpId : int {
52
- MatMul,
53
- ReshapeAndCache,
54
- ReshapeAndCacheNz,
55
- Slice,
56
- Gather,
57
- ApplyRotaryPosEmb,
58
- ApplyRotaryPosEmbNz,
59
- Add,
60
- Sub,
61
- Exp,
62
- Relu,
63
- FlashAttentionScore,
64
- PagedAttention,
65
- Cast,
66
- Gelu,
67
- Transpose,
68
- Equal,
69
- NotEqual,
70
- LogicalNot,
71
- Less,
72
- LessEqual,
73
- Greater,
74
- GreaterEqual,
75
- Mul,
76
- RealDiv,
77
- QuantPerChannel,
78
- LayerNorm,
79
- AddLayerNorm,
80
- RmsNorm,
81
- AddRmsNorm,
82
- RmsNormQuant,
83
- AddRmsNormQuant,
84
- MatmulAddRmsNorm,
85
- Softmax,
86
- Split,
87
- Swish,
88
- SwiGLU,
89
- Concat,
90
- MatmulQkv,
91
- MaskedFill,
92
- BroadcastTo,
93
- ReduceSum,
94
- TopK,
95
- Tile,
96
- GroupedMatmul,
97
- OpId_END,
98
- FastGeLU,
99
- TransData,
100
- QuantLinearSparse,
120
+
121
+ struct MultiWeightMatmulParam {
122
+ uint32_t n0_len{0};
123
+ uint32_t n1_len{0};
124
+ uint32_t n2_len{0};
125
+ bool transpose_a;
126
+ bool transpose_b;
127
+ int32_t silu_position{-1};
128
+ bool with_bias{false};
101
129
  };
102
- using MatMulParam = AsdOps::OpParam::MatMul;
103
- using MixParam = AsdOps::OpParam::Mix;
104
- using GatherParam = AsdOps::OpParam::Gather;
105
- using ElewiseParam = AsdOps::OpParam::Elewise;
106
- using SliceParam = AsdOps::OpParam::Slice;
107
- using ActivationParam = AsdOps::OpParam::Activation;
108
- using TransposeParam = AsdOps::OpParam::Transpose;
109
- using NormParam = AsdOps::OpParam::Norm;
110
- using SoftmaxParam = AsdOps::OpParam::Softmax;
111
- using SplitParam = AsdOps::OpParam::Split;
112
- using ConcatParam = AsdOps::OpParam::Concat;
113
- using MaskedFillParam = AsdOps::OpParam::Fill;
114
- using BroadcastToParam = AsdOps::OpParam::Expand;
115
- using ReduceParam = AsdOps::OpParam::Reduce;
116
- using SortParam = AsdOps::OpParam::Sort;
117
- using ExpandParam = AsdOps::OpParam::Expand;
118
- using TransDataParam = AsdOps::OpParam::Transdata;
119
-
120
- struct AddLayerNormParam {
130
+
131
+ struct NormParam {
121
132
  float eps;
122
- bool operator==(const AddLayerNormParam &other) const { return this->eps == other.eps; }
133
+ bool operator==(const NormParam &other) const { return this->eps == other.eps; }
123
134
  };
124
135
 
125
136
  struct ApplyRotaryPosEmbParam {
126
- // cosFormat=0 shape是[maxSeqLen, headDim], cos/sin不交替
127
- // cosFormat=1 shape是[maxSeqLen, headDim], cos/sin交替
128
- // cosFormat=2 shape是[batch*seqLen, headDim], cos/sin不交替
129
- // cosFormat=3 shape是[batch*seqLen, headDim], cos/sin交替
130
- int32_t cosFormat{0};
137
+ // cos_format=0 shape是[maxSeqLen, headDim], cos/sin不交替
138
+ // cos_format=1 shape是[maxSeqLen, headDim], cos/sin交替
139
+ // cos_format=2 shape是[batch*seqLen, headDim], cos/sin不交替
140
+ // cos_format=3 shape是[batch*seqLen, headDim], cos/sin交替
141
+ int32_t cos_format{0};
142
+ int32_t rotary_coeff{-1};
143
+ std::vector<int32_t> batch_valid_length;
131
144
  };
132
145
 
133
- struct AddRmsNormParam {
134
- float eps;
135
- bool operator==(const AddRmsNormParam &other) const { return this->eps == other.eps; }
146
+ struct TransDataParam {
147
+ enum TransdataType { UNDEFINED = 0, FRACTAL_NZ_TO_ND, ND_TO_FRACTAL_NZ };
148
+ TransdataType transdataType = UNDEFINED;
149
+ enum SpecialType { NORMAL = 0, ATTENTION_INPUT_QKV, ATTENTION_INPUT_MASK };
150
+ int64_t specialTransdata = NORMAL;
151
+ };
152
+
153
+ struct FlashAttentionScoreParam {
154
+ int32_t head_num = 0;
155
+ int32_t inner_precise = 0;
156
+ int32_t pre_tokens = 2147483647;
157
+ int32_t next_tokens = 0;
158
+ int32_t sparse_mode = 0;
159
+ int32_t mask_dtype = 0;
160
+ int32_t input_layout = 0;
161
+ std::vector<int64_t> mask_dims;
162
+ std::vector<int32_t> kv_seq_len;
163
+ std::vector<int32_t> q_seq_len;
164
+ float tor = 0;
165
+
166
+ enum InputLayoutMode : int64_t { BSH = 0, BNSD = 1, SBH = 2, BSND = 3, TND = 4, TH = 5, NSD = 6, SH = 7 };
167
+ };
168
+
169
+ struct PagedAttentionParam {
170
+ int32_t inner_precise = 0;
171
+ int32_t head_num = 0;
172
+ int32_t kv_head_num = 0;
173
+ std::vector<int32_t> kv_seq_len;
174
+ std::vector<int32_t> q_seq_len;
175
+ float tor = 0;
176
+
177
+ enum MaskType : uint32_t { kMaskTypeNone = 0, kMaskTypeAlibi = 1, kMaskTypeLookAhead = 2 };
178
+ MaskType mask_type = kMaskTypeNone;
179
+ int32_t kv_cache_quant_mode = 0;
136
180
  };
137
181
  } // namespace internal
138
182
  } // namespace mindspore
139
- #endif
183
+
184
+ #endif // MS_KERNELS_INTERNAL_KERNEL_OP_PARAM_H_
@@ -14,21 +14,22 @@
14
14
  * limitations under the License.
15
15
  */
16
16
 
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ACME_TILING_INFO_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ACME_TILING_INFO_H_
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_TILING_INFO_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_TILING_INFO_H_
19
19
 
20
20
  #include <sstream>
21
21
 
22
- #include "acme/include/base_type.h"
22
+ #include "include/base_type.h"
23
23
 
24
24
  namespace mindspore {
25
- namespace acme {
25
+ namespace internal {
26
26
  class HostRunInfo {
27
27
  public:
28
28
  HostRunInfo() = default;
29
29
  virtual ~HostRunInfo() = default;
30
30
  void SetWorkSpaceSize(const std::vector<size_t> &workSpaceSize) { this->ws_size_ = workSpaceSize; }
31
31
  std::vector<size_t> GetWorkSpaceSize() const { return this->ws_size_; }
32
+ virtual uint32_t GetBlockDim() const = 0;
32
33
 
33
34
  private:
34
35
  std::vector<size_t> ws_size_;
@@ -37,10 +38,12 @@ using HostRunInfoPtr = std::shared_ptr<HostRunInfo>;
37
38
 
38
39
  class HostRunInfoComm : public HostRunInfo {
39
40
  public:
40
- HostRunInfoComm() = default;
41
- explicit HostRunInfoComm(size_t block_dim) : block_dims_(block_dim) {}
41
+ explicit HostRunInfoComm(uint32_t block_dim);
42
42
  ~HostRunInfoComm() = default;
43
- uint32_t block_dims_{0};
43
+
44
+ uint32_t GetBlockDim() const override;
45
+
46
+ uint32_t block_dim_{0};
44
47
  uint64_t any_value0_{0};
45
48
  uint64_t any_value1_{0};
46
49
  uint64_t any_value2_{0};
@@ -61,7 +64,7 @@ class TilingInfo {
61
64
  HostRunInfoPtr host_run_info_{nullptr};
62
65
  };
63
66
  using TilingInfoPtr = std::shared_ptr<TilingInfo>;
64
- } // namespace acme
67
+ } // namespace internal
65
68
  } // namespace mindspore
66
69
 
67
- #endif // MS_KERNELS_INTERNAL_KERNEL_ACME_TILING_INFO_H_
70
+ #endif // MS_KERNELS_INTERNAL_KERNEL_TILING_INFO_H_
@@ -0,0 +1,178 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_TILING_UTILS_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_TILING_UTILS_H_
19
+
20
+ #include <cstdint>
21
+ #include <functional>
22
+ #include <memory>
23
+ #include <sstream>
24
+ #include <string>
25
+ #include <unordered_map>
26
+ #include <vector>
27
+
28
+ #include "include/internal_op.h"
29
+
30
+ namespace mindspore {
31
+ namespace internal {
32
+ void Encrypt(char **src, size_t str_len, char *dest, bool offset_src = false);
33
+ void Decrypt(char **src, size_t str_len, char *dest, bool offset_src = true);
34
+
35
+ struct ScopeData {
36
+ uint32_t begin;
37
+ uint32_t end;
38
+ uint32_t offset;
39
+ uint32_t num;
40
+ };
41
+
42
+ struct ScopeInfo {
43
+ std::vector<uint16_t> types;
44
+ std::vector<ScopeData> scopes;
45
+ };
46
+
47
+ struct TilingData {
48
+ uint16_t version;
49
+ uint32_t base_offset;
50
+ uint16_t key_len;
51
+ uint16_t value_len;
52
+ uint32_t item_num;
53
+ uint16_t type_len;
54
+ std::vector<ScopeInfo> scope_infos;
55
+ };
56
+
57
+ template <typename T>
58
+ struct ArrayHasher {
59
+ std::size_t operator()(const std::vector<T> &arr) const {
60
+ std::size_t hash = 0;
61
+ for (T num : arr) {
62
+ hash ^= std::hash<T>{}(num) + 0x9e3779b9 + (hash << 6) + (hash >> 2);
63
+ }
64
+ return hash;
65
+ }
66
+ };
67
+
68
+ using Repo = std::unordered_map<std::vector<int>, std::vector<int>, ArrayHasher<int>>;
69
+ using RepoMap = std::unordered_map<std::vector<uint16_t>, Repo, ArrayHasher<uint16_t>>;
70
+
71
+ class TilingLoadUtil {
72
+ public:
73
+ explicit TilingLoadUtil(const std::string &db_file, bool is_full_path = false)
74
+ : db_file_(db_file), is_full_(is_full_path) {}
75
+ ~TilingLoadUtil();
76
+ InternalStatus LoadTilingData(TilingData *tiling_data_out);
77
+ InternalStatus LoadScopeTilings(uint32_t base, uint16_t key_len, uint16_t value_len, const ScopeData &scope, Repo *repo);
78
+
79
+ private:
80
+ std::string GetDataFileFullPath(const std::string &db_name) const;
81
+ InternalStatus InitData();
82
+ InternalStatus ReadTilingData(TilingData *tiling_data);
83
+ InternalStatus ReadScopeData(TilingData *tiling_data);
84
+
85
+ std::string db_file_;
86
+ bool is_full_;
87
+ int f_{-1};
88
+ size_t memory_size_{0};
89
+ char *data_{nullptr};
90
+ };
91
+
92
+ using KeyScope = std::pair<int, int>;
93
+
94
+ class TilingRepo {
95
+ public:
96
+ TilingRepo(const TilingRepo &flags) = delete;
97
+ TilingRepo(TilingRepo &&flags) = delete;
98
+ TilingRepo &operator=(const TilingRepo &flags) = delete;
99
+ TilingRepo &operator=(TilingRepo &&flags) = delete;
100
+ ~TilingRepo() = default;
101
+
102
+ static TilingRepo &Instance();
103
+ void Register(const std::string &name, const std::string &db_name);
104
+ InternalStatus GetTiling(const std::string &name, const std::vector<uint16_t> &types, const std::vector<int> &key,
105
+ std::vector<int> *out,
106
+ const std::function<KeyScope(const std::vector<int> &)> &gen_scope_func = nullptr);
107
+ using LoadRecord = std::unordered_map<std::vector<uint16_t>, std::vector<KeyScope>, ArrayHasher<uint16_t>>;
108
+
109
+ private:
110
+ TilingRepo() = default;
111
+ bool IsRegistered(const std::string &name) const;
112
+ std::vector<int> Get(const std::string &name, const std::vector<uint16_t> &types, const std::vector<int> &key) const;
113
+ InternalStatus LoadScopeData(const std::string &name, const std::vector<uint16_t> &types,
114
+ const KeyScope &scope = std::make_pair(0, 0));
115
+
116
+ std::unordered_map<std::string, size_t> name_idx_map_;
117
+ std::unordered_map<std::string, size_t> db_name_idx_map_;
118
+ std::vector<std::string> db_names_;
119
+ std::vector<TilingData> tiling_datas_;
120
+ std::vector<RepoMap> repo_maps_;
121
+ std::vector<LoadRecord> loaded_;
122
+ };
123
+
124
+ class TilingDBLoad {
125
+ public:
126
+ TilingDBLoad(const std::string &op_name, const std::string &db_name) {
127
+ TilingRepo::Instance().Register(op_name, db_name);
128
+ }
129
+ };
130
+
131
+ struct RuningInfo {
132
+ internal::ShapeInfoList input_shapes;
133
+ internal::InputsImmutableInfoList input_infos;
134
+ internal::ShapeInfoList output_shapes;
135
+ internal::InputsImmutableInfoList output_infos;
136
+ };
137
+
138
+ class Tunable {
139
+ public:
140
+ Tunable() = default;
141
+ virtual ~Tunable() = default;
142
+ virtual InternalOpPtr CreateOpByKey(const std::vector<int64_t> &key) = 0;
143
+ virtual RuningInfo GetRuningInfo(const std::vector<int64_t> &key) const = 0;
144
+ };
145
+ using TunablePtr = std::shared_ptr<Tunable>;
146
+
147
+ using TunableCreator = std::function<TunablePtr()>;
148
+ class TunableBuilder {
149
+ public:
150
+ ~TunableBuilder() = default;
151
+ TunableBuilder(const TunableBuilder &) = delete;
152
+ TunableBuilder &operator=(const TunableBuilder &) = delete;
153
+ static TunableBuilder &Instance();
154
+
155
+ void Register(const std::string &op_name, TunableCreator &&creator);
156
+ TunablePtr Create(const std::string &op_name) const;
157
+
158
+ private:
159
+ TunableBuilder() = default;
160
+ std::unordered_map<std::string, TunableCreator> tunable_creators_;
161
+ };
162
+
163
+ class TuneRegister {
164
+ public:
165
+ TuneRegister(const std::string &op_name, TunableCreator creator) noexcept {
166
+ TunableBuilder::Instance().Register(op_name, std::move(creator));
167
+ }
168
+ ~TuneRegister() = default;
169
+ };
170
+
171
+ #define REG_OP_TUNABLE(op_name, TargetClass) \
172
+ static_assert(std::is_base_of<Tunable, TargetClass>::value, #TargetClass " must be derived from Tunable!"); \
173
+ static const TuneRegister g_##op_name##_tunable_reg(#op_name, \
174
+ []() -> TunablePtr { return std::make_shared<TargetClass>(); })
175
+ } // namespace internal
176
+ } // namespace mindspore
177
+
178
+ #endif // MS_KERNELS_INTERNAL_KERNEL_TILING_UTILS_H_