mindspore 2.4.10__cp39-cp39-manylinux1_x86_64.whl → 2.5.0__cp39-cp39-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (706)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-39-x86_64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-39-x86_64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-39-x86_64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +98 -21
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -3
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +31 -15
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +5 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +285 -191
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +1 -0
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  80. mindspore/experimental/llm_boost/register.py +1 -0
  81. mindspore/experimental/optim/adadelta.py +26 -22
  82. mindspore/experimental/optim/adam.py +3 -0
  83. mindspore/experimental/optim/lr_scheduler.py +33 -24
  84. mindspore/experimental/optim/radam.py +33 -30
  85. mindspore/hal/device.py +28 -0
  86. mindspore/hal/event.py +17 -0
  87. mindspore/hal/memory.py +94 -3
  88. mindspore/hal/stream.py +91 -6
  89. mindspore/include/api/context.h +0 -1
  90. mindspore/lib/libavcodec.so.59 +0 -0
  91. mindspore/lib/libavdevice.so.59 +0 -0
  92. mindspore/lib/libavfilter.so.8 +0 -0
  93. mindspore/lib/libavformat.so.59 +0 -0
  94. mindspore/lib/libavutil.so.57 +0 -0
  95. mindspore/lib/libdnnl.so.2 +0 -0
  96. mindspore/lib/libmindspore_backend.so +0 -0
  97. mindspore/lib/libmindspore_common.so +0 -0
  98. mindspore/lib/libmindspore_core.so +0 -0
  99. mindspore/lib/libmindspore_glog.so.0 +0 -0
  100. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  101. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  102. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  103. mindspore/lib/libmindspore_ops.so +0 -0
  104. mindspore/lib/libmpi_adapter.so +0 -0
  105. mindspore/lib/libmpi_collective.so +0 -0
  106. mindspore/lib/libnnacl.so +0 -0
  107. mindspore/lib/libopencv_core.so.4.5 +0 -0
  108. mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
  109. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  110. mindspore/lib/libps_cache.so +0 -0
  111. mindspore/lib/libswresample.so.4 +0 -0
  112. mindspore/lib/libswscale.so.6 +0 -0
  113. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  114. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  115. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  116. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  117. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/decoder_kv_cache.py +1 -1
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl/dynamic/prompt_kv_cache.py +1 -1
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/libcust_opmaster_rt2.0.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  121. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/x86_64/libcust_opsproto_rt2.0.so +0 -0
  122. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -1
  123. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/lib/libcust_opapi.so +0 -0
  124. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +224 -0
  125. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/all_finite.py +1 -1
  126. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +1 -1
  127. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +1 -1
  128. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  166. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  167. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/x86_64/libcust_opmaster_rt2.0.so +0 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  172. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/x86_64/libcust_opsproto_rt2.0.so +0 -0
  173. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -1
  174. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  175. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  176. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  177. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  178. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  179. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  180. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  181. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  182. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +960 -958
  183. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  184. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  185. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  186. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  187. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  188. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  189. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  190. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  191. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  192. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  193. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  194. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  195. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  196. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  197. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  198. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  199. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  200. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  201. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  202. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  203. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  204. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  205. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  206. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  207. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  208. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  209. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  210. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  211. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  212. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  213. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  214. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  215. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  216. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  217. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  218. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  219. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  220. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  221. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  222. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  223. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  224. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  225. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  226. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  227. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  228. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  229. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  230. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  231. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  232. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  233. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  234. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  235. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  236. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  237. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  238. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  239. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  240. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  241. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  242. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  243. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  244. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  245. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  246. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  247. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  248. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  249. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  250. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so +0 -0
  251. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  252. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  253. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  254. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  255. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  256. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  257. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  258. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  259. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  260. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  261. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  262. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  263. mindspore/lib/plugin/gpu/libcuda_ops.so.10 +0 -0
  264. mindspore/lib/plugin/gpu/libcuda_ops.so.11 +0 -0
  265. mindspore/lib/plugin/gpu10.1/libnccl.so.2 +0 -0
  266. mindspore/lib/plugin/gpu10.1/libnvidia_collective.so +0 -0
  267. mindspore/lib/plugin/gpu11.1/libnccl.so.2 +0 -0
  268. mindspore/lib/plugin/gpu11.1/libnvidia_collective.so +0 -0
  269. mindspore/lib/plugin/gpu11.6/libnccl.so.2 +0 -0
  270. mindspore/lib/plugin/gpu11.6/libnvidia_collective.so +0 -0
  271. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  272. mindspore/lib/plugin/libmindspore_gpu.so.10.1 +0 -0
  273. mindspore/lib/plugin/libmindspore_gpu.so.11.1 +0 -0
  274. mindspore/lib/plugin/libmindspore_gpu.so.11.6 +0 -0
  275. mindspore/log.py +12 -0
  276. mindspore/mindrecord/__init__.py +1 -1
  277. mindspore/mindrecord/config.py +17 -316
  278. mindspore/mindrecord/filereader.py +1 -9
  279. mindspore/mindrecord/filewriter.py +5 -15
  280. mindspore/mindrecord/mindpage.py +1 -9
  281. mindspore/mint/__init__.py +824 -218
  282. mindspore/mint/distributed/__init__.py +66 -4
  283. mindspore/mint/distributed/distributed.py +2594 -44
  284. mindspore/mint/linalg/__init__.py +6 -0
  285. mindspore/mint/nn/__init__.py +473 -14
  286. mindspore/mint/nn/functional.py +486 -11
  287. mindspore/mint/nn/layer/__init__.py +17 -4
  288. mindspore/mint/nn/layer/_functions.py +330 -0
  289. mindspore/mint/nn/layer/activation.py +169 -1
  290. mindspore/mint/nn/layer/basic.py +123 -0
  291. mindspore/mint/nn/layer/conv.py +727 -0
  292. mindspore/mint/nn/layer/normalization.py +215 -19
  293. mindspore/mint/nn/layer/padding.py +797 -0
  294. mindspore/mint/nn/layer/pooling.py +170 -0
  295. mindspore/mint/optim/__init__.py +2 -1
  296. mindspore/mint/optim/adam.py +223 -0
  297. mindspore/mint/optim/adamw.py +26 -19
  298. mindspore/mint/special/__init__.py +2 -1
  299. mindspore/multiprocessing/__init__.py +5 -0
  300. mindspore/nn/cell.py +126 -19
  301. mindspore/nn/dynamic_lr.py +2 -1
  302. mindspore/nn/layer/activation.py +6 -6
  303. mindspore/nn/layer/basic.py +35 -25
  304. mindspore/nn/layer/channel_shuffle.py +3 -3
  305. mindspore/nn/layer/embedding.py +3 -3
  306. mindspore/nn/layer/normalization.py +8 -7
  307. mindspore/nn/layer/padding.py +4 -3
  308. mindspore/nn/layer/pooling.py +47 -13
  309. mindspore/nn/layer/rnn_cells.py +1 -1
  310. mindspore/nn/layer/rnns.py +2 -1
  311. mindspore/nn/layer/timedistributed.py +5 -5
  312. mindspore/nn/layer/transformer.py +48 -26
  313. mindspore/nn/learning_rate_schedule.py +5 -3
  314. mindspore/nn/loss/loss.py +31 -36
  315. mindspore/nn/optim/ada_grad.py +1 -0
  316. mindspore/nn/optim/adadelta.py +2 -2
  317. mindspore/nn/optim/adam.py +1 -1
  318. mindspore/nn/optim/lars.py +1 -4
  319. mindspore/nn/optim/optimizer.py +1 -1
  320. mindspore/nn/optim/rprop.py +2 -2
  321. mindspore/nn/optim/thor.py +2 -1
  322. mindspore/nn/utils/init.py +13 -11
  323. mindspore/nn/wrap/cell_wrapper.py +4 -6
  324. mindspore/nn/wrap/loss_scale.py +3 -4
  325. mindspore/numpy/array_creations.py +60 -62
  326. mindspore/numpy/array_ops.py +148 -143
  327. mindspore/numpy/logic_ops.py +41 -42
  328. mindspore/numpy/math_ops.py +361 -359
  329. mindspore/numpy/utils.py +16 -16
  330. mindspore/numpy/utils_const.py +4 -4
  331. mindspore/ops/__init__.py +2 -1
  332. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  333. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  334. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  335. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  336. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  337. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  338. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  339. mindspore/ops/_vmap/vmap_base.py +0 -2
  340. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  341. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  342. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  343. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  344. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  345. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  346. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  347. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  348. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  349. mindspore/ops/composite/base.py +1 -1
  350. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  351. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  352. mindspore/ops/function/__init__.py +12 -0
  353. mindspore/ops/function/array_func.py +561 -159
  354. mindspore/ops/function/clip_func.py +64 -0
  355. mindspore/ops/function/debug_func.py +28 -20
  356. mindspore/ops/function/image_func.py +1 -1
  357. mindspore/ops/function/linalg_func.py +5 -4
  358. mindspore/ops/function/math_func.py +1659 -290
  359. mindspore/ops/function/nn_func.py +988 -317
  360. mindspore/ops/function/parameter_func.py +3 -56
  361. mindspore/ops/function/random_func.py +243 -33
  362. mindspore/ops/function/sparse_unary_func.py +1 -1
  363. mindspore/ops/functional.py +18 -5
  364. mindspore/ops/functional_overload.py +897 -0
  365. mindspore/ops/operations/__init__.py +3 -2
  366. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  367. mindspore/ops/operations/_grad_ops.py +2 -34
  368. mindspore/ops/operations/_infer_ops.py +2 -1
  369. mindspore/ops/operations/_inner_ops.py +38 -8
  370. mindspore/ops/operations/array_ops.py +45 -303
  371. mindspore/ops/operations/comm_ops.py +19 -16
  372. mindspore/ops/operations/custom_ops.py +11 -55
  373. mindspore/ops/operations/debug_ops.py +42 -47
  374. mindspore/ops/operations/inner_ops.py +6 -4
  375. mindspore/ops/operations/linalg_ops.py +3 -2
  376. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  377. mindspore/ops/operations/math_ops.py +11 -216
  378. mindspore/ops/operations/nn_ops.py +146 -308
  379. mindspore/ops/primitive.py +23 -21
  380. mindspore/ops/tensor_method.py +1669 -0
  381. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  382. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  383. mindspore/ops_generate/arg_handler.py +0 -61
  384. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  385. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  386. mindspore/ops_generate/base_generator.py +11 -0
  387. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  388. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  389. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  390. mindspore/ops_generate/functions_cc_generator.py +233 -0
  391. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  392. mindspore/ops_generate/gen_constants.py +157 -3
  393. mindspore/ops_generate/gen_ops.py +245 -990
  394. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  395. mindspore/ops_generate/gen_utils.py +119 -33
  396. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  397. mindspore/ops_generate/op_api_proto.py +206 -0
  398. mindspore/ops_generate/op_def_py_generator.py +131 -0
  399. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  400. mindspore/ops_generate/op_proto.py +373 -108
  401. mindspore/ops_generate/op_template_parser.py +436 -0
  402. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  403. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  404. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  405. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  406. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  407. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  408. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  409. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  410. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  411. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  412. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  413. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  414. mindspore/ops_generate/pyboost_utils.py +92 -33
  415. mindspore/ops_generate/template.py +294 -44
  416. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  417. mindspore/parallel/__init__.py +3 -3
  418. mindspore/parallel/_auto_parallel_context.py +24 -33
  419. mindspore/parallel/_parallel_serialization.py +13 -2
  420. mindspore/parallel/_utils.py +4 -1
  421. mindspore/parallel/algo_parameter_config.py +1 -1
  422. mindspore/parallel/checkpoint_transform.py +44 -0
  423. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  424. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  425. mindspore/parallel/cluster/run.py +20 -3
  426. mindspore/parallel/parameter_broadcast.py +1 -1
  427. mindspore/parallel/shard.py +3 -0
  428. mindspore/parallel/transform_safetensors.py +119 -253
  429. mindspore/profiler/__init__.py +17 -4
  430. mindspore/profiler/analysis/__init__.py +0 -0
  431. mindspore/profiler/analysis/parser/__init__.py +0 -0
  432. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  433. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  434. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  435. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  436. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  437. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  438. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  439. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  440. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  441. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  442. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  443. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  444. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  445. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  446. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  447. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  448. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  449. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  450. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  451. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  452. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  453. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  454. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  455. mindspore/profiler/analysis/task_manager.py +131 -0
  456. mindspore/profiler/analysis/time_converter.py +84 -0
  457. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  458. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  459. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  460. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  461. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  462. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  463. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  464. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  465. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  466. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  467. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  468. mindspore/profiler/analysis/work_flow.py +73 -0
  469. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  470. mindspore/profiler/common/command_executor.py +90 -0
  471. mindspore/profiler/common/constant.py +174 -3
  472. mindspore/profiler/common/file_manager.py +208 -0
  473. mindspore/profiler/common/log.py +130 -0
  474. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  475. mindspore/profiler/common/path_manager.py +371 -0
  476. mindspore/profiler/common/process_bar.py +168 -0
  477. mindspore/profiler/common/process_pool.py +9 -3
  478. mindspore/profiler/common/profiler_context.py +476 -0
  479. mindspore/profiler/common/profiler_info.py +304 -0
  480. mindspore/profiler/common/profiler_output_path.py +284 -0
  481. mindspore/profiler/common/profiler_parameters.py +210 -0
  482. mindspore/profiler/common/profiler_path_manager.py +120 -0
  483. mindspore/profiler/common/record_function.py +76 -0
  484. mindspore/profiler/common/tlv_decoder.py +76 -0
  485. mindspore/profiler/common/util.py +75 -2
  486. mindspore/profiler/dynamic_profiler.py +270 -37
  487. mindspore/profiler/envprofiler.py +138 -0
  488. mindspore/profiler/mstx.py +199 -0
  489. mindspore/profiler/platform/__init__.py +21 -0
  490. mindspore/profiler/platform/base_profiler.py +40 -0
  491. mindspore/profiler/platform/cpu_profiler.py +124 -0
  492. mindspore/profiler/platform/gpu_profiler.py +74 -0
  493. mindspore/profiler/platform/npu_profiler.py +309 -0
  494. mindspore/profiler/profiler.py +580 -93
  495. mindspore/profiler/profiler_action_controller.py +187 -0
  496. mindspore/profiler/profiler_interface.py +114 -0
  497. mindspore/profiler/schedule.py +208 -0
  498. mindspore/rewrite/api/symbol_tree.py +1 -2
  499. mindspore/run_check/_check_version.py +2 -6
  500. mindspore/runtime/__init__.py +37 -0
  501. mindspore/runtime/device.py +27 -0
  502. mindspore/runtime/event.py +209 -0
  503. mindspore/runtime/executor.py +148 -0
  504. mindspore/runtime/memory.py +392 -0
  505. mindspore/runtime/stream.py +460 -0
  506. mindspore/runtime/thread_bind_core.py +401 -0
  507. mindspore/train/__init__.py +2 -2
  508. mindspore/train/_utils.py +53 -18
  509. mindspore/train/amp.py +8 -4
  510. mindspore/train/callback/_checkpoint.py +32 -18
  511. mindspore/train/callback/_early_stop.py +1 -1
  512. mindspore/train/callback/_flops_collector.py +105 -69
  513. mindspore/train/callback/_history.py +1 -1
  514. mindspore/train/callback/_summary_collector.py +44 -6
  515. mindspore/train/callback/_tft_register.py +31 -10
  516. mindspore/train/dataset_helper.py +11 -11
  517. mindspore/train/metrics/precision.py +4 -5
  518. mindspore/train/mind_ir_pb2.py +167 -46
  519. mindspore/train/model.py +13 -15
  520. mindspore/train/serialization.py +462 -76
  521. mindspore/train/summary/summary_record.py +1 -2
  522. mindspore/train/train_thor/model_thor.py +1 -1
  523. mindspore/utils/__init__.py +4 -2
  524. mindspore/utils/bin/dataset-cache +0 -0
  525. mindspore/utils/bin/dataset-cache-server +0 -0
  526. mindspore/utils/dryrun.py +138 -0
  527. mindspore/utils/runtime_execution_order_check.py +550 -0
  528. mindspore/version.py +1 -1
  529. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  530. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +533 -467
  531. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  532. mindspore/_data_dump.cpython-39-x86_64-linux-gnu.so +0 -0
  533. mindspore/bin/cache_admin +0 -0
  534. mindspore/bin/cache_server +0 -0
  535. mindspore/common/_tensor_overload.py +0 -139
  536. mindspore/lib/libmindspore_np_dtype.so +0 -0
  537. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  538. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  539. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  540. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  541. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  542. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  543. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  544. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  545. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  546. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  547. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  548. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  549. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  550. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  551. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  552. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  553. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  554. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -97
  555. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  556. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  557. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  558. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  559. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  560. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  561. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  562. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  563. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  564. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  565. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  566. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  567. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  568. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  569. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  570. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  571. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  572. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  573. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  574. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  575. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  576. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  577. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  578. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  579. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  580. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  581. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  582. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  583. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  584. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  585. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  586. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  587. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  588. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  589. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  590. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  591. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  592. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  593. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  594. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  595. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  596. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  597. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  598. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  599. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  600. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  601. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  602. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  603. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  604. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  605. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  606. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  607. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  608. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  609. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  610. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  611. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  612. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  613. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  614. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  615. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  616. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  617. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  618. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  619. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  620. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  621. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  622. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  623. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  624. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  625. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  626. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  627. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  628. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  629. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  630. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  631. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  632. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  633. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  634. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  635. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  636. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  637. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  638. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  639. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  640. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  641. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  642. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  643. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  644. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  645. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  646. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  647. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  648. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  649. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  650. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  651. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  652. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  653. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  654. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  655. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  656. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  657. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  658. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  659. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  660. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  661. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  662. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  663. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  664. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  665. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  666. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  667. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  668. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  669. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  670. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  671. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_impl.so +0 -0
  672. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  673. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  674. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  685. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  686. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  687. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  688. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  689. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  690. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  691. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  692. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  693. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  694. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  695. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  696. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  697. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  698. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/matmul_add_rmsnorm/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  699. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  700. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  701. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  702. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  703. mindspore/profiler/envprofiling.py +0 -254
  704. mindspore/profiler/profiling.py +0 -1926
  705. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  706. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -14,16 +14,17 @@
14
14
  * limitations under the License.
15
15
  */
16
16
 
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ACME_BASE_TYPE_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ACME_BASE_TYPE_H_
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_BASE_TYPE_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_BASE_TYPE_H_
19
19
 
20
20
  #include <vector>
21
+ #include <unordered_set>
21
22
  #include <map>
22
23
  #include <cstdint>
23
24
  #include <memory>
24
25
 
25
26
  namespace mindspore {
26
- namespace acme {
27
+ namespace internal {
27
28
  using ShapeInfo = std::vector<int64_t>;
28
29
 
29
30
  enum DataType : int {
@@ -63,9 +64,9 @@ enum TensorFormat : int {
63
64
  kFormatFRACTAL_Z_3D
64
65
  };
65
66
 
66
- enum AcmeStatus {
67
- kAcmeOk = 0,
68
- kAcmeError,
67
+ enum InternalStatus {
68
+ kInternalOk = 0,
69
+ kInternalError,
69
70
  };
70
71
 
71
72
  class ArgImmutableInfo {
@@ -87,6 +88,19 @@ class ArgImmutableInfo {
87
88
  TensorFormat format_{TensorFormat::kFormatUnknown};
88
89
  };
89
90
 
91
+ inline size_t CountNumFromShape(const ShapeInfo &shape) {
92
+ if (shape.empty()) {
93
+ return 0;
94
+ }
95
+
96
+ size_t num = 1;
97
+ for (auto s : shape) {
98
+ num *= static_cast<size_t>(s);
99
+ }
100
+
101
+ return num;
102
+ }
103
+
90
104
  class ArgDesc {
91
105
  public:
92
106
  ArgDesc(const ArgImmutableInfo &arg_ii) : immutable_info_(arg_ii) {}
@@ -114,18 +128,7 @@ class ArgDesc {
114
128
 
115
129
  const ArgImmutableInfo &GetImmutableInfo() const { return immutable_info_; }
116
130
 
117
- inline size_t ElementNum() const {
118
- if (shape_.empty()) {
119
- return 0;
120
- }
121
-
122
- size_t num = 1;
123
- for (auto s : shape_) {
124
- num *= static_cast<size_t>(s);
125
- }
126
-
127
- return num;
128
- }
131
+ inline size_t ElementNum() const { return CountNumFromShape(shape_); }
129
132
 
130
133
  private:
131
134
  ShapeInfo shape_{0};
@@ -148,7 +151,9 @@ using ShapeInfoList = std::vector<ShapeInfo>;
148
151
 
149
152
  using InOutDtypesList = std::vector<std::vector<InputDataTypes>>;
150
153
  using InOutDtypesTargetMap = std::map<std::string, InOutDtypesList>;
151
- } // namespace acme
154
+
155
+ using InOutIndicesType = std::pair<std::unordered_set<size_t>, std::unordered_set<size_t>>;
156
+ } // namespace internal
152
157
  } // namespace mindspore
153
158
 
154
- #endif // MS_KERNELS_INTERNAL_KERNEL_ACME_BASE_TYPE_H_
159
+ #endif // MS_KERNELS_INTERNAL_KERNEL_BASE_TYPE_H_
@@ -14,9 +14,11 @@
14
14
  * limitations under the License.
15
15
  */
16
16
 
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_CAST_TILING_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_CAST_TILING_H_
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_INTERNAL_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_INTERNAL_H_
19
19
 
20
- #include "acme/src/ops/device_src/ascendc/cast/cast_tiling.h"
20
+ #include "include/op_param.h"
21
+ #include "include/op_creator.h"
22
+ #include "include/tiling_info.h"
21
23
 
22
- #endif
24
+ #endif // MS_KERNELS_INTERNAL_KERNEL_INTERNAL_H_
@@ -0,0 +1,114 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_INTERNAL_OP_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_INTERNAL_OP_H_
19
+
20
+ #include <vector>
21
+ #include <string>
22
+
23
+ #include "include/base_type.h"
24
+ #include "include/op_param.h"
25
+ #include "include/tiling_info.h"
26
+
27
+ namespace mindspore {
28
+ namespace internal {
29
+ enum OpType : int {
30
+ kOpTypeAICore = 0,
31
+ kOpTypeAICpu,
32
+ kOpTypeAIV,
33
+ kOpTypeWriteBack,
34
+ kOpTypeMixAIC,
35
+ kOpTypeMixAIV,
36
+ kOpTypeFFTSPlus,
37
+ kOpTypeDSA,
38
+ kOpTypeDVPP,
39
+ kOpTypeHCCL,
40
+ kOpTypeInvalid
41
+ };
42
+
43
+ class InternalOp {
44
+ public:
45
+ InternalOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
46
+ const std::string &op_name);
47
+ virtual ~InternalOp() = default;
48
+ InternalStatus Init();
49
+
50
+ virtual InternalStatus UpdateShape(const ShapeInfoList &inputs_shape, const ShapeInfoList &outputs_shape);
51
+ virtual InternalStatus UpdateParam(const void *) { return kInternalOk; }
52
+
53
+ virtual size_t GetTilingSize() const;
54
+ virtual std::vector<size_t> GetWorkspaceSize() const;
55
+
56
+ virtual void SetTilingInfo(const TilingInfoPtr &tiling_info);
57
+
58
+ virtual InternalStatus Launch(const InputsAddrList &input_ptrs, const OutputsAddrList &output_ptrs, const WsAddrList &ws_ptrs,
59
+ void *stream, const std::string &op_fullname = "");
60
+ virtual InternalStatus Tiling(RawHostAddr host_ptr, HostRunInfoPtr *run_info_ptr);
61
+ virtual std::string DumpTiling(const RawHostAddr host_ptr) const = 0;
62
+
63
+ virtual ShapeInfoList InferShape(const ShapeInfoList &inputs_shape) const = 0;
64
+
65
+ virtual InternalStatus TilingFromTuning(const RawDeviceAddr tiling_addr);
66
+ virtual bool IsSupported(const InputDataTypes &dtypes);
67
+
68
+ virtual std::string GetOpName() { return "Internal" + op_name_; };
69
+ std::string GetOpNameOrigin() { return op_name_; };
70
+ virtual uint32_t GetLaunchCoreNum() const { return host_run_info_comm_ptr_->block_dim_; };
71
+ virtual OpType GetOpType() = 0;
72
+
73
+ // ---- Ops DataBase related functions ----
74
+ // Version: Op implementation version(update when the unnegligible change happens)
75
+ virtual int64_t GetOpVersion() const { return 0; }
76
+ // DataBaseKey: Op information(which can rebuild this op without ambiguity)
77
+ virtual std::vector<int64_t> GetDataBaseKey() const { return std::vector<int64_t>{}; }
78
+ // Tiling
79
+ virtual std::vector<int64_t> GetCurrentTiling() const { return {}; }
80
+ virtual InternalStatus Tiling(const std::vector<int64_t> &tiling, RawHostAddr &tiling_addr,
81
+ HostRunInfoPtr *run_info_ptr) {
82
+ return kInternalError;
83
+ }
84
+ // ---- Ops DataBase related functions ----
85
+
86
+ protected:
87
+ virtual InternalStatus InitImpl();
88
+ virtual InternalStatus TilingImpl(RawHostAddr host_ptr, HostRunInfoPtr *run_info_ptr) = 0;
89
+ virtual InternalStatus LaunchImpl(const InputsAddrList &input_ptrs, const OutputsAddrList &output_ptrs,
90
+ const WsAddrList &ws_ptrs, void *stream) = 0;
91
+ void SetHostRunInfoComm(const HostRunInfoComm &, HostRunInfoPtr *);
92
+
93
+ InputsImmutableInfoList inputs_ii_;
94
+ OutputsImmutableInfoList outputs_ii_;
95
+ ShapeInfoList inputs_shape_;
96
+ ShapeInfoList outputs_shape_;
97
+ std::string op_name_{"UnknownOp"};
98
+ size_t tiling_size_{0};
99
+ std::vector<size_t> ws_size_;
100
+ RawDeviceAddr tiling_device_addr_{nullptr};
101
+ HostRunInfoCommPtr host_run_info_comm_ptr_{nullptr};
102
+
103
+ private:
104
+ virtual InternalStatus LaunchWithProfiling(const InputsAddrList &input_ptrs, const OutputsAddrList &output_ptrs,
105
+ const WsAddrList &ws_ptrs, void *stream, const std::string &op_fullname);
106
+ };
107
+
108
+ using InternalOpPtr = std::shared_ptr<InternalOp>;
109
+
110
+ short GetPlatformEnum(const std::string &soc_name);
111
+ } // namespace internal
112
+ } // namespace mindspore
113
+
114
+ #endif // MS_KERNELS_INTERNAL_KERNEL_INTERNAL_OP_H_
@@ -0,0 +1,70 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_BOOST_KERNEL_H_
17
+ #define MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_BOOST_KERNEL_H_
18
+ #include <memory>
19
+ #include <vector>
20
+ #include "include/llm/tensor.h"
21
+
22
+ namespace mindspore {
23
+ namespace internal {
24
+
25
+ struct BoostParam {};
26
+ struct RawBuf {
27
+ uint64_t size_{0};
28
+ void *addr_{nullptr};
29
+ };
30
+ using HostRawBuf = RawBuf;
31
+ using DeviceRawBuf = RawBuf;
32
+
33
+ using BoostParamPtr = std::shared_ptr<BoostParam>;
34
+
35
+ class BoostKernel {
36
+ public:
37
+ BoostKernel(const BoostParamPtr &param) : param_(param){};
38
+ virtual ~BoostKernel() {}
39
+ // this routine will check if this kernel can support the requirements
40
+ // specified in ValidationInfo.
41
+ virtual bool Init() = 0;
42
+ virtual void SetInputs(const std::vector<Tensor *> &inputs) { inputs_ = inputs; }
43
+ virtual void SetOutputs(const std::vector<Tensor *> &outputs) { outputs_ = outputs; }
44
+ virtual void SetWorkSpace(const std::vector<DeviceRawBuf> &workspace) { return; }
45
+ virtual void SetStream(const void *stream_ptr) { stream_ptr_ = const_cast<void *>(stream_ptr); }
46
+ virtual void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) = 0;
47
+ virtual int Launch() = 0;
48
+ virtual uint64_t GetTilingBufSize() = 0;
49
+ virtual int Tiling(HostRawBuf &tilingBuf) = 0;
50
+ virtual std::vector<uint64_t> GetWorkSpaceSize() = 0;
51
+ virtual int InferShape(const std::vector<TensorDesc> &inputs, std::vector<TensorDesc> &outputs) = 0;
52
+ virtual bool IsSupported() { return true; }
53
+
54
+ virtual std::vector<Tensor *> &get_inputs() { return inputs_; }
55
+ virtual std::vector<Tensor *> &get_outputs() { return outputs_; }
56
+
57
+ std::string get_name() { return kernel_name_; }
58
+ void set_name(std::string kernel_name) { kernel_name_ = kernel_name; }
59
+
60
+ protected:
61
+ std::string kernel_name_;
62
+ BoostParamPtr param_ = nullptr;
63
+ std::vector<Tensor *> inputs_;
64
+ std::vector<Tensor *> outputs_;
65
+ void *stream_ptr_ = nullptr;
66
+ };
67
+ using BoostKernelPtr = std::shared_ptr<BoostKernel>;
68
+ } // namespace internal
69
+ } // namespace mindspore
70
+ #endif // MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_BOOST_KERNEL_H_
@@ -0,0 +1,85 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_LLAMA_IMPL_H_
17
+ #define MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_LLAMA_IMPL_H_
18
+
19
+ #include <iostream>
20
+ #include <memory>
21
+ #include <string>
22
+ #include <vector>
23
+ #include "include/llm/boost_kernel.h"
24
+ #include "include/llm/model_interface.h"
25
+
26
+ namespace mindspore {
27
+ namespace internal {
28
+ struct OpLlamaModelParam : public BoostParam {
29
+ int batch_size_;
30
+ int seq_length_;
31
+ int head_num_;
32
+ int kv_head_num_;
33
+ int hidden_size_;
34
+ int num_layers_;
35
+ float ln_eps_;
36
+ int vocab_size_;
37
+ int multiple_of_;
38
+ int device_id_;
39
+ int device_num_;
40
+ bool paged_attention_ = false;
41
+ int64_t page_size_;
42
+ int page_num_;
43
+ int table_id_;
44
+ void *hcom_ = nullptr;
45
+ };
46
+
47
+ using OpLlamaModelParamPtr = std::shared_ptr<OpLlamaModelParam>;
48
+
49
+ class LlamaImpl : public BoostKernel, public ModelInterface {
50
+ public:
51
+ explicit LlamaImpl(const OpLlamaModelParamPtr param);
52
+ virtual ~LlamaImpl();
53
+ bool Init() override;
54
+ void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) override;
55
+ int Launch() override;
56
+ uint64_t GetTilingBufSize() override;
57
+ int Tiling(HostRawBuf &tilingBuf) override;
58
+ int InferShape(const std::vector<TensorDesc> &inputs, std::vector<TensorDesc> &outputs) override;
59
+ void PrintModel();
60
+ static int CreateDictFromCKPT(dict *dict, std::string name);
61
+ int AllocTable() override;
62
+ int FreeTable(int table_id) override;
63
+ bool AclInit();
64
+
65
+ private:
66
+ bool HcclInit();
67
+ bool AllocKVCacheTable();
68
+ bool BuildLlamaModel();
69
+ bool LlamaAllocateInnerTensors();
70
+ void *AllocateWs(size_t ws_size) override;
71
+ virtual std::vector<uint64_t> GetWorkSpaceSize() override;
72
+ bool SetupWorkspace() override;
73
+ void SetWorkSpace(const std::vector<DeviceRawBuf> &workspace) override;
74
+ int HandleDynamicInput();
75
+ int SetupInputTensors();
76
+
77
+ DeviceRawBuf tiling_buf_;
78
+
79
+ void *prefil_mode_dev_ = nullptr;
80
+ void *decode_mode_dev_ = nullptr;
81
+ size_t batch_ = 0;
82
+ };
83
+ } // namespace internal
84
+ } // namespace mindspore
85
+ #endif // MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_LLAMA_IMPL_H_
@@ -0,0 +1,52 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_MODEL_INTERFACE_H_
17
+ #define MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_MODEL_INTERFACE_H_
18
+
19
+ #include <map>
20
+ #include "include/llm/tensor.h"
21
+
22
+ namespace mindspore {
23
+ namespace internal {
24
+
25
+ using dict = std::map<std::string, Tensor *>;
26
+ class CacheMgr;
27
+ class Graph;
28
+
29
+ class ModelInterface {
30
+ public:
31
+ ModelInterface(int dev_id, int num_layers, int seq_len, int page_num, int page_size, int head_num,
32
+ int kv_head_num, int hidden_size);
33
+ virtual ~ModelInterface();
34
+ virtual int AllocTable() = 0;
35
+ virtual int FreeTable(int table_id) = 0;
36
+ virtual void *AllocateWs(size_t ws_size) = 0;
37
+ virtual bool SetupWorkspace() = 0;
38
+ void SetIsFIrstIter(bool is_first_iter) { is_first_iter_ = is_first_iter; }
39
+ void SetupWeights(dict *dict_weights) { dict_weights_ = dict_weights; }
40
+
41
+ protected:
42
+ Graph *graph_ = nullptr;
43
+ CacheMgr *cache_mgr_;
44
+ dict *dict_weights_ = nullptr;
45
+ bool is_first_iter_ = true;
46
+ void *workspace_addr_ = nullptr;
47
+ size_t workspace_size_ = 0;
48
+ static constexpr size_t max_ws_size_ = static_cast<size_t>(8000) * (1 << 20);
49
+ };
50
+ } // namespace internal
51
+ } // namespace mindspore
52
+ #endif // MS_KERNELS_INTERNAL_KERNEL_INCLUDE_LLM_MODEL_INTERFACE_H_
@@ -0,0 +1,81 @@
1
+ /**
2
+ * Copyright (c) Huawei Technologies Co., Ltd. 2023. All rights reserved.
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_SRC_OPS_LLAMA_TENSOR_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_SRC_OPS_LLAMA_TENSOR_H_
19
+ #include <vector>
20
+ #include <map>
21
+ #include <limits>
22
+ #include <iostream>
23
+ #include "include/base_type.h"
24
+
25
+ using DIMS = std::vector<int64_t>;
26
+ namespace mindspore::internal {
27
+ constexpr size_t HALF_DATA_SIZE = 2;
28
+ enum TensorDType : int {
29
+ TENSOR_DTYPE_UNDEFINED = -1,
30
+ TENSOR_DTYPE_FLOAT = 0,
31
+ TENSOR_DTYPE_FLOAT16 = 1,
32
+ TENSOR_DTYPE_INT8 = 2,
33
+ TENSOR_DTYPE_INT32 = 3,
34
+ TENSOR_DTYPE_UINT8 = 4,
35
+ TENSOR_DTYPE_INT16 = 6,
36
+ TENSOR_DTYPE_UINT16 = 7,
37
+ TENSOR_DTYPE_UINT32 = 8,
38
+ TENSOR_DTYPE_INT64 = 9,
39
+ TENSOR_DTYPE_UINT64 = 10,
40
+ TENSOR_DTYPE_DOUBLE = 11,
41
+ TENSOR_DTYPE_BOOL = 12,
42
+ TENSOR_DTYPE_STRING = 13,
43
+ TENSOR_DTYPE_COMPLEX64 = 16,
44
+ TENSOR_DTYPE_COMPLEX128 = 17,
45
+ TENSOR_DTYPE_BF16 = 27
46
+ };
47
+
48
+ static const std::map<TensorDType, size_t> MAP_OF_DTYPE_SIZE = {{TensorDType::TENSOR_DTYPE_UNDEFINED, 0},
49
+ {TensorDType::TENSOR_DTYPE_FLOAT, sizeof(float)},
50
+ {TensorDType::TENSOR_DTYPE_FLOAT16, HALF_DATA_SIZE},
51
+ {TensorDType::TENSOR_DTYPE_INT8, sizeof(int8_t)},
52
+ {TensorDType::TENSOR_DTYPE_INT32, sizeof(int32_t)},
53
+ {TensorDType::TENSOR_DTYPE_UINT8, sizeof(uint8_t)},
54
+ {TensorDType::TENSOR_DTYPE_INT16, sizeof(int16_t)},
55
+ {TensorDType::TENSOR_DTYPE_UINT16, sizeof(uint16_t)},
56
+ {TensorDType::TENSOR_DTYPE_UINT32, sizeof(uint32_t)},
57
+ {TensorDType::TENSOR_DTYPE_INT64, sizeof(int64_t)},
58
+ {TensorDType::TENSOR_DTYPE_UINT64, sizeof(uint64_t)},
59
+ {TensorDType::TENSOR_DTYPE_DOUBLE, sizeof(double)},
60
+ {TensorDType::TENSOR_DTYPE_BOOL, sizeof(bool)},
61
+ {TensorDType::TENSOR_DTYPE_BF16, HALF_DATA_SIZE}};
62
+
63
+ struct TensorDesc {
64
+ TensorDType dtype = TENSOR_DTYPE_UNDEFINED;
65
+ TensorFormat format = TensorFormat::kFormatUnknown;
66
+ DIMS dims;
67
+ int64_t Numel() const;
68
+ };
69
+
70
+ struct Tensor {
71
+ TensorDesc desc;
72
+ void *data = nullptr;
73
+ void *hostData = nullptr;
74
+ size_t dataSize = 0;
75
+ int64_t Numel() const;
76
+ };
77
+
78
+ size_t GetTensorElementSize(const TensorDType dtype);
79
+
80
+ } // namespace mindspore::internal
81
+ #endif // MS_KERNELS_INTERNAL_KERNEL_SRC_OPS_LLAMA_TENSOR_H_
@@ -0,0 +1,123 @@
1
+ /**
2
+ * Copyright 2024 Huawei Technologies Co., Ltd
3
+ *
4
+ * Licensed under the Apache License, Version 2.0 (the "License");
5
+ * you may not use this file except in compliance with the License.
6
+ * You may obtain a copy of the License at
7
+ *
8
+ * http://www.apache.org/licenses/LICENSE-2.0
9
+ *
10
+ * Unless required by applicable law or agreed to in writing, software
11
+ * distributed under the License is distributed on an "AS IS" BASIS,
12
+ * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ * See the License for the specific language governing permissions and
14
+ * limitations under the License.
15
+ */
16
+
17
+ #ifndef MS_KERNELS_INTERNAL_KERNEL_OP_CREATOR_H_
18
+ #define MS_KERNELS_INTERNAL_KERNEL_OP_CREATOR_H_
19
+
20
+ #include "include/internal_op.h"
21
+ #include "include/op_param.h"
22
+
23
+ namespace mindspore {
24
+ namespace internal {
25
+ InternalOpPtr CreateMatmulOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
26
+ const MatmulParam &param, const std::string &op_name);
27
+ InternalOpPtr CreateAddOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
28
+ const std::string &op_name);
29
+ InternalOpPtr CreateAddLayerNormOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
30
+ const NormParam &param, const std::string &op_name);
31
+ InternalOpPtr CreateAddRmsNormDynamicQuantOp(const InputsImmutableInfoList &inputs_ii,
32
+ const OutputsImmutableInfoList &outputs_ii, const NormParam &param,
33
+ const std::string &op_name);
34
+ InternalOpPtr CreateAddRmsNormQuantOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
35
+ const NormParam &param, const std::string &op_name);
36
+ InternalOpPtr CreateCastOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
37
+ const std::string &op_name);
38
+ InternalOpPtr CreateTransposeOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
39
+ const TransposeParam &param, const std::string &op_name);
40
+ InternalOpPtr CreateQuantPerChannelOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
41
+ const std::string &op_name);
42
+ InternalOpPtr CreateSwishOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
43
+ const std::string &op_name);
44
+ InternalOpPtr CreateSwiGLUOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
45
+ const SwiGLUParam &param, const std::string &op_name);
46
+ InternalOpPtr CreateLogicalNotOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
47
+ const std::string &op_name);
48
+ InternalOpPtr CreateSoftmaxOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
49
+ const SoftmaxParam &param, const std::string &op_name);
50
+ InternalOpPtr CreateReduceSumOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
51
+ const ReduceSumParam &param, const std::string &op_name);
52
+ InternalOpPtr CreateGatherOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
53
+ const GatherParam &param, const std::string &op_name);
54
+ InternalOpPtr CreateApplyRotaryPosEmbOp(const InputsImmutableInfoList &inputs_ii,
55
+ const OutputsImmutableInfoList &outputs_ii, const ApplyRotaryPosEmbParam &param,
56
+ const std::string &op_name);
57
+ InternalOpPtr CreateApplyRotaryPosEmbNzOp(const InputsImmutableInfoList &inputs_ii,
58
+ const OutputsImmutableInfoList &outputs_ii, const ApplyRotaryPosEmbParam &param,
59
+ const std::string &op_name);
60
+ InternalOpPtr CreateRmsNormOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
61
+ const NormParam &param, const std::string &op_name);
62
+ InternalOpPtr CreateMatmulAddRmsNormOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
63
+ const MatmulAddRmsNormParam &param, const std::string &op_name);
64
+ InternalOpPtr CreateMultiWeightMatmulOp(const InputsImmutableInfoList &inputs_ii,
65
+ const OutputsImmutableInfoList &outputs_ii, const MultiWeightMatmulParam &param,
66
+ const std::string &op_name);
67
+ // param section 0
68
+ InternalOpPtr CreateGeLUOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
69
+ const std::string &op_name);
70
+ InternalOpPtr CreateAddRmsNormOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
71
+ const NormParam &param, const std::string &op_name);
72
+ InternalOpPtr CreateFlashAttentionScoreOp(const InputsImmutableInfoList &inputs_ii,
73
+ const OutputsImmutableInfoList &outputs_ii, const FlashAttentionScoreParam &param,
74
+ const std::string &op_name);
75
+ InternalOpPtr CreatePagedAttentionOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
76
+ const PagedAttentionParam &param, const std::string &op_name);
77
+ // param section 1
78
+ InternalOpPtr CreateReshapeAndCacheOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
79
+ const std::string &op_name);
80
+ InternalOpPtr CreateReshapeAndCacheNzOp(const InputsImmutableInfoList &inputs_ii,
81
+ const OutputsImmutableInfoList &outputs_ii, const std::string &op_name);
82
+ InternalOpPtr CreateMulOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
83
+ const std::string &op_name);
84
+ InternalOpPtr CreateSubOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
85
+ const std::string &op_name);
86
+ InternalOpPtr CreateRealDivOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
87
+ const std::string &op_name);
88
+
89
+ // param section 2
90
+ InternalOpPtr CreateFastGeLUOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
91
+ const std::string &op_name);
92
+ InternalOpPtr CreateTransDataOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
93
+ const TransDataParam &param, const std::string &op_name);
94
+ InternalOpPtr CreateQuantLinearSparseOp(const InputsImmutableInfoList &inputs_ii,
95
+ const OutputsImmutableInfoList &outputs_ii, const std::string &op_name);
96
+ InternalOpPtr CreateTssAddLayerNormOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
97
+ const std::string &op_name);
98
+ // param section 3
99
+ InternalOpPtr CreateLessOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
100
+ const std::string &op_name);
101
+ InternalOpPtr CreateEqualOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
102
+ const std::string &op_name);
103
+ InternalOpPtr CreateNotEqualOp(const InputsImmutableInfoList &inputs_ii, const OutputsImmutableInfoList &outputs_ii,
104
+ const std::string &op_name);
105
+ // param section 4
106
+
107
+ // param section 5
108
+
109
+ // param section 6
110
+
111
+ // param section 7
112
+
113
+ // param section 8
114
+
115
+ // param section 9
116
+
117
+ // param section 10
118
+
119
+ bool IsInternalKernelDtypesSupported(const std::string op_name, InputDataTypes in_dtypes, InputDataTypes out_dtypes);
120
+ } // namespace internal
121
+ } // namespace mindspore
122
+
123
+ #endif // MS_KERNELS_INTERNAL_KERNEL_OP_CREATOR_H_