mindspore 2.4.1__cp39-none-any.whl → 2.5.0__cp39-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (847)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-39-aarch64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-39-aarch64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-39-aarch64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +99 -25
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -1
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +30 -27
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +10 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +292 -193
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +28 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +125 -65
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +3 -2
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +239 -64
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +52 -30
  80. mindspore/experimental/llm_boost/atb/qwen_boost.py +47 -24
  81. mindspore/experimental/llm_boost/register.py +1 -0
  82. mindspore/experimental/optim/adadelta.py +26 -22
  83. mindspore/experimental/optim/adam.py +3 -0
  84. mindspore/experimental/optim/lr_scheduler.py +33 -24
  85. mindspore/experimental/optim/radam.py +33 -30
  86. mindspore/hal/device.py +28 -0
  87. mindspore/hal/event.py +17 -0
  88. mindspore/hal/memory.py +94 -3
  89. mindspore/hal/stream.py +91 -6
  90. mindspore/include/api/context.h +1 -2
  91. mindspore/include/dataset/constants.h +2 -2
  92. mindspore/lib/libavcodec.so.59 +0 -0
  93. mindspore/lib/libavdevice.so.59 +0 -0
  94. mindspore/lib/libavfilter.so.8 +0 -0
  95. mindspore/lib/libavformat.so.59 +0 -0
  96. mindspore/lib/libavutil.so.57 +0 -0
  97. mindspore/lib/libdnnl.so.2 +0 -0
  98. mindspore/lib/libmindspore_backend.so +0 -0
  99. mindspore/lib/libmindspore_common.so +0 -0
  100. mindspore/lib/libmindspore_core.so +0 -0
  101. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  102. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  103. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  104. mindspore/lib/libmindspore_ops.so +0 -0
  105. mindspore/lib/libmpi_adapter.so +0 -0
  106. mindspore/lib/libmpi_collective.so +0 -0
  107. mindspore/lib/libnnacl.so +0 -0
  108. mindspore/lib/libopencv_core.so.4.5 +0 -0
  109. mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
  110. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  111. mindspore/lib/libps_cache.so +0 -0
  112. mindspore/lib/libswresample.so.4 +0 -0
  113. mindspore/lib/libswscale.so.6 +0 -0
  114. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  115. mindspore/lib/plugin/ascend/custom_aicore_ops/op_proto/libop_proto.so +0 -0
  116. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  117. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/framework/npu_supported_ops.json +10 -0
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json +182 -0
  121. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/decoder_kv_cache.py +51 -16
  122. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/prompt_kv_cache.py +51 -16
  123. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +158 -0
  124. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  125. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +158 -0
  126. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  127. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +158 -0
  128. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +158 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +158 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +158 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +158 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +158 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +167 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +167 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +167 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +167 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +167 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +167 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +167 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +167 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/config/ascend910/binary_info_config.json +302 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/config/ascend910/decoder_kv_cache.json +892 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/config/ascend910/prompt_kv_cache.json +892 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/inc/op_proto.h +33 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/framework/npu_supported_ops.json +14 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/include/aclnn_decoder_kv_cache.h +59 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/include/aclnn_prompt_kv_cache.h +59 -0
  166. mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_api/lib/libcust_opapi.so +0 -0
  167. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl}/dynamic/all_finite.py +51 -16
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.cpp +192 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +215 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.cpp +274 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +215 -0
  172. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +80 -0
  173. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  174. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +80 -0
  175. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  176. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +80 -0
  177. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  178. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +158 -0
  179. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  180. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +158 -0
  181. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  182. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +158 -0
  183. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  184. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +158 -0
  185. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  186. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +158 -0
  187. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  188. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +158 -0
  189. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  190. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +158 -0
  191. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  192. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +158 -0
  193. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  194. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +167 -0
  195. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  196. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +167 -0
  197. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  198. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +167 -0
  199. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  200. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +167 -0
  201. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  202. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +167 -0
  203. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  204. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +167 -0
  205. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  206. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +167 -0
  207. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  208. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +167 -0
  209. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  210. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  211. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_86a73ff6e28d734c96bb8d3054f7dd18.o → custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o} +0 -0
  212. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  213. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_f55e0ebaad1f2f572e43677336992fa0.o → custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o} +0 -0
  214. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  215. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_576ceaeef5870c451cab59af55ea46ad.o → custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o} +0 -0
  216. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  217. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  218. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  219. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  220. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  221. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  222. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  223. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  224. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  225. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  226. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  227. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  228. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  229. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  230. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  231. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  232. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  233. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  234. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  235. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  236. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  237. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  238. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  239. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  240. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  241. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  242. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  243. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  244. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  245. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  246. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  247. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  248. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  249. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  250. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  251. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  252. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  253. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  254. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  255. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  256. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  257. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  258. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  259. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  260. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  261. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  262. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  263. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  264. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  265. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  266. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  267. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  268. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  269. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  270. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  271. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  272. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  273. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  274. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  275. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  276. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  277. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  278. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  279. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  280. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  281. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  282. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  283. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  284. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  285. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  286. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/all_finite.json +139 -0
  287. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/binary_info_config.json +361 -0
  288. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/decoder_kv_cache.json +892 -0
  289. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/prompt_kv_cache.json +892 -0
  290. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  291. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  292. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  293. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  294. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/all_finite.json +139 -0
  295. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/binary_info_config.json +361 -0
  296. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/decoder_kv_cache.json +892 -0
  297. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/prompt_kv_cache.json +892 -0
  298. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  299. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  300. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  301. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -0
  302. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  303. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  304. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  305. mindspore/lib/plugin/ascend/libhccl_plugin.so +0 -0
  306. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  307. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  308. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  309. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  310. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  311. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/bin/PkgInspect +0 -0
  312. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/bin/op_man +0 -0
  313. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +957 -955
  314. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/host/libasdops_cann_host.so +0 -0
  315. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/host/libasdops_host.so +0 -0
  316. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops.so +0 -0
  317. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops_static.a +0 -0
  318. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/liblcal_static.a +0 -0
  319. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  320. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  321. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  322. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  323. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  324. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  325. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  326. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  327. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  328. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  329. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  330. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  331. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  332. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  333. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  334. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  335. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  336. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  337. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  338. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  339. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  340. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  341. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  342. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  343. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  344. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  345. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  346. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  347. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  348. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  349. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  350. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  351. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  352. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  353. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  354. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  355. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  356. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  357. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  358. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  359. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  360. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  361. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  362. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  363. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  364. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  365. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  366. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  367. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  368. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  369. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  370. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  371. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  372. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  373. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  374. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  375. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  376. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  377. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  378. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  379. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  380. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  381. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  382. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  383. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  384. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  385. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  386. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_layer_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so} +0 -0
  387. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  388. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  389. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  390. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  391. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  392. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  393. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  394. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  395. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  396. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  397. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  398. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  399. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  400. mindspore/log.py +12 -0
  401. mindspore/mindrecord/__init__.py +1 -1
  402. mindspore/mindrecord/config.py +17 -316
  403. mindspore/mindrecord/filereader.py +1 -9
  404. mindspore/mindrecord/filewriter.py +5 -15
  405. mindspore/mindrecord/mindpage.py +1 -9
  406. mindspore/mint/__init__.py +824 -218
  407. mindspore/mint/distributed/__init__.py +66 -4
  408. mindspore/mint/distributed/distributed.py +2594 -44
  409. mindspore/mint/linalg/__init__.py +6 -0
  410. mindspore/mint/nn/__init__.py +473 -14
  411. mindspore/mint/nn/functional.py +486 -11
  412. mindspore/mint/nn/layer/__init__.py +17 -4
  413. mindspore/mint/nn/layer/_functions.py +330 -0
  414. mindspore/mint/nn/layer/activation.py +169 -1
  415. mindspore/mint/nn/layer/basic.py +123 -0
  416. mindspore/mint/nn/layer/conv.py +727 -0
  417. mindspore/mint/nn/layer/normalization.py +215 -19
  418. mindspore/mint/nn/layer/padding.py +797 -0
  419. mindspore/mint/nn/layer/pooling.py +170 -0
  420. mindspore/mint/optim/__init__.py +2 -1
  421. mindspore/mint/optim/adam.py +223 -0
  422. mindspore/mint/optim/adamw.py +26 -19
  423. mindspore/mint/special/__init__.py +2 -1
  424. mindspore/multiprocessing/__init__.py +5 -0
  425. mindspore/nn/__init__.py +2 -0
  426. mindspore/nn/cell.py +142 -21
  427. mindspore/nn/dynamic_lr.py +2 -1
  428. mindspore/nn/layer/activation.py +6 -6
  429. mindspore/nn/layer/basic.py +35 -25
  430. mindspore/nn/layer/channel_shuffle.py +3 -3
  431. mindspore/nn/layer/conv.py +3 -0
  432. mindspore/nn/layer/embedding.py +3 -3
  433. mindspore/nn/layer/normalization.py +8 -7
  434. mindspore/nn/layer/padding.py +4 -3
  435. mindspore/nn/layer/pooling.py +55 -23
  436. mindspore/nn/layer/rnn_cells.py +1 -1
  437. mindspore/nn/layer/rnns.py +2 -1
  438. mindspore/nn/layer/timedistributed.py +5 -5
  439. mindspore/nn/layer/transformer.py +48 -26
  440. mindspore/nn/learning_rate_schedule.py +5 -3
  441. mindspore/nn/loss/loss.py +31 -36
  442. mindspore/nn/optim/ada_grad.py +1 -0
  443. mindspore/nn/optim/adadelta.py +2 -2
  444. mindspore/nn/optim/adam.py +1 -1
  445. mindspore/nn/optim/lars.py +1 -4
  446. mindspore/nn/optim/optimizer.py +1 -1
  447. mindspore/nn/optim/rprop.py +2 -2
  448. mindspore/nn/optim/thor.py +2 -1
  449. mindspore/nn/utils/__init__.py +22 -0
  450. mindspore/nn/utils/init.py +73 -0
  451. mindspore/nn/wrap/cell_wrapper.py +4 -6
  452. mindspore/nn/wrap/loss_scale.py +3 -4
  453. mindspore/numpy/array_creations.py +60 -62
  454. mindspore/numpy/array_ops.py +148 -143
  455. mindspore/numpy/logic_ops.py +41 -42
  456. mindspore/numpy/math_ops.py +361 -359
  457. mindspore/numpy/utils.py +16 -16
  458. mindspore/numpy/utils_const.py +4 -4
  459. mindspore/ops/__init__.py +2 -1
  460. mindspore/ops/_grad_experimental/grad_comm_ops.py +107 -8
  461. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  462. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  463. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  464. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  465. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  466. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  467. mindspore/ops/_vmap/vmap_base.py +0 -2
  468. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  469. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  470. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  471. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  472. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  473. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  474. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  475. mindspore/ops/auto_generate/gen_ops_prim.py +8027 -3411
  476. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  477. mindspore/ops/composite/base.py +1 -1
  478. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  479. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  480. mindspore/ops/function/__init__.py +12 -0
  481. mindspore/ops/function/array_func.py +561 -159
  482. mindspore/ops/function/clip_func.py +64 -0
  483. mindspore/ops/function/debug_func.py +28 -20
  484. mindspore/ops/function/image_func.py +1 -1
  485. mindspore/ops/function/linalg_func.py +5 -4
  486. mindspore/ops/function/math_func.py +1664 -294
  487. mindspore/ops/function/nn_func.py +988 -317
  488. mindspore/ops/function/parameter_func.py +3 -56
  489. mindspore/ops/function/random_func.py +243 -33
  490. mindspore/ops/function/sparse_unary_func.py +1 -1
  491. mindspore/ops/functional.py +18 -5
  492. mindspore/ops/functional_overload.py +897 -0
  493. mindspore/ops/operations/__init__.py +3 -2
  494. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  495. mindspore/ops/operations/_grad_ops.py +2 -34
  496. mindspore/ops/operations/_infer_ops.py +2 -1
  497. mindspore/ops/operations/_inner_ops.py +38 -8
  498. mindspore/ops/operations/array_ops.py +45 -303
  499. mindspore/ops/operations/comm_ops.py +23 -17
  500. mindspore/ops/operations/custom_ops.py +7 -49
  501. mindspore/ops/operations/debug_ops.py +42 -47
  502. mindspore/ops/operations/inner_ops.py +6 -4
  503. mindspore/ops/operations/linalg_ops.py +3 -2
  504. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  505. mindspore/ops/operations/math_ops.py +11 -216
  506. mindspore/ops/operations/nn_ops.py +153 -310
  507. mindspore/ops/primitive.py +23 -21
  508. mindspore/ops/tensor_method.py +1669 -0
  509. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  510. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  511. mindspore/ops_generate/arg_handler.py +0 -61
  512. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  513. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  514. mindspore/ops_generate/base_generator.py +11 -0
  515. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  516. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  517. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  518. mindspore/ops_generate/functions_cc_generator.py +233 -0
  519. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  520. mindspore/ops_generate/gen_constants.py +157 -3
  521. mindspore/ops_generate/gen_ops.py +245 -990
  522. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  523. mindspore/ops_generate/gen_utils.py +119 -33
  524. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  525. mindspore/ops_generate/op_api_proto.py +206 -0
  526. mindspore/ops_generate/op_def_py_generator.py +131 -0
  527. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  528. mindspore/ops_generate/op_proto.py +373 -108
  529. mindspore/ops_generate/op_template_parser.py +436 -0
  530. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  531. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  532. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  533. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  534. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  535. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  536. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  537. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  538. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  539. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  540. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  541. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  542. mindspore/ops_generate/pyboost_utils.py +92 -33
  543. mindspore/ops_generate/template.py +294 -44
  544. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  545. mindspore/parallel/__init__.py +3 -3
  546. mindspore/parallel/_auto_parallel_context.py +44 -34
  547. mindspore/parallel/_cell_wrapper.py +22 -3
  548. mindspore/parallel/_parallel_serialization.py +13 -2
  549. mindspore/parallel/_utils.py +4 -2
  550. mindspore/parallel/algo_parameter_config.py +1 -1
  551. mindspore/parallel/checkpoint_transform.py +44 -0
  552. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  553. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  554. mindspore/parallel/cluster/run.py +20 -3
  555. mindspore/parallel/parameter_broadcast.py +1 -1
  556. mindspore/parallel/shard.py +3 -0
  557. mindspore/parallel/transform_safetensors.py +119 -253
  558. mindspore/profiler/__init__.py +17 -4
  559. mindspore/profiler/analysis/__init__.py +0 -0
  560. mindspore/profiler/analysis/parser/__init__.py +0 -0
  561. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  562. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  563. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  564. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  565. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  566. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  567. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  568. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  569. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  570. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  571. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  572. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  573. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  574. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  575. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  576. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  577. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  578. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  579. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  580. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  581. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  582. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  583. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  584. mindspore/profiler/analysis/task_manager.py +131 -0
  585. mindspore/profiler/analysis/time_converter.py +84 -0
  586. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  587. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  588. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  589. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  590. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  591. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  592. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  593. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  594. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  595. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  596. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  597. mindspore/profiler/analysis/work_flow.py +73 -0
  598. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  599. mindspore/profiler/common/command_executor.py +90 -0
  600. mindspore/profiler/common/constant.py +174 -3
  601. mindspore/profiler/common/file_manager.py +208 -0
  602. mindspore/profiler/common/log.py +130 -0
  603. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  604. mindspore/profiler/common/path_manager.py +371 -0
  605. mindspore/profiler/common/process_bar.py +168 -0
  606. mindspore/profiler/common/process_pool.py +9 -3
  607. mindspore/profiler/common/profiler_context.py +476 -0
  608. mindspore/profiler/common/profiler_info.py +304 -0
  609. mindspore/profiler/common/profiler_output_path.py +284 -0
  610. mindspore/profiler/common/profiler_parameters.py +210 -0
  611. mindspore/profiler/common/profiler_path_manager.py +120 -0
  612. mindspore/profiler/common/record_function.py +76 -0
  613. mindspore/profiler/common/tlv_decoder.py +76 -0
  614. mindspore/profiler/common/util.py +75 -2
  615. mindspore/profiler/dynamic_profiler.py +270 -37
  616. mindspore/profiler/envprofiler.py +138 -0
  617. mindspore/profiler/mstx.py +199 -0
  618. mindspore/profiler/platform/__init__.py +21 -0
  619. mindspore/profiler/platform/base_profiler.py +40 -0
  620. mindspore/profiler/platform/cpu_profiler.py +124 -0
  621. mindspore/profiler/platform/gpu_profiler.py +74 -0
  622. mindspore/profiler/platform/npu_profiler.py +309 -0
  623. mindspore/profiler/profiler.py +580 -93
  624. mindspore/profiler/profiler_action_controller.py +187 -0
  625. mindspore/profiler/profiler_interface.py +114 -0
  626. mindspore/profiler/schedule.py +208 -0
  627. mindspore/rewrite/api/symbol_tree.py +1 -2
  628. mindspore/run_check/_check_version.py +18 -13
  629. mindspore/runtime/__init__.py +37 -0
  630. mindspore/runtime/device.py +27 -0
  631. mindspore/runtime/event.py +209 -0
  632. mindspore/runtime/executor.py +148 -0
  633. mindspore/runtime/memory.py +392 -0
  634. mindspore/runtime/stream.py +460 -0
  635. mindspore/runtime/thread_bind_core.py +401 -0
  636. mindspore/train/__init__.py +2 -2
  637. mindspore/train/_utils.py +53 -18
  638. mindspore/train/amp.py +8 -4
  639. mindspore/train/callback/_checkpoint.py +32 -18
  640. mindspore/train/callback/_early_stop.py +1 -1
  641. mindspore/train/callback/_flops_collector.py +105 -69
  642. mindspore/train/callback/_history.py +1 -1
  643. mindspore/train/callback/_summary_collector.py +44 -6
  644. mindspore/train/callback/_tft_register.py +37 -15
  645. mindspore/train/dataset_helper.py +11 -11
  646. mindspore/train/metrics/precision.py +4 -5
  647. mindspore/train/mind_ir_pb2.py +167 -46
  648. mindspore/train/model.py +13 -14
  649. mindspore/train/serialization.py +461 -72
  650. mindspore/train/summary/summary_record.py +1 -2
  651. mindspore/train/train_thor/model_thor.py +1 -1
  652. mindspore/utils/__init__.py +4 -2
  653. mindspore/utils/bin/dataset-cache +0 -0
  654. mindspore/utils/bin/dataset-cache-server +0 -0
  655. mindspore/utils/dryrun.py +138 -0
  656. mindspore/utils/runtime_execution_order_check.py +550 -0
  657. mindspore/version.py +1 -1
  658. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/METADATA +3 -4
  659. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/RECORD +672 -479
  660. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  661. mindspore/_data_dump.cpython-39-aarch64-linux-gnu.so +0 -0
  662. mindspore/bin/cache_admin +0 -0
  663. mindspore/bin/cache_server +0 -0
  664. mindspore/common/_tensor_overload.py +0 -139
  665. mindspore/lib/libmindspore_np_dtype.so +0 -0
  666. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_576ceaeef5870c451cab59af55ea46ad.json +0 -58
  667. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_86a73ff6e28d734c96bb8d3054f7dd18.json +0 -58
  668. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_f55e0ebaad1f2f572e43677336992fa0.json +0 -58
  669. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/config/ascend910b/all_finite.json +0 -109
  670. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/config/ascend910b/binary_info_config.json +0 -38
  671. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  672. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  673. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  674. mindspore/lib/plugin/ascend/custom_ascendc_ops/version.info +0 -1
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  685. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  686. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  687. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  688. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  689. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  690. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  691. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  692. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -92
  693. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  694. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  695. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  696. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  697. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  698. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  699. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  700. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  701. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  702. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  703. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  704. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  705. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  706. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  707. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  708. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  709. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  710. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  711. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  712. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  713. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  714. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  715. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  716. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  717. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  718. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  719. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  720. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  721. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  722. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  723. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  724. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  725. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  726. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  727. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  728. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  729. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  730. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  731. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  732. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  733. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  734. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  735. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  736. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  737. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  738. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  739. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  740. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  741. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  742. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  743. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  744. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  745. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  746. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  747. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  748. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  749. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  750. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  751. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  752. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  753. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  754. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  755. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  756. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  757. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  758. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  759. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  760. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  761. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  762. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  763. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  764. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  765. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  766. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  767. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  768. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  769. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  770. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  771. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  772. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  773. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  774. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  775. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  776. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  777. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  778. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  779. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  780. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  781. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  782. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  783. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  784. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  785. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  786. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  787. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  788. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  789. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  790. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  791. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  792. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  793. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  794. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  795. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  796. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  797. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  798. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  799. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  800. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  801. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  802. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  803. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  804. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  805. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  806. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  807. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  808. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  809. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  810. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  811. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  812. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  813. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  814. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  815. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  816. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  817. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  818. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  819. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  820. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  821. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  822. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  823. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  824. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  825. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  826. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  827. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  828. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  829. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  830. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  831. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  832. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  833. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  834. mindspore/profiler/envprofiling.py +0 -254
  835. mindspore/profiler/profiling.py +0 -1926
  836. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910}/op_api/include/aclnn_decoder_kv_cache.h +0 -0
  837. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910}/op_api/include/aclnn_prompt_kv_cache.h +0 -0
  838. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/decoder_kv_cache.cpp +0 -0
  839. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/prompt_kv_cache.cpp +0 -0
  840. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_api/include/aclnn_all_finite.h +0 -0
  841. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_impl/ai_core/tbe/config/ascend310p/aic-ascend310p-ops-info.json +0 -0
  842. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json → custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json} +0 -0
  843. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_impl/ai_core/tbe/config/ascend910b/aic-ascend910b-ops-info.json +0 -0
  844. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl}/dynamic/all_finite.cpp +0 -0
  845. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_proto/inc/op_proto.h +0 -0
  846. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  847. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -13,17 +13,32 @@
13
13
  # limitations under the License.
14
14
  # ============================================================================
15
15
  """boost base class"""
16
+ from enum import Enum
16
17
  import numpy as np
17
18
  import mindspore as ms
18
19
  from mindspore import ops, Tensor
20
+ from mindspore import log as logger
19
21
  from mindspore.ops import operations as P
20
22
  import mindspore.common.dtype as mstype
21
23
  from mindspore._c_expression import _set_format
22
-
23
24
  from mindspore.common.parameter import Parameter
24
25
  from mindspore.experimental.llm_boost.utils import get_real_rank, get_real_group_size
25
26
  from mindspore.common.initializer import Zero
26
27
 
28
+ FORMAT_NZ = "FRACTAL_NZ"
29
+ BUILDIN_BACKEND_NAME = "ATB"
30
+
31
+
32
+ class PositionEmbeddingType(int, Enum):
33
+ ROPE = 0
34
+ ALIBI = 1
35
+ ABSOLUTE = 2
36
+
37
+
38
+ class NormType(int, Enum):
39
+ RMS_NORM = 0
40
+ LAYER_NORM = 1
41
+
27
42
 
28
43
  class AttentionMask:
29
44
  """attention mask"""
@@ -31,30 +46,34 @@ class AttentionMask:
31
46
  @classmethod
32
47
  def static(cls, max_seq_len, dtype=mstype.float16, need_nz=False):
33
48
  """cache mask"""
34
- bias_cache = Tensor(np.tril(np.ones((max_seq_len, max_seq_len), dtype=np.bool_))).reshape(max_seq_len,
35
- max_seq_len)
49
+ bias_cache = Tensor(
50
+ np.tril(np.ones((max_seq_len, max_seq_len), dtype=np.bool_))
51
+ ).reshape(max_seq_len, max_seq_len)
36
52
  bias_cache = ~bias_cache
37
53
  if dtype == mstype.float16:
38
54
  mask_value = Tensor(np.finfo(np.float32).min, mstype.float16)
39
55
  else:
40
56
  mask_value = Tensor(1)
41
- attn_mask = ops.masked_fill(Tensor(np.zeros(
42
- (max_seq_len, max_seq_len)), dtype=mstype.float16), bias_cache, mask_value)
57
+ attn_mask = ops.masked_fill(
58
+ Tensor(np.zeros((max_seq_len, max_seq_len)), dtype=mstype.float16),
59
+ bias_cache,
60
+ mask_value,
61
+ )
43
62
  if need_nz:
44
63
  # ND -> NZ
45
64
  attn_mask = ops.reshape(attn_mask, (1, max_seq_len, max_seq_len))
46
- attn_mask = ops.reshape(
47
- attn_mask, (1, max_seq_len, max_seq_len // 16, 16))
65
+ attn_mask = ops.reshape(attn_mask, (1, max_seq_len, max_seq_len // 16, 16))
48
66
  attn_mask = ops.transpose(attn_mask, (0, 2, 1, 3)).contiguous()
49
- attn_mask = _set_format(attn_mask, "FRACTAL_NZ")
67
+ attn_mask = _set_format(attn_mask, FORMAT_NZ)
50
68
  return attn_mask
51
69
 
52
70
 
53
- class AtbBoostBase():
71
+ class AtbBoostBase:
54
72
  """atb boost base class"""
55
73
 
56
74
  def __init__(self, config):
57
75
  super().__init__()
76
+ self.backend_name = BUILDIN_BACKEND_NAME
58
77
  self.is_first_iteration = False
59
78
  self.config = config
60
79
  self.dtype = config.compute_dtype
@@ -68,27 +87,97 @@ class AtbBoostBase():
68
87
  self.need_nz = config.need_nz
69
88
  self.placeholder = Tensor(np.zeros(1), dtype=self.dtype)
70
89
  self.lm_head_indices_fake = Tensor([0], dtype=mstype.int64)
71
- self.position_embedding_type = "ROPE"
90
+ self.position_embedding_type = PositionEmbeddingType.ROPE
72
91
  self.add_norm_enable = True
73
92
  self.max_decode_length = self.config.max_decode_length
74
93
  self.max_base_len = 128
75
94
  self.attn_mask = AttentionMask.static(
76
- self.max_base_len, dtype=self.dtype, need_nz=self.need_nz)
95
+ self.max_base_len, dtype=self.dtype, need_nz=self.need_nz
96
+ )
77
97
 
78
98
  self.cast = P.Cast()
79
99
  self.reshape = P.Reshape()
80
100
  self.kv_quant = None
81
101
  self.rank_id = get_real_rank()
82
102
  self.device_num = get_real_group_size()
103
+ self.ascend_weight = []
104
+ self.k_caches = []
105
+ self.v_caches = []
83
106
 
84
107
  def _convert_tensor_format_and_dtype(self, tensor, dtype=mstype.float16):
85
108
  tensor = self.cast(tensor, dtype=dtype)
86
109
  if self.need_nz:
87
- tensor = _set_format(tensor, "FRACTAL_NZ")
110
+ tensor = _set_format(tensor, FORMAT_NZ)
88
111
  return tensor
89
112
 
113
+ def _convert_qkv_concat_weight(self, param_dict):
114
+ """convert qkv concat weight"""
115
+ for i in range(self.num_layers):
116
+ # qkv weight concat
117
+ wq_weight_name = f"model.layers.{i}.attention.wq.weight"
118
+ wk_weight_name = f"model.layers.{i}.attention.wk.weight"
119
+ wv_weight_name = f"model.layers.{i}.attention.wv.weight"
120
+ qkv_concat_weight_name = f"model.layers.{i}.attention.w_qkv.weight"
121
+ if wq_weight_name not in param_dict:
122
+ break
123
+ wq_weight = param_dict[wq_weight_name].asnumpy()
124
+ wk_weight = param_dict[wk_weight_name].asnumpy()
125
+ wv_weight = param_dict[wv_weight_name].asnumpy()
126
+ qkv_weight = np.concatenate((wq_weight, wk_weight, wv_weight), 0)
127
+ param_dict[qkv_concat_weight_name] = Parameter(
128
+ qkv_weight, name=qkv_concat_weight_name
129
+ )
130
+
131
+ # gate hidden weight concat
132
+ ffn_gate_weight_name = f"model.layers.{i}.feed_forward.w1.weight"
133
+ ffn_hidden_weight_name = f"model.layers.{i}.feed_forward.w3.weight"
134
+ gate_hidden_concat_weight_name = (
135
+ f"model.layers.{i}.feed_forward.w_gate_hidden.weight"
136
+ )
137
+
138
+ ffn_gate_weight = param_dict[ffn_gate_weight_name].asnumpy()
139
+ ffn_hidden_weight = param_dict[ffn_hidden_weight_name].asnumpy()
140
+ gate_hidden_weight = np.concatenate((ffn_gate_weight, ffn_hidden_weight), 0)
141
+ param_dict[gate_hidden_concat_weight_name] = Parameter(
142
+ gate_hidden_weight, name=gate_hidden_concat_weight_name
143
+ )
144
+
145
+ param_dict.pop(wq_weight_name)
146
+ param_dict.pop(wk_weight_name)
147
+ param_dict.pop(wv_weight_name)
148
+ param_dict.pop(ffn_gate_weight_name)
149
+ param_dict.pop(ffn_hidden_weight_name)
150
+ logger.info(f"transform: {qkv_concat_weight_name}")
151
+ logger.info(f"transform: {gate_hidden_concat_weight_name}")
152
+
153
+ for i in range(self.num_layers):
154
+ # qkv bias concat
155
+ wq_bias_name = f"model.layers.{i}.attention.wq.bias"
156
+ wk_bias_name = f"model.layers.{i}.attention.wk.bias"
157
+ wv_bias_name = f"model.layers.{i}.attention.wv.bias"
158
+ qkv_concat_bias_name = f"model.layers.{i}.attention.w_qkv.bias"
159
+ if wq_bias_name not in param_dict:
160
+ break
161
+
162
+ wq_bias_weight = param_dict[wq_bias_name].asnumpy()
163
+ wk_bias_weight = param_dict[wk_bias_name].asnumpy()
164
+ wv_bias_weight = param_dict[wv_bias_name].asnumpy()
165
+ qkv_bias_weight = np.concatenate(
166
+ (wq_bias_weight, wk_bias_weight, wv_bias_weight), 0
167
+ )
168
+ param_dict[qkv_concat_bias_name] = Parameter(
169
+ qkv_bias_weight, name=qkv_concat_bias_name
170
+ )
171
+
172
+ param_dict.pop(wq_bias_name)
173
+ param_dict.pop(wk_bias_name)
174
+ param_dict.pop(wv_bias_name)
175
+ logger.info(f"transform: {qkv_concat_bias_name}")
176
+ return param_dict
177
+
90
178
  def set_weights(self, parm_dict, dtype=mstype.float16):
91
179
  """set weights for llm boost"""
180
+ self._convert_qkv_concat_weight(parm_dict)
92
181
  embedding_weight_name = "model.tok_embeddings.embedding_weight"
93
182
  attention_norm_name = "attention_norm"
94
183
  qkv_name = "attention.w_qkv"
@@ -101,45 +190,88 @@ class AtbBoostBase():
101
190
  placeholder = Parameter(Tensor(np.zeros(1), dtype=dtype))
102
191
 
103
192
  ascend_weight = []
104
- ascend_weight.append(
105
- self.cast(parm_dict[embedding_weight_name], dtype))
193
+ ascend_weight.append(self.cast(parm_dict[embedding_weight_name], dtype))
106
194
  for i in range(self.num_layers):
107
- ascend_weight.append(self._convert_tensor_format_and_dtype(
108
- parm_dict[f"model.layers.{i}.{attention_norm_name}.weight"], dtype))
195
+ ascend_weight.append(
196
+ self._convert_tensor_format_and_dtype(
197
+ parm_dict[f"model.layers.{i}.{attention_norm_name}.weight"], dtype
198
+ )
199
+ )
109
200
  ascend_weight.extend([placeholder] * 3)
110
201
 
111
202
  ascend_weight.append(
112
- self._convert_tensor_format_and_dtype(parm_dict[f"model.layers.{i}.{qkv_name}.weight"], dtype))
113
- ascend_weight.append(self._convert_tensor_format_and_dtype(parm_dict.get(
114
- f"model.layers.{i}.{qkv_name}.bias", placeholder), dtype))
203
+ self._convert_tensor_format_and_dtype(
204
+ parm_dict[f"model.layers.{i}.{qkv_name}.weight"], dtype
205
+ )
206
+ )
207
+ ascend_weight.append(
208
+ self._convert_tensor_format_and_dtype(
209
+ parm_dict.get(f"model.layers.{i}.{qkv_name}.bias", placeholder),
210
+ dtype,
211
+ )
212
+ )
115
213
  ascend_weight.extend([placeholder] * 16)
116
214
 
117
215
  ascend_weight.append(
118
- self._convert_tensor_format_and_dtype(parm_dict[f"model.layers.{i}.{o_name}.weight"], dtype))
119
- ascend_weight.append(self._convert_tensor_format_and_dtype(parm_dict.get(
120
- f"model.layers.{i}.{o_name}.bias", placeholder), dtype))
216
+ self._convert_tensor_format_and_dtype(
217
+ parm_dict[f"model.layers.{i}.{o_name}.weight"], dtype
218
+ )
219
+ )
220
+ ascend_weight.append(
221
+ self._convert_tensor_format_and_dtype(
222
+ parm_dict.get(f"model.layers.{i}.{o_name}.bias", placeholder), dtype
223
+ )
224
+ )
121
225
  ascend_weight.extend([placeholder] * 4)
122
226
 
123
227
  ascend_weight.append(
124
- self._convert_tensor_format_and_dtype(parm_dict[f"model.layers.{i}.{mlp_norm_name}.weight"], dtype))
228
+ self._convert_tensor_format_and_dtype(
229
+ parm_dict[f"model.layers.{i}.{mlp_norm_name}.weight"], dtype
230
+ )
231
+ )
125
232
  ascend_weight.extend([placeholder] * 3)
126
233
 
127
234
  ascend_weight.append(
128
- self._convert_tensor_format_and_dtype(parm_dict[f"model.layers.{i}.{mlp_gate_name}.weight"], dtype))
129
- ascend_weight.append(self._convert_tensor_format_and_dtype(parm_dict.get(
130
- f"model.layers.{i}.{mlp_gate_name}.bias", placeholder), dtype))
235
+ self._convert_tensor_format_and_dtype(
236
+ parm_dict[f"model.layers.{i}.{mlp_gate_name}.weight"], dtype
237
+ )
238
+ )
239
+ ascend_weight.append(
240
+ self._convert_tensor_format_and_dtype(
241
+ parm_dict.get(
242
+ f"model.layers.{i}.{mlp_gate_name}.bias", placeholder
243
+ ),
244
+ dtype,
245
+ )
246
+ )
131
247
  ascend_weight.extend([placeholder] * 10)
132
248
 
133
249
  ascend_weight.append(
134
- self._convert_tensor_format_and_dtype(parm_dict[f"model.layers.{i}.{mlp_down_name}.weight"], dtype))
135
- ascend_weight.append(self._convert_tensor_format_and_dtype(parm_dict.get(
136
- f"model.layers.{i}.{mlp_down_name}.bias", placeholder), dtype))
250
+ self._convert_tensor_format_and_dtype(
251
+ parm_dict[f"model.layers.{i}.{mlp_down_name}.weight"], dtype
252
+ )
253
+ )
254
+ ascend_weight.append(
255
+ self._convert_tensor_format_and_dtype(
256
+ parm_dict.get(
257
+ f"model.layers.{i}.{mlp_down_name}.bias", placeholder
258
+ ),
259
+ dtype,
260
+ )
261
+ )
137
262
  ascend_weight.extend([placeholder] * 4)
138
263
 
139
264
  ascend_weight.append(
140
- self._convert_tensor_format_and_dtype(parm_dict[f"{norm_out_name}.weight"], dtype))
265
+ self._convert_tensor_format_and_dtype(
266
+ parm_dict[f"{norm_out_name}.weight"], dtype
267
+ )
268
+ )
141
269
  ascend_weight.append(
142
- self._convert_tensor_format_and_dtype(parm_dict[f"{lm_head_name}.weight"], dtype))
270
+ self._convert_tensor_format_and_dtype(
271
+ parm_dict[f"{lm_head_name}.weight"], dtype
272
+ )
273
+ )
274
+ self.ascend_weight = ascend_weight
143
275
  self.atb_encoder_operation.set_weights(ascend_weight)
144
276
  self.atb_decoder_operation.set_weights(ascend_weight)
145
277
 
@@ -147,20 +279,47 @@ class AtbBoostBase():
147
279
  """set kv_cache for llm boost"""
148
280
  if not k_caches or v_caches:
149
281
  if self.need_nz:
150
- kv_shape = (self.config.num_blocks, self.num_kv_heads*self.head_dim //
151
- self.device_num // 16, self.config.block_size, 16)
152
- k_caches = [_set_format(Parameter(Tensor(
153
- shape=kv_shape, dtype=self.dtype, init=Zero())), "FRACTAL_NZ") for _ in range(self.num_layers)]
154
- v_caches = [_set_format(Parameter(Tensor(
155
- shape=kv_shape, dtype=self.dtype, init=Zero())), "FRACTAL_NZ") for _ in range(self.num_layers)]
282
+ kv_shape = (
283
+ self.config.num_blocks,
284
+ self.num_kv_heads * self.head_dim // self.device_num // 16,
285
+ self.config.block_size,
286
+ 16,
287
+ )
288
+ k_caches = [
289
+ _set_format(
290
+ Parameter(
291
+ Tensor(shape=kv_shape, dtype=self.dtype, init=Zero())
292
+ ),
293
+ FORMAT_NZ,
294
+ )
295
+ for _ in range(self.num_layers)
296
+ ]
297
+ v_caches = [
298
+ _set_format(
299
+ Parameter(
300
+ Tensor(shape=kv_shape, dtype=self.dtype, init=Zero())
301
+ ),
302
+ FORMAT_NZ,
303
+ )
304
+ for _ in range(self.num_layers)
305
+ ]
156
306
  else:
157
- kv_shape = (self.config.num_blocks, self.config.block_size,
158
- self.num_kv_heads // self.device_num, self.head_dim)
159
- k_caches = [Parameter(Tensor(
160
- shape=kv_shape, dtype=self.dtype, init=Zero())) for _ in range(self.num_layers)]
161
- v_caches = [Parameter(Tensor(
162
- shape=kv_shape, dtype=self.dtype, init=Zero())) for _ in range(self.num_layers)]
163
-
307
+ kv_shape = (
308
+ self.config.num_blocks,
309
+ self.config.block_size,
310
+ self.num_kv_heads // self.device_num,
311
+ self.head_dim,
312
+ )
313
+ k_caches = [
314
+ Parameter(Tensor(shape=kv_shape, dtype=self.dtype, init=Zero()))
315
+ for _ in range(self.num_layers)
316
+ ]
317
+ v_caches = [
318
+ Parameter(Tensor(shape=kv_shape, dtype=self.dtype, init=Zero()))
319
+ for _ in range(self.num_layers)
320
+ ]
321
+ self.k_caches = k_caches
322
+ self.v_caches = v_caches
164
323
  self.atb_encoder_operation.set_kvcache(k_caches, v_caches)
165
324
  self.atb_decoder_operation.set_kvcache(k_caches, v_caches)
166
325
 
@@ -171,11 +330,9 @@ class AtbBoostBase():
171
330
  def _execute_operator(self, acl_inputs, acl_param):
172
331
  """execute operator."""
173
332
  if self.is_first_iteration:
174
- acl_model_out = self.atb_encoder_operation.forward(
175
- acl_inputs, acl_param)
333
+ acl_model_out = self.atb_encoder_operation.forward(acl_inputs, acl_param)
176
334
  else:
177
- acl_model_out = self.atb_decoder_operation.forward(
178
- acl_inputs, acl_param)
335
+ acl_model_out = self.atb_decoder_operation.forward(acl_inputs, acl_param)
179
336
  acl_hidden_state = acl_model_out[0]
180
337
  return acl_hidden_state
181
338
 
@@ -183,28 +340,46 @@ class AtbBoostBase():
183
340
  r"""
184
341
  LlmBoost forward.
185
342
  """
186
- input_ids = boost_inputs["input_ids"]
187
- position_ids = boost_inputs["position_ids"]
188
- cos_embed = boost_inputs["cos_embed"]
189
- sin_embed = boost_inputs["sin_embed"]
190
- block_tables = boost_inputs["block_tables"]
191
- slot_mapping = boost_inputs["slot_mapping"]
192
- batch_valid_length = boost_inputs["batch_valid_length"]
193
- lm_head_indices = boost_inputs["lm_head_indices"]
194
- seqLen = boost_inputs["seq_lens"]
343
+ input_ids = boost_inputs.get("input_ids", None)
344
+ position_ids = boost_inputs.get("position_ids", None)
345
+ cos_embed = boost_inputs.get("cos_embed", None)
346
+ sin_embed = boost_inputs.get("sin_embed", None)
347
+ block_tables = boost_inputs.get("block_tables", None)
348
+ slot_mapping = boost_inputs.get("slot_mapping", None)
349
+ batch_valid_length = boost_inputs.get("batch_valid_length", None)
350
+ lm_head_indices = boost_inputs.get("lm_head_indices", None)
351
+ seqLen = boost_inputs.get("seq_lens", None)
352
+ input_ids = self.reshape(input_ids, (-1,))
195
353
  if self.is_first_iteration:
196
354
  attention_mask = self.attn_mask
197
355
  else:
198
- position_ids = batch_valid_length - 1
356
+ if position_ids is None:
357
+ position_ids = batch_valid_length - 1
199
358
  attention_mask = self.placeholder
200
359
  lm_head_indices = self.lm_head_indices_fake
201
360
 
202
- acl_inputs, acl_param = self._prepare_inputs(prefill=self.is_first_iteration, input_ids=input_ids,
203
- position_ids=position_ids, cos_embed=cos_embed,
204
- sin_embed=sin_embed, attention_mask=attention_mask,
205
- block_tables=block_tables, slots=slot_mapping,
206
- input_lengths=batch_valid_length, lm_head_indices=lm_head_indices,
207
- seqLen=seqLen)
361
+ if input_ids is not None and input_ids.dtype != mstype.int64:
362
+ input_ids = self.cast(input_ids, mstype.int64)
363
+ if position_ids is not None and position_ids.dtype != mstype.int64:
364
+ position_ids = self.cast(position_ids, mstype.int64)
365
+ if batch_valid_length is not None and batch_valid_length.dtype != mstype.int32:
366
+ batch_valid_length = self.cast(batch_valid_length, mstype.int32)
367
+ if lm_head_indices is not None and lm_head_indices.dtype != mstype.int64:
368
+ lm_head_indices = self.cast(lm_head_indices, mstype.int64)
369
+
370
+ acl_inputs, acl_param = self._prepare_inputs(
371
+ prefill=self.is_first_iteration,
372
+ input_ids=input_ids,
373
+ position_ids=position_ids,
374
+ cos_embed=cos_embed,
375
+ sin_embed=sin_embed,
376
+ attention_mask=attention_mask,
377
+ block_tables=block_tables,
378
+ slots=slot_mapping,
379
+ input_lengths=batch_valid_length,
380
+ lm_head_indices=lm_head_indices,
381
+ seqLen=seqLen,
382
+ )
208
383
  ms.hal.synchronize()
209
384
  logits = self._execute_operator(acl_inputs, acl_param)
210
385
  logits = self.cast(logits, mstype.float32)
@@ -15,10 +15,16 @@
15
15
  """llm boost"""
16
16
  import json
17
17
  import mindspore.common.dtype as mstype
18
- from mindspore.experimental.llm_boost.atb.boost_base import AtbBoostBase
18
+ from mindspore.experimental.llm_boost.atb.boost_base import (
19
+ AtbBoostBase,
20
+ PositionEmbeddingType,
21
+ NormType,
22
+ )
19
23
  from mindspore._c_expression import LlmBoostBinder
20
24
  from mindspore.experimental.llm_boost.register import LlmBoostRegister, LlmBoostType
21
25
 
26
+ CPP_LLAMA_MODEL_CLASS_NAME = "llama_LlamaDecoderModel"
27
+
22
28
 
23
29
  @LlmBoostRegister.register(LlmBoostType.BUILDIN, "Llama")
24
30
  class LlamaBoost(AtbBoostBase):
@@ -30,14 +36,21 @@ class LlamaBoost(AtbBoostBase):
30
36
  self.acl_encoder_operation_inputs = [None] * self.in_tensor_length
31
37
  self.acl_decoder_operation_inputs = [None] * self.in_tensor_length
32
38
  self.atb_encoder_operation = LlmBoostBinder(
33
- "ATB", "llama_parallel_DecoderModel")
39
+ self.backend_name, CPP_LLAMA_MODEL_CLASS_NAME
40
+ )
34
41
  self.atb_decoder_operation = LlmBoostBinder(
35
- "ATB", "llama_parallel_DecoderModel")
42
+ self.backend_name, CPP_LLAMA_MODEL_CLASS_NAME
43
+ )
36
44
 
37
45
  def init(self):
38
- """set param"""
46
+ """
47
+ Initialize the object
48
+ returns True if object needs input manipulation by mindformers
49
+ """
50
+
39
51
  coder_param = {
40
- "rmsNormEps": self.config.rms_norm_eps,
52
+ "normEps": self.config.rms_norm_eps,
53
+ "normType": NormType.RMS_NORM,
41
54
  "numAttentionHeadsPerRank": self.config.num_heads // self.device_num,
42
55
  "hiddenSizePerAttentionHead": self.head_dim,
43
56
  "numHiddenLayers": self.num_layers,
@@ -46,35 +59,45 @@ class LlamaBoost(AtbBoostBase):
46
59
  "isFA": False,
47
60
  "isBF16": self.dtype == mstype.bfloat16,
48
61
  "packQuantType": [[1, 1] for _ in range(self.num_layers)],
49
- "linearQuantType": [[0, -1, -1, 0, 0, -1, 0] for _ in range(self.num_layers)],
50
- "linearTransposeType": [[1, -1, -1, 1, 1, -1, 1] for i in range(self.num_layers)],
62
+ "linearQuantType": [
63
+ [0, -1, -1, 0, 0, -1, 0] for _ in range(self.num_layers)
64
+ ],
65
+ "linearTransposeType": [
66
+ [1, -1, -1, 1, 1, -1, 1] for i in range(self.num_layers)
67
+ ],
51
68
  "isEmbeddingParallel": False,
52
69
  "isLmHeadParallel": not self.config.parallel_config.vocab_emb_dp,
53
70
  "lmHeadTransposeType": 1,
54
- "supportSwiGLU": True,
55
- "kvQuant": self.kv_quant is not None,
71
+ "enableSwiGLU": True,
72
+ "enablekvQuant": self.kv_quant is not None,
56
73
  "rank": self.rank_id,
57
74
  "worldSize": self.device_num,
58
- "backend": "lccl",
75
+ "backend": self.config.communication_backend,
59
76
  "rankTableFile": "",
60
- "positionEmbeddingType": self.position_embedding_type,
77
+ "positionEmbeddingType": PositionEmbeddingType.ROPE,
61
78
  "hiddenSize": self.config.hidden_size,
62
79
  "gemma": False,
63
- "enableAddNorm": True,
64
- "supportCompressHead": False,
80
+ "enableAddNorm": False,
81
+ "enableCompressHead": False,
82
+ "isUnpadInputs": True,
65
83
  }
66
84
  encoder_param = {
67
- **coder_param, "isPrefill": True,
68
- "supportLcoc": True,
69
- "supportSpeculate": False,
70
- "skipWordEmbedding": False
85
+ **coder_param,
86
+ "isPrefill": True,
87
+ "enableLcoc": True,
88
+ "enableSpeculate": False,
89
+ "skipWordEmbedding": False,
90
+ "enableSplitFuse": False,
71
91
  }
72
92
  decoder_param = {
73
- **coder_param, "isPrefill": False, "supportLcoc": False,
74
- "supportSpeculate": False
93
+ **coder_param,
94
+ "isPrefill": False,
95
+ "enableLcoc": False,
96
+ "enableSpeculate": False,
75
97
  }
76
98
  self.atb_encoder_operation.init(json.dumps({**encoder_param}))
77
99
  self.atb_decoder_operation.init(json.dumps({**decoder_param}))
100
+ return True
78
101
 
79
102
  def _prepare_inputs(
80
103
  self,
@@ -92,14 +115,15 @@ class LlamaBoost(AtbBoostBase):
92
115
  **kwargs
93
116
  ):
94
117
  """prepare inputs"""
95
- self.acl_param = json.dumps({
96
- "seqLen": seqLen,
97
- })
98
- self.acl_decoder_operation_inputs[0] = self.cast(
99
- input_ids, mstype.int64)
118
+ self.acl_param = json.dumps(
119
+ {
120
+ "seqLen": seqLen,
121
+ }
122
+ )
123
+
124
+ self.acl_decoder_operation_inputs[0] = input_ids
100
125
  self.acl_decoder_operation_inputs[1] = self.placeholder
101
- self.acl_decoder_operation_inputs[2] = self.cast(
102
- position_ids, mstype.int32)
126
+ self.acl_decoder_operation_inputs[2] = position_ids
103
127
  self.acl_decoder_operation_inputs[3] = cos_embed
104
128
  self.acl_decoder_operation_inputs[4] = sin_embed
105
129
  self.acl_decoder_operation_inputs[5] = attention_mask
@@ -108,8 +132,6 @@ class LlamaBoost(AtbBoostBase):
108
132
  self.acl_decoder_operation_inputs[8] = self.placeholder
109
133
  self.acl_decoder_operation_inputs[9] = self.placeholder
110
134
  self.acl_decoder_operation_inputs[10] = self.placeholder
111
- self.acl_decoder_operation_inputs[11] = self.cast(
112
- input_lengths, mstype.int32)
113
- self.acl_decoder_operation_inputs[12] = self.cast(
114
- lm_head_indices, mstype.int64)
135
+ self.acl_decoder_operation_inputs[11] = input_lengths
136
+ self.acl_decoder_operation_inputs[12] = lm_head_indices
115
137
  return self.acl_decoder_operation_inputs, self.acl_param