mindspore 2.4.1__cp39-none-any.whl → 2.5.0__cp39-none-any.whl

This diff shows the contents of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (847)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Third_Party_Open_Source_Software_Notice +39 -0
  3. mindspore/__init__.py +8 -3
  4. mindspore/_akg/akg/composite/build_module.py +6 -2
  5. mindspore/_akg/akg/utils/kernel_exec.py +2 -2
  6. mindspore/_c_dataengine.cpython-39-aarch64-linux-gnu.so +0 -0
  7. mindspore/_c_expression.cpython-39-aarch64-linux-gnu.so +0 -0
  8. mindspore/_c_mindrecord.cpython-39-aarch64-linux-gnu.so +0 -0
  9. mindspore/_checkparam.py +0 -5
  10. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  11. mindspore/_extends/parse/compile_config.py +64 -0
  12. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  14. mindspore/_extends/parse/parser.py +23 -5
  15. mindspore/_extends/parse/standard_method.py +123 -27
  16. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  17. mindspore/amp.py +7 -1
  18. mindspore/boost/boost_cell_wrapper.py +136 -41
  19. mindspore/common/__init__.py +3 -1
  20. mindspore/common/_register_for_tensor.py +0 -1
  21. mindspore/common/_stub_tensor.py +25 -4
  22. mindspore/common/_tensor_cpp_method.py +17 -0
  23. mindspore/common/_tensor_docs.py +6132 -0
  24. mindspore/common/api.py +99 -25
  25. mindspore/common/dtype.py +34 -34
  26. mindspore/common/dump.py +2 -1
  27. mindspore/common/file_system.py +8 -1
  28. mindspore/common/generator.py +2 -0
  29. mindspore/common/hook_handle.py +3 -1
  30. mindspore/common/initializer.py +3 -4
  31. mindspore/common/lazy_inline.py +8 -2
  32. mindspore/common/mindir_util.py +10 -2
  33. mindspore/common/parameter.py +30 -27
  34. mindspore/common/tensor.py +713 -1337
  35. mindspore/communication/__init__.py +1 -1
  36. mindspore/communication/_comm_helper.py +10 -0
  37. mindspore/communication/comm_func.py +215 -173
  38. mindspore/communication/management.py +23 -20
  39. mindspore/context.py +292 -193
  40. mindspore/dataset/__init__.py +23 -19
  41. mindspore/dataset/callback/ds_callback.py +2 -1
  42. mindspore/dataset/core/config.py +84 -3
  43. mindspore/dataset/engine/cache_admin.py +3 -3
  44. mindspore/dataset/engine/cache_client.py +5 -4
  45. mindspore/dataset/engine/datasets.py +192 -149
  46. mindspore/dataset/engine/datasets_audio.py +14 -0
  47. mindspore/dataset/engine/datasets_standard_format.py +28 -11
  48. mindspore/dataset/engine/datasets_text.py +38 -1
  49. mindspore/dataset/engine/datasets_user_defined.py +125 -65
  50. mindspore/dataset/engine/datasets_vision.py +81 -8
  51. mindspore/dataset/engine/iterators.py +281 -63
  52. mindspore/dataset/engine/obs/util.py +8 -0
  53. mindspore/dataset/engine/queue.py +40 -0
  54. mindspore/dataset/engine/samplers.py +26 -2
  55. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  56. mindspore/dataset/engine/validators.py +43 -11
  57. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  58. mindspore/dataset/transforms/transforms.py +29 -12
  59. mindspore/dataset/vision/validators.py +1 -2
  60. mindspore/device_context/__init__.py +21 -0
  61. mindspore/device_context/ascend/__init__.py +25 -0
  62. mindspore/device_context/ascend/device.py +72 -0
  63. mindspore/device_context/ascend/op_debug.py +94 -0
  64. mindspore/device_context/ascend/op_precision.py +193 -0
  65. mindspore/device_context/ascend/op_tuning.py +127 -0
  66. mindspore/device_context/cpu/__init__.py +25 -0
  67. mindspore/device_context/cpu/device.py +62 -0
  68. mindspore/device_context/cpu/op_tuning.py +43 -0
  69. mindspore/device_context/gpu/__init__.py +21 -0
  70. mindspore/device_context/gpu/device.py +70 -0
  71. mindspore/device_context/gpu/op_precision.py +67 -0
  72. mindspore/device_context/gpu/op_tuning.py +175 -0
  73. mindspore/device_manager.py +134 -0
  74. mindspore/experimental/llm_boost/__init__.py +3 -2
  75. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  76. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  77. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  78. mindspore/experimental/llm_boost/atb/boost_base.py +239 -64
  79. mindspore/experimental/llm_boost/atb/llama_boost.py +52 -30
  80. mindspore/experimental/llm_boost/atb/qwen_boost.py +47 -24
  81. mindspore/experimental/llm_boost/register.py +1 -0
  82. mindspore/experimental/optim/adadelta.py +26 -22
  83. mindspore/experimental/optim/adam.py +3 -0
  84. mindspore/experimental/optim/lr_scheduler.py +33 -24
  85. mindspore/experimental/optim/radam.py +33 -30
  86. mindspore/hal/device.py +28 -0
  87. mindspore/hal/event.py +17 -0
  88. mindspore/hal/memory.py +94 -3
  89. mindspore/hal/stream.py +91 -6
  90. mindspore/include/api/context.h +1 -2
  91. mindspore/include/dataset/constants.h +2 -2
  92. mindspore/lib/libavcodec.so.59 +0 -0
  93. mindspore/lib/libavdevice.so.59 +0 -0
  94. mindspore/lib/libavfilter.so.8 +0 -0
  95. mindspore/lib/libavformat.so.59 +0 -0
  96. mindspore/lib/libavutil.so.57 +0 -0
  97. mindspore/lib/libdnnl.so.2 +0 -0
  98. mindspore/lib/libmindspore_backend.so +0 -0
  99. mindspore/lib/libmindspore_common.so +0 -0
  100. mindspore/lib/libmindspore_core.so +0 -0
  101. mindspore/lib/libmindspore_gpr.so.15 +0 -0
  102. mindspore/lib/libmindspore_grpc++.so.1 +0 -0
  103. mindspore/lib/libmindspore_grpc.so.15 +0 -0
  104. mindspore/lib/libmindspore_ops.so +0 -0
  105. mindspore/lib/libmpi_adapter.so +0 -0
  106. mindspore/lib/libmpi_collective.so +0 -0
  107. mindspore/lib/libnnacl.so +0 -0
  108. mindspore/lib/libopencv_core.so.4.5 +0 -0
  109. mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
  110. mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
  111. mindspore/lib/libps_cache.so +0 -0
  112. mindspore/lib/libswresample.so.4 +0 -0
  113. mindspore/lib/libswscale.so.6 +0 -0
  114. mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json +2048 -0
  115. mindspore/lib/plugin/ascend/custom_aicore_ops/op_proto/libop_proto.so +0 -0
  116. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
  117. mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
  118. mindspore/lib/plugin/ascend/custom_ascendc_910/framework/npu_supported_ops.json +10 -0
  119. mindspore/lib/plugin/ascend/custom_ascendc_910/op_api/lib/libcust_opapi.so +0 -0
  120. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json +182 -0
  121. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/decoder_kv_cache.py +51 -16
  122. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/prompt_kv_cache.py +51 -16
  123. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +158 -0
  124. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  125. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +158 -0
  126. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  127. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +158 -0
  128. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  129. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +158 -0
  130. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  131. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +158 -0
  132. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  133. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +158 -0
  134. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  135. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +158 -0
  136. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  137. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +158 -0
  138. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  139. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +167 -0
  140. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  141. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +167 -0
  142. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  143. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +167 -0
  144. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  145. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +167 -0
  146. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  147. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +167 -0
  148. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  149. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +167 -0
  150. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  151. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +167 -0
  152. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  153. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +167 -0
  154. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/ascend910/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  155. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/config/ascend910/binary_info_config.json +302 -0
  156. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/config/ascend910/decoder_kv_cache.json +892 -0
  157. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/kernel/config/ascend910/prompt_kv_cache.json +892 -0
  158. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  159. mindspore/lib/plugin/ascend/custom_ascendc_910/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  160. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/inc/op_proto.h +33 -0
  161. mindspore/lib/plugin/ascend/custom_ascendc_910/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  162. mindspore/lib/plugin/ascend/custom_ascendc_910/version.info +1 -0
  163. mindspore/lib/plugin/ascend/custom_ascendc_910b/framework/npu_supported_ops.json +14 -0
  164. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/include/aclnn_decoder_kv_cache.h +59 -0
  165. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_api/include/aclnn_prompt_kv_cache.h +59 -0
  166. mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_api/lib/libcust_opapi.so +0 -0
  167. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl}/dynamic/all_finite.py +51 -16
  168. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.cpp +192 -0
  169. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/decoder_kv_cache.py +215 -0
  170. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.cpp +274 -0
  171. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl/dynamic/prompt_kv_cache.py +215 -0
  172. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +80 -0
  173. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  174. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +80 -0
  175. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  176. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +80 -0
  177. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  178. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +158 -0
  179. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  180. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +158 -0
  181. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  182. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +158 -0
  183. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  184. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +158 -0
  185. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  186. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +158 -0
  187. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  188. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +158 -0
  189. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  190. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +158 -0
  191. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  192. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +158 -0
  193. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  194. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +167 -0
  195. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  196. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +167 -0
  197. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  198. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +167 -0
  199. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  200. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +167 -0
  201. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  202. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +167 -0
  203. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  204. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +167 -0
  205. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  206. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +167 -0
  207. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  208. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +167 -0
  209. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend310p/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  210. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  211. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_86a73ff6e28d734c96bb8d3054f7dd18.o → custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o} +0 -0
  212. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  213. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_f55e0ebaad1f2f572e43677336992fa0.o → custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o} +0 -0
  214. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  215. mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_576ceaeef5870c451cab59af55ea46ad.o → custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o} +0 -0
  216. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  217. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  218. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  219. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  220. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  221. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  222. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  223. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  224. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  225. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  226. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  227. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  228. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  229. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  230. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  231. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  232. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  233. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  234. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  235. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  236. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  237. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  238. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  239. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  240. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  241. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  242. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  243. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  244. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  245. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  246. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  247. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910_93/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  248. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.json +78 -0
  249. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_52f59e2a65d9b1bb002de35c2819754a.o +0 -0
  250. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.json +78 -0
  251. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_6b5e50e30256d85838d6ce83514df20f.o +0 -0
  252. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.json +78 -0
  253. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_74e4ac02880d452e3308c94af273562e.o +0 -0
  254. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.json +156 -0
  255. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_0d5520cc587ad44ce634bf3fbcffc272.o +0 -0
  256. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.json +156 -0
  257. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_20390d30b3c4c0d23167ccca6c030c2b.o +0 -0
  258. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.json +156 -0
  259. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_2d151f0b1d2db51faa2968d5b67544e2.o +0 -0
  260. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.json +156 -0
  261. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_561690ec17cc1def3d2fcf68c1b07b56.o +0 -0
  262. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.json +156 -0
  263. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_570f9aaa99e5e773b3dd0a33784363f4.o +0 -0
  264. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.json +156 -0
  265. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_59668a0f0764afb98fda8ab9e84126f1.o +0 -0
  266. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.json +156 -0
  267. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_91d9833e4792b70b670e4e2b916abd86.o +0 -0
  268. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.json +156 -0
  269. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/decoder_kv_cache/DecoderKvCache_c74cdc5fef094383401856f8519504af.o +0 -0
  270. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.json +165 -0
  271. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0515c7b1a4cd614449e38c5e9a7e3f8d.o +0 -0
  272. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.json +165 -0
  273. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_09f22d898d6358c91e7c4fc48bac48e7.o +0 -0
  274. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.json +165 -0
  275. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_0cb9a6f894b925250227136e5aab7061.o +0 -0
  276. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.json +165 -0
  277. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_2fa8702ffd7ca85e9e194f62644415d5.o +0 -0
  278. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.json +165 -0
  279. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_570b62f187dfd439b64613d881deedb7.o +0 -0
  280. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.json +165 -0
  281. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_585218c11411ff84709b9e725b66c435.o +0 -0
  282. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.json +165 -0
  283. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_5c9365ccde170b358c5b126d69dae13e.o +0 -0
  284. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.json +165 -0
  285. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/ascend910b/prompt_kv_cache/PromptKvCache_6d97c45b7c43bc16fcff8baa5dacac4e.o +0 -0
  286. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/all_finite.json +139 -0
  287. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/binary_info_config.json +361 -0
  288. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/decoder_kv_cache.json +892 -0
  289. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend310p/prompt_kv_cache.json +892 -0
  290. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/all_finite.json +139 -0
  291. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/binary_info_config.json +361 -0
  292. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/decoder_kv_cache.json +892 -0
  293. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910_93/prompt_kv_cache.json +892 -0
  294. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/all_finite.json +139 -0
  295. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/binary_info_config.json +361 -0
  296. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/decoder_kv_cache.json +892 -0
  297. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/kernel/config/ascend910b/prompt_kv_cache.json +892 -0
  298. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  299. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  300. mindspore/lib/plugin/ascend/custom_ascendc_910b/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  301. mindspore/lib/plugin/ascend/custom_ascendc_910b/version.info +1 -0
  302. mindspore/lib/plugin/ascend/custom_compiler/setup.py +1 -1
  303. mindspore/lib/plugin/ascend/libascend_collective.so +0 -0
  304. mindspore/lib/plugin/ascend/libdvpp_utils.so +0 -0
  305. mindspore/lib/plugin/ascend/libhccl_plugin.so +0 -0
  306. mindspore/lib/plugin/ascend/liblowlatency_collective.so +0 -0
  307. mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
  308. mindspore/lib/plugin/ascend/libmindspore_internal_kernels.so +0 -0
  309. mindspore/lib/plugin/ascend/libms_ascend_native_boost.so +0 -0
  310. mindspore/lib/plugin/ascend/libms_atb_boost.so +0 -0
  311. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/bin/PkgInspect +0 -0
  312. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/bin/op_man +0 -0
  313. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/device/ascend910b/bin/ascend910b.bin +957 -955
  314. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/host/libasdops_cann_host.so +0 -0
  315. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/host/libasdops_host.so +0 -0
  316. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops.so +0 -0
  317. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/libasdops_static.a +0 -0
  318. mindspore/lib/plugin/ascend/ms_kernels_internal/asdops/lib/liblcal_static.a +0 -0
  319. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/base_type.h → base_type.h} +25 -20
  320. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{cast/cast_tiling.h → internal.h} +6 -4
  321. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_op.h +114 -0
  322. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/boost_kernel.h +70 -0
  323. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/llama_impl.h +85 -0
  324. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/model_interface.h +52 -0
  325. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/llm/tensor.h +81 -0
  326. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_creator.h +123 -0
  327. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/op_param.h +155 -110
  328. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/{acme/include/tiling_info.h → tiling_info.h} +12 -9
  329. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tiling_utils.h +178 -0
  330. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_layer_norm_op.so +0 -0
  331. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_op.so +0 -0
  332. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_op.so +0 -0
  333. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_op.so +0 -0
  334. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_op.so +0 -0
  335. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcast_op.so +0 -0
  336. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libcompare_op.so +0 -0
  337. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libgelu_op.so +0 -0
  338. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libllama_op.so +0 -0
  339. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmatmul_op.so +0 -0
  340. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_kernels_internal.so +0 -0
  341. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libms_optiling.so +0 -0
  342. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libmulti_weight_matmul_kernel_op.so +0 -0
  343. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_op.so +0 -0
  344. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_op.so +0 -0
  345. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/librms_norm_op.so +0 -0
  346. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz.o +0 -0
  347. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_f16_nz/internal_pp_matmul_f16_nz_0.o +0 -0
  348. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress.o +0 -0
  349. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_i8_nz_compress/internal_pp_matmul_i8_nz_compress_0.o +0 -0
  350. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz.o +0 -0
  351. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/object_kernels/internal_pp_matmul_int8_nz/internal_pp_matmul_int8_nz_0.o +0 -0
  352. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libadd_rms_norm_quant_ascend310p.so +0 -0
  353. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_310p_impl.so → op_kernels/ascend310p/so_kernels/libapply_rotary_pos_emb_310p_ascend310p.so} +0 -0
  354. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcast_ascend310p.so +0 -0
  355. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libcompare_ascend310p.so +0 -0
  356. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libgelu_ascend310p.so +0 -0
  357. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libmatmul_ascend310p.so +0 -0
  358. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend310p/so_kernels/libreshape_and_cache_nz_ascend310p.so +0 -0
  359. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.json +163 -0
  360. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_4b60f88cdc28b25a36bad2d8b0a88092.o +0 -0
  361. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.json +163 -0
  362. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/hphol_kernels/add_rms_norm_dynamic_quant/AddRmsNormDynamicQuant_cde61da2bd6fededcb1ba310a6ad16ee.o +0 -0
  363. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  364. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  365. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  366. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  367. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  368. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  369. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  370. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  371. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix.o +0 -0
  372. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aic_0.o +0 -0
  373. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_matmul_postfusion_mix/internal_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  374. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix.o +0 -0
  375. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  376. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/internal_multi_weight_matmul_postfusion_mix/internal_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  377. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_bf16.o +0 -0
  378. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp16.o +0 -0
  379. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_bf16_fp32.o +0 -0
  380. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_bf16.o +0 -0
  381. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp16.o +0 -0
  382. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/{matmul_add_rmsnorm → object_kernels/matmul_add_rmsnorm}/matmul_add_rmsnorm_fp16_fp32.o +0 -0
  383. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2.o +0 -0
  384. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aic_0.o +0 -0
  385. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/object_kernels/paged_attention_v2/paged_attention_v2_mix_aiv_0.o +0 -0
  386. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_layer_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_layer_norm_ascend910b.so} +0 -0
  387. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libadd_rms_norm_impl.so → op_kernels/ascend910b/so_kernels/libadd_rms_norm_ascend910b.so} +0 -0
  388. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libadd_rms_norm_quant_ascend910b.so +0 -0
  389. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libapply_rotary_pos_emb_impl.so → op_kernels/ascend910b/so_kernels/libapply_rotary_pos_emb_ascend910b.so} +0 -0
  390. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libcast_impl.so → op_kernels/ascend910b/so_kernels/libcast_ascend910b.so} +0 -0
  391. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libnot_equal_impl.so → op_kernels/ascend910b/so_kernels/libcompare_ascend910b.so} +0 -0
  392. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libgelu_impl.so → op_kernels/ascend910b/so_kernels/libgelu_ascend910b.so} +0 -0
  393. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/so_kernels/libllama_ascend910b.so +0 -0
  394. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmatmul_impl.so → op_kernels/ascend910b/so_kernels/libmatmul_ascend910b.so} +0 -0
  395. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libmulti_weight_matmul_kernel_impl.so → op_kernels/ascend910b/so_kernels/libmulti_weight_matmul_kernel_ascend910b.so} +0 -0
  396. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/libreshape_and_cache_impl.so → op_kernels/ascend910b/so_kernels/libreshape_and_cache_ascend910b.so} +0 -0
  397. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/{lib/librms_norm_impl.so → op_kernels/ascend910b/so_kernels/librms_norm_ascend910b.so} +0 -0
  398. mindspore/lib/plugin/ascend/ms_kernels_internal/lccl/lib/liblccl_wrapper.so +0 -0
  399. mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
  400. mindspore/log.py +12 -0
  401. mindspore/mindrecord/__init__.py +1 -1
  402. mindspore/mindrecord/config.py +17 -316
  403. mindspore/mindrecord/filereader.py +1 -9
  404. mindspore/mindrecord/filewriter.py +5 -15
  405. mindspore/mindrecord/mindpage.py +1 -9
  406. mindspore/mint/__init__.py +824 -218
  407. mindspore/mint/distributed/__init__.py +66 -4
  408. mindspore/mint/distributed/distributed.py +2594 -44
  409. mindspore/mint/linalg/__init__.py +6 -0
  410. mindspore/mint/nn/__init__.py +473 -14
  411. mindspore/mint/nn/functional.py +486 -11
  412. mindspore/mint/nn/layer/__init__.py +17 -4
  413. mindspore/mint/nn/layer/_functions.py +330 -0
  414. mindspore/mint/nn/layer/activation.py +169 -1
  415. mindspore/mint/nn/layer/basic.py +123 -0
  416. mindspore/mint/nn/layer/conv.py +727 -0
  417. mindspore/mint/nn/layer/normalization.py +215 -19
  418. mindspore/mint/nn/layer/padding.py +797 -0
  419. mindspore/mint/nn/layer/pooling.py +170 -0
  420. mindspore/mint/optim/__init__.py +2 -1
  421. mindspore/mint/optim/adam.py +223 -0
  422. mindspore/mint/optim/adamw.py +26 -19
  423. mindspore/mint/special/__init__.py +2 -1
  424. mindspore/multiprocessing/__init__.py +5 -0
  425. mindspore/nn/__init__.py +2 -0
  426. mindspore/nn/cell.py +142 -21
  427. mindspore/nn/dynamic_lr.py +2 -1
  428. mindspore/nn/layer/activation.py +6 -6
  429. mindspore/nn/layer/basic.py +35 -25
  430. mindspore/nn/layer/channel_shuffle.py +3 -3
  431. mindspore/nn/layer/conv.py +3 -0
  432. mindspore/nn/layer/embedding.py +3 -3
  433. mindspore/nn/layer/normalization.py +8 -7
  434. mindspore/nn/layer/padding.py +4 -3
  435. mindspore/nn/layer/pooling.py +55 -23
  436. mindspore/nn/layer/rnn_cells.py +1 -1
  437. mindspore/nn/layer/rnns.py +2 -1
  438. mindspore/nn/layer/timedistributed.py +5 -5
  439. mindspore/nn/layer/transformer.py +48 -26
  440. mindspore/nn/learning_rate_schedule.py +5 -3
  441. mindspore/nn/loss/loss.py +31 -36
  442. mindspore/nn/optim/ada_grad.py +1 -0
  443. mindspore/nn/optim/adadelta.py +2 -2
  444. mindspore/nn/optim/adam.py +1 -1
  445. mindspore/nn/optim/lars.py +1 -4
  446. mindspore/nn/optim/optimizer.py +1 -1
  447. mindspore/nn/optim/rprop.py +2 -2
  448. mindspore/nn/optim/thor.py +2 -1
  449. mindspore/nn/utils/__init__.py +22 -0
  450. mindspore/nn/utils/init.py +73 -0
  451. mindspore/nn/wrap/cell_wrapper.py +4 -6
  452. mindspore/nn/wrap/loss_scale.py +3 -4
  453. mindspore/numpy/array_creations.py +60 -62
  454. mindspore/numpy/array_ops.py +148 -143
  455. mindspore/numpy/logic_ops.py +41 -42
  456. mindspore/numpy/math_ops.py +361 -359
  457. mindspore/numpy/utils.py +16 -16
  458. mindspore/numpy/utils_const.py +4 -4
  459. mindspore/ops/__init__.py +2 -1
  460. mindspore/ops/_grad_experimental/grad_comm_ops.py +107 -8
  461. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  462. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  463. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  464. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  465. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  466. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  467. mindspore/ops/_vmap/vmap_base.py +0 -2
  468. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  469. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  470. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  471. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  472. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  473. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  474. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  475. mindspore/ops/auto_generate/gen_ops_prim.py +8027 -3411
  476. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  477. mindspore/ops/composite/base.py +1 -1
  478. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  479. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  480. mindspore/ops/function/__init__.py +12 -0
  481. mindspore/ops/function/array_func.py +561 -159
  482. mindspore/ops/function/clip_func.py +64 -0
  483. mindspore/ops/function/debug_func.py +28 -20
  484. mindspore/ops/function/image_func.py +1 -1
  485. mindspore/ops/function/linalg_func.py +5 -4
  486. mindspore/ops/function/math_func.py +1664 -294
  487. mindspore/ops/function/nn_func.py +988 -317
  488. mindspore/ops/function/parameter_func.py +3 -56
  489. mindspore/ops/function/random_func.py +243 -33
  490. mindspore/ops/function/sparse_unary_func.py +1 -1
  491. mindspore/ops/functional.py +18 -5
  492. mindspore/ops/functional_overload.py +897 -0
  493. mindspore/ops/operations/__init__.py +3 -2
  494. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  495. mindspore/ops/operations/_grad_ops.py +2 -34
  496. mindspore/ops/operations/_infer_ops.py +2 -1
  497. mindspore/ops/operations/_inner_ops.py +38 -8
  498. mindspore/ops/operations/array_ops.py +45 -303
  499. mindspore/ops/operations/comm_ops.py +23 -17
  500. mindspore/ops/operations/custom_ops.py +7 -49
  501. mindspore/ops/operations/debug_ops.py +42 -47
  502. mindspore/ops/operations/inner_ops.py +6 -4
  503. mindspore/ops/operations/linalg_ops.py +3 -2
  504. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  505. mindspore/ops/operations/math_ops.py +11 -216
  506. mindspore/ops/operations/nn_ops.py +153 -310
  507. mindspore/ops/primitive.py +23 -21
  508. mindspore/ops/tensor_method.py +1669 -0
  509. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  510. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  511. mindspore/ops_generate/arg_handler.py +0 -61
  512. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  513. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  514. mindspore/ops_generate/base_generator.py +11 -0
  515. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  516. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  517. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  518. mindspore/ops_generate/functions_cc_generator.py +233 -0
  519. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  520. mindspore/ops_generate/gen_constants.py +157 -3
  521. mindspore/ops_generate/gen_ops.py +245 -990
  522. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  523. mindspore/ops_generate/gen_utils.py +119 -33
  524. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  525. mindspore/ops_generate/op_api_proto.py +206 -0
  526. mindspore/ops_generate/op_def_py_generator.py +131 -0
  527. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  528. mindspore/ops_generate/op_proto.py +373 -108
  529. mindspore/ops_generate/op_template_parser.py +436 -0
  530. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  531. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  532. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  533. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  534. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  535. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  536. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  537. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  538. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  539. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  540. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  541. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  542. mindspore/ops_generate/pyboost_utils.py +92 -33
  543. mindspore/ops_generate/template.py +294 -44
  544. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  545. mindspore/parallel/__init__.py +3 -3
  546. mindspore/parallel/_auto_parallel_context.py +44 -34
  547. mindspore/parallel/_cell_wrapper.py +22 -3
  548. mindspore/parallel/_parallel_serialization.py +13 -2
  549. mindspore/parallel/_utils.py +4 -2
  550. mindspore/parallel/algo_parameter_config.py +1 -1
  551. mindspore/parallel/checkpoint_transform.py +44 -0
  552. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  553. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  554. mindspore/parallel/cluster/run.py +20 -3
  555. mindspore/parallel/parameter_broadcast.py +1 -1
  556. mindspore/parallel/shard.py +3 -0
  557. mindspore/parallel/transform_safetensors.py +119 -253
  558. mindspore/profiler/__init__.py +17 -4
  559. mindspore/profiler/analysis/__init__.py +0 -0
  560. mindspore/profiler/analysis/parser/__init__.py +0 -0
  561. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  562. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  563. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  564. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  565. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  566. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  567. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  568. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  569. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  570. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  571. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  572. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  573. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  574. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  575. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  576. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  577. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  578. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  579. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  580. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  581. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  582. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  583. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  584. mindspore/profiler/analysis/task_manager.py +131 -0
  585. mindspore/profiler/analysis/time_converter.py +84 -0
  586. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  587. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  588. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  589. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  590. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  591. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  592. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  593. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  594. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  595. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  596. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  597. mindspore/profiler/analysis/work_flow.py +73 -0
  598. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  599. mindspore/profiler/common/command_executor.py +90 -0
  600. mindspore/profiler/common/constant.py +174 -3
  601. mindspore/profiler/common/file_manager.py +208 -0
  602. mindspore/profiler/common/log.py +130 -0
  603. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  604. mindspore/profiler/common/path_manager.py +371 -0
  605. mindspore/profiler/common/process_bar.py +168 -0
  606. mindspore/profiler/common/process_pool.py +9 -3
  607. mindspore/profiler/common/profiler_context.py +476 -0
  608. mindspore/profiler/common/profiler_info.py +304 -0
  609. mindspore/profiler/common/profiler_output_path.py +284 -0
  610. mindspore/profiler/common/profiler_parameters.py +210 -0
  611. mindspore/profiler/common/profiler_path_manager.py +120 -0
  612. mindspore/profiler/common/record_function.py +76 -0
  613. mindspore/profiler/common/tlv_decoder.py +76 -0
  614. mindspore/profiler/common/util.py +75 -2
  615. mindspore/profiler/dynamic_profiler.py +270 -37
  616. mindspore/profiler/envprofiler.py +138 -0
  617. mindspore/profiler/mstx.py +199 -0
  618. mindspore/profiler/platform/__init__.py +21 -0
  619. mindspore/profiler/platform/base_profiler.py +40 -0
  620. mindspore/profiler/platform/cpu_profiler.py +124 -0
  621. mindspore/profiler/platform/gpu_profiler.py +74 -0
  622. mindspore/profiler/platform/npu_profiler.py +309 -0
  623. mindspore/profiler/profiler.py +580 -93
  624. mindspore/profiler/profiler_action_controller.py +187 -0
  625. mindspore/profiler/profiler_interface.py +114 -0
  626. mindspore/profiler/schedule.py +208 -0
  627. mindspore/rewrite/api/symbol_tree.py +1 -2
  628. mindspore/run_check/_check_version.py +18 -13
  629. mindspore/runtime/__init__.py +37 -0
  630. mindspore/runtime/device.py +27 -0
  631. mindspore/runtime/event.py +209 -0
  632. mindspore/runtime/executor.py +148 -0
  633. mindspore/runtime/memory.py +392 -0
  634. mindspore/runtime/stream.py +460 -0
  635. mindspore/runtime/thread_bind_core.py +401 -0
  636. mindspore/train/__init__.py +2 -2
  637. mindspore/train/_utils.py +53 -18
  638. mindspore/train/amp.py +8 -4
  639. mindspore/train/callback/_checkpoint.py +32 -18
  640. mindspore/train/callback/_early_stop.py +1 -1
  641. mindspore/train/callback/_flops_collector.py +105 -69
  642. mindspore/train/callback/_history.py +1 -1
  643. mindspore/train/callback/_summary_collector.py +44 -6
  644. mindspore/train/callback/_tft_register.py +37 -15
  645. mindspore/train/dataset_helper.py +11 -11
  646. mindspore/train/metrics/precision.py +4 -5
  647. mindspore/train/mind_ir_pb2.py +167 -46
  648. mindspore/train/model.py +13 -14
  649. mindspore/train/serialization.py +461 -72
  650. mindspore/train/summary/summary_record.py +1 -2
  651. mindspore/train/train_thor/model_thor.py +1 -1
  652. mindspore/utils/__init__.py +4 -2
  653. mindspore/utils/bin/dataset-cache +0 -0
  654. mindspore/utils/bin/dataset-cache-server +0 -0
  655. mindspore/utils/dryrun.py +138 -0
  656. mindspore/utils/runtime_execution_order_check.py +550 -0
  657. mindspore/version.py +1 -1
  658. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/METADATA +3 -4
  659. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/RECORD +672 -479
  660. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  661. mindspore/_data_dump.cpython-39-aarch64-linux-gnu.so +0 -0
  662. mindspore/bin/cache_admin +0 -0
  663. mindspore/bin/cache_server +0 -0
  664. mindspore/common/_tensor_overload.py +0 -139
  665. mindspore/lib/libmindspore_np_dtype.so +0 -0
  666. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_576ceaeef5870c451cab59af55ea46ad.json +0 -58
  667. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_86a73ff6e28d734c96bb8d3054f7dd18.json +0 -58
  668. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/ascend910b/all_finite/AllFinite_f55e0ebaad1f2f572e43677336992fa0.json +0 -58
  669. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/config/ascend910b/all_finite.json +0 -109
  670. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/kernel/config/ascend910b/binary_info_config.json +0 -38
  671. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/op_tiling/lib/linux/aarch64/libcust_opmaster_rt2.0.so +0 -0
  672. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_impl/ai_core/tbe/op_tiling/liboptiling.so +0 -0
  673. mindspore/lib/plugin/ascend/custom_ascendc_ops/op_proto/lib/linux/aarch64/libcust_opsproto_rt2.0.so +0 -0
  674. mindspore/lib/plugin/ascend/custom_ascendc_ops/version.info +0 -1
  675. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme.h +0 -24
  676. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/acme_op.h +0 -82
  677. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_creator.h +0 -113
  678. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/include/op_param.h +0 -193
  679. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/dtype_registry.h +0 -90
  680. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/kernel_register.h +0 -46
  681. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/platform_configs.h +0 -89
  682. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/core/platform/rt_funcs.h +0 -135
  683. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_layer_norm_op.h +0 -60
  684. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_op.h +0 -50
  685. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/add_rms_norm_quant_op.h +0 -50
  686. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_nz_op.h +0 -42
  687. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/apply_rotary_pos_emb_op.h +0 -55
  688. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_elewise_op.h +0 -34
  689. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_only_ops.h +0 -94
  690. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/asd_op_base.h +0 -97
  691. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/cast_op.h +0 -52
  692. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/flash_attention_score_op.h +0 -92
  693. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/gelu_op.h +0 -44
  694. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_add_rmsnorm_op.h +0 -73
  695. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/matmul_op.h +0 -108
  696. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_impls_op.h +0 -64
  697. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/multi_weight_matmul_op.h +0 -91
  698. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/paged_attention_op.h +0 -99
  699. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_nz_op.h +0 -44
  700. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/reshape_and_cache_op.h +0 -44
  701. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/ops/host_src/rms_norm_op.h +0 -64
  702. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/asd_utils.h +0 -179
  703. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/comm_utils.h +0 -69
  704. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/acme/src/utils/profiling_util.h +0 -366
  705. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/add_impl.h +0 -56
  706. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/kernel/add.h +0 -21
  707. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/add/tiling/add_tiling.h +0 -43
  708. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/apply_rotary_pos_emb_impl.h +0 -46
  709. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb.h +0 -23
  710. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_base.h +0 -456
  711. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_bf16.h +0 -217
  712. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp.h +0 -391
  713. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp16.h +0 -126
  714. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_fp32.h +0 -230
  715. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_tiling.h +0 -43
  716. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb/kernel/apply_rotary_pos_emb_value.h +0 -27
  717. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/apply_rotary_pos_emb_nz_impl.h +0 -34
  718. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz.h +0 -23
  719. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_base.h +0 -460
  720. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp16.h +0 -116
  721. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_fp32.h +0 -230
  722. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_tiling.h +0 -43
  723. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/apply_rotary_pos_emb_nz/kernel/apply_rotary_pos_emb_nz_value.h +0 -27
  724. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/asdop/asd_op_impl.h +0 -74
  725. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/backend_param.h +0 -74
  726. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/cast_impl.h +0 -48
  727. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/cast/kernel/cast_kernel.h +0 -21
  728. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_impl.h +0 -55
  729. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/compare_tiling.h +0 -27
  730. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/compare/kernel/compare_kernel.h +0 -23
  731. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/and_impl.h +0 -29
  732. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/div_impl.h +0 -29
  733. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_impl.h +0 -48
  734. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/elewise_binary_tiling.h +0 -25
  735. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/and_kernel.h +0 -46
  736. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/div_kernel.h +0 -46
  737. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_base.h +0 -260
  738. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/elewise_binary_kernel.h +0 -35
  739. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/max_kernel.h +0 -66
  740. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/min_kernel.h +0 -66
  741. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/mul_kernel.h +0 -66
  742. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/kernel/or_kernel.h +0 -46
  743. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/max_impl.h +0 -29
  744. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/min_impl.h +0 -29
  745. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/mul_impl.h +0 -29
  746. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_binary/or_impl.h +0 -29
  747. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/abs_impl.h +0 -29
  748. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_impl.h +0 -47
  749. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/elewise_unary_tiling.h +0 -24
  750. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/exp_impl.h +0 -29
  751. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/abs_kernel.h +0 -45
  752. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_base.h +0 -148
  753. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/elewise_unary_kernel.h +0 -31
  754. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/exp_kernel.h +0 -45
  755. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/ln_kernel.h +0 -45
  756. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/not_kernel.h +0 -45
  757. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/reciprocal_kernel.h +0 -45
  758. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/relu_kernel.h +0 -55
  759. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/rsqrt_kernel.h +0 -45
  760. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/kernel/sqrt_kernel.h +0 -45
  761. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/ln_impl.h +0 -29
  762. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/not_impl.h +0 -29
  763. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/reciprocal_impl.h +0 -29
  764. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/relu_impl.h +0 -29
  765. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/rsqrt_impl.h +0 -29
  766. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/elewise_unary/sqrt_impl.h +0 -29
  767. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/flash_attention_score/flash_attention_score_impl.h +0 -68
  768. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_kernel.h +0 -99
  769. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/internal_rtbackend.h +0 -21
  770. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/lccl/lccl_wrapper.h +0 -58
  771. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_types.h +0 -91
  772. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/ms_int_utils.h +0 -108
  773. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/paged_attention/paged_attention_impl.h +0 -64
  774. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/add_param.h +0 -68
  775. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/attention_param.h +0 -40
  776. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/cast_param.h +0 -30
  777. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/compare_param.h +0 -31
  778. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/elewise_param.h +0 -41
  779. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/grouped_matmul_param.h +0 -40
  780. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_ext_param.h +0 -38
  781. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/matmul_qkv_param.h +0 -42
  782. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/param/sub_param.h +0 -33
  783. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/profiling_util.h +0 -377
  784. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/kernel/reshape_and_cache_nz.h +0 -24
  785. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_impl.h +0 -42
  786. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/reshape_and_cache_nz/reshape_and_cache_nz_tiling.h +0 -27
  787. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/rms_norm/rms_norm_impl.h +0 -46
  788. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/kernel/sub_kernel.h +0 -20
  789. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_impl.h +0 -48
  790. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/sub/sub_tiling.h +0 -25
  791. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/matmul_table.h +0 -399
  792. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/tune_repo/utils.h +0 -41
  793. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/backend.h +0 -45
  794. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_tiling.h +0 -29
  795. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/elewise_utils.h +0 -30
  796. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log.h +0 -69
  797. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_core.h +0 -43
  798. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_entity.h +0 -38
  799. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_sink.h +0 -69
  800. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_stream.h +0 -41
  801. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_tiling.h +0 -71
  802. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/log/log_utils.h +0 -165
  803. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/math.h +0 -20
  804. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_creator.h +0 -39
  805. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/register/kernel_registry.h +0 -121
  806. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/include/utils/utils.h +0 -106
  807. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libAdd_impl.so +0 -0
  808. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libSub_impl.so +0 -0
  809. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libadd_rms_norm_quant_acme_impl.so +0 -0
  810. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_310p_old_impl.so +0 -0
  811. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libapply_rotary_pos_emb_old_impl.so +0 -0
  812. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_impl.so +0 -0
  813. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/lib/libreshape_and_cache_nz_old_impl.so +0 -0
  814. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.json +0 -19
  815. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix.o +0 -0
  816. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aic_0.o +0 -0
  817. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMatMulPostFusionMixTactic/acme_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  818. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.json +0 -19
  819. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix.o +0 -0
  820. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aic_0.o +0 -0
  821. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/AcmeMultiWeightMatMulPostFusionMixTactic/acme_multi_weight_matmul_postfusion_mix_mix_aiv_0.o +0 -0
  822. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_full_mix.o +0 -0
  823. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bnsd_tri_mix.o +0 -0
  824. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_full_mix.o +0 -0
  825. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_bf16_bsh_tri_mix.o +0 -0
  826. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_full_mix.o +0 -0
  827. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bnsd_tri_mix.o +0 -0
  828. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_full_mix.o +0 -0
  829. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/flash_attention_score/flash_attention_score_fp16_bsh_tri_mix.o +0 -0
  830. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bnsd_mix.o +0 -0
  831. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_bf16_bsh_mix.o +0 -0
  832. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bnsd_mix.o +0 -0
  833. mindspore/lib/plugin/ascend/ms_kernels_internal/internal_kernel/op_kernels/ascend910b/paged_attention/paged_attention_fp16_bsh_mix.o +0 -0
  834. mindspore/profiler/envprofiling.py +0 -254
  835. mindspore/profiler/profiling.py +0 -1926
  836. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910}/op_api/include/aclnn_decoder_kv_cache.h +0 -0
  837. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910}/op_api/include/aclnn_prompt_kv_cache.h +0 -0
  838. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/decoder_kv_cache.cpp +0 -0
  839. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910/op_impl/ai_core/tbe/custom_ascendc_910_impl}/dynamic/prompt_kv_cache.cpp +0 -0
  840. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_api/include/aclnn_all_finite.h +0 -0
  841. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_impl/ai_core/tbe/config/ascend310p/aic-ascend310p-ops-info.json +0 -0
  842. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json → custom_ascendc_910b/op_impl/ai_core/tbe/config/ascend910_93/aic-ascend910_93-ops-info.json} +0 -0
  843. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_impl/ai_core/tbe/config/ascend910b/aic-ascend910b-ops-info.json +0 -0
  844. /mindspore/lib/plugin/ascend/{custom_ascendc_ops/op_impl/ai_core/tbe/custom_ascendc_ops_impl → custom_ascendc_910b/op_impl/ai_core/tbe/custom_ascendc_910b_impl}/dynamic/all_finite.cpp +0 -0
  845. /mindspore/lib/plugin/ascend/{custom_ascendc_ops → custom_ascendc_910b}/op_proto/inc/op_proto.h +0 -0
  846. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  847. {mindspore-2.4.1.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -1,230 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef ROTARY_POS_EMB_NZ_FP32
17
- #define ROTARY_POS_EMB_NZ_FP32
18
- #include "apply_rotary_pos_emb_nz_base.h"
19
- template <typename QK_DTYPE, typename COS_DTYPE, bool IF_COS_BROADCAST>
20
- class RopeFp32 : public RopeBase<QK_DTYPE, COS_DTYPE, IF_COS_BROADCAST> {
21
- public:
22
- __aicore__ inline RopeFp32(RopeTilingNzData *tilingData) : RopeBase<QK_DTYPE, COS_DTYPE, IF_COS_BROADCAST>(tilingData) {
23
- this->repeatSize_ = 64; // 64 = 256B / sizeof(float)
24
- this->maxProcessNum_ = 3 * MAX_LEN_FP16; // 3 for fp16 space needed
25
- this->repeatTimesQ_ = (this->tilingData_->hiddenSizeQ + this->repeatSize_ - 1) / this->repeatSize_;
26
- this->repeatTimesK_ = (this->tilingData_->hiddenSizeK + this->repeatSize_ - 1) / this->repeatSize_;
27
- headDimAlign_ = ((this->tilingData_->headDim + ELE_NUM_FP32 - 1) / ELE_NUM_FP32) * ELE_NUM_FP32;
28
- this->alignHalfHeadDim_ = (this->rotateStride_ * NUM_TWO) % ELE_NUM_FP32;
29
- this->hiddenSizeAlign_ = ((this->hiddenSize_ + this->repeatSize_ - 1) / this->repeatSize_) * this->repeatSize_;
30
- this->syncOffset_ =
31
- (this->tilingData_->headDim % ELE_NUM_FP16 == 0) ? this->hiddenSizeAlign_ : this->headNum_ * headDimAlign_;
32
- this->offsetExtraGm_ = NUM_TWO * block_idx * this->syncOffset_;
33
-
34
- sliceSizeTmp_ = (SLICE_SIZE / this->tilingData_->headDim) * this->tilingData_->headDim; // 向下取整
35
-
36
- // fp16
37
- this->oriPos_ = 0;
38
- this->removeBefore_ = this->oriPos_ + sliceSizeTmp_;
39
- this->padBefore_ = this->removeBefore_ + sliceSizeTmp_;
40
- resOut_ = this->padBefore_ + sliceSizeTmp_;
41
-
42
- // fp32
43
- this->cosPad_ = 0;
44
- this->sinPad_ = this->cosPad_ + sliceSizeTmp_;
45
- this->negOne_ = this->sinPad_ + sliceSizeTmp_;
46
- oriPosF32_ = this->negOne_ + sliceSizeTmp_;
47
- PadBeforeF32_ = oriPosF32_ + sliceSizeTmp_;
48
- removeBeforeF32_ = PadBeforeF32_ + sliceSizeTmp_;
49
- posOneF32_ = removeBeforeF32_ + sliceSizeTmp_;
50
- resOutFp32_ = posOneF32_ + sliceSizeTmp_;
51
-
52
- this->pipe_.InitBuffer(qkfp32QueueCO2_, 1,
53
- (this->tilingData_->maxUbSize - this->batchSize_ * NUM_TWO -
54
- this->maxProcessNum_ * sizeof(QK_DTYPE))); // 留給fp32的
55
- AscendC::LocalTensor<COS_DTYPE> qkfp32_perloop_ub = qkfp32QueueCO2_.AllocTensor<COS_DTYPE>();
56
- qkfp32Ubuf_ = (__ubuf__ COS_DTYPE *)qkfp32_perloop_ub.GetPhyAddr();
57
- this->pipe_.InitBuffer(outQueueCO2_, 1, ((this->maxProcessNum_) * sizeof(QK_DTYPE)));
58
- AscendC::LocalTensor<QK_DTYPE> cache_perloop_ub1 = outQueueCO2_.AllocTensor<QK_DTYPE>();
59
- commonUbuf_ = (__ubuf__ QK_DTYPE *)cache_perloop_ub1.GetPhyAddr();
60
-
61
- // 判断
62
- if (this->tilingData_->hiddenSizeQ > sliceSizeTmp_) {
63
- sliceTimeQ_ = (this->tilingData_->hiddenSizeQ + sliceSizeTmp_ - 1) / sliceSizeTmp_; // 向上取整
64
- lastSliceSizeQ_ = this->tilingData_->hiddenSizeQ - (sliceTimeQ_ - 1) * sliceSizeTmp_; // 向上取整
65
- } else {
66
- sliceTimeQ_ = 1;
67
- lastSliceSizeQ_ = this->tilingData_->hiddenSizeQ;
68
- }
69
-
70
- if (this->tilingData_->hiddenSizeK > sliceSizeTmp_) {
71
- sliceTimeK_ = (this->tilingData_->hiddenSizeK + sliceSizeTmp_ - 1) / sliceSizeTmp_; // 向上取整
72
- lastSliceSizeK_ = this->tilingData_->hiddenSizeK - (sliceTimeK_ - 1) * sliceSizeTmp_;
73
- } else {
74
- sliceTimeK_ = 1;
75
- lastSliceSizeK_ = this->tilingData_->hiddenSizeK;
76
- }
77
- }
78
-
79
- template <typename T>
80
- __aicore__ inline void CastQKDType2F32(uint32_t repeatTimes) {
81
- vconv_f162f32(qkfp32Ubuf_ + oriPosF32_, commonUbuf_ + this->oriPos_, repeatTimes, 1, 1, DEFAULT_REPEAT_STRIDE,
82
- DEFAULT_REPEAT_STRIDE / NUM_TWO);
83
- vconv_f162f32(qkfp32Ubuf_ + removeBeforeF32_, commonUbuf_ + this->removeBefore_, repeatTimes, 1, 1,
84
- DEFAULT_REPEAT_STRIDE, DEFAULT_REPEAT_STRIDE / NUM_TWO);
85
- vconv_f162f32(qkfp32Ubuf_ + PadBeforeF32_, commonUbuf_ + this->padBefore_, repeatTimes, 1, 1, DEFAULT_REPEAT_STRIDE,
86
- DEFAULT_REPEAT_STRIDE / NUM_TWO);
87
- }
88
-
89
- #if defined(__CCE_KT_TEST__) || (__CCE_AICORE__ == 220)
90
- template <>
91
- __aicore__ inline void CastQKDType2F32<bfloat16_t>(uint32_t repeatTimes) {
92
- vconv_bf162f32(qkfp32Ubuf_ + oriPosF32_, commonUbuf_ + this->oriPos_, repeatTimes, 1, 1, DEFAULT_REPEAT_STRIDE,
93
- DEFAULT_REPEAT_STRIDE / NUM_TWO);
94
- vconv_bf162f32(qkfp32Ubuf_ + removeBeforeF32_, commonUbuf_ + this->removeBefore_, repeatTimes, 1, 1,
95
- DEFAULT_REPEAT_STRIDE, DEFAULT_REPEAT_STRIDE / NUM_TWO);
96
- vconv_bf162f32(qkfp32Ubuf_ + PadBeforeF32_, commonUbuf_ + this->padBefore_, repeatTimes, 1, 1,
97
- DEFAULT_REPEAT_STRIDE, DEFAULT_REPEAT_STRIDE / NUM_TWO);
98
- }
99
- #endif
100
-
101
- template <typename T>
102
- __aicore__ inline void CastF322QKDType(__gm__ QK_DTYPE *dst, __ubuf__ QK_DTYPE *src1, __ubuf__ float *src,
103
- uint32_t repeatTimes, uint32_t hiddenSize1) {
104
- vconv_f322f16(src1, src, repeatTimes, 1, 1, DEFAULT_REPEAT_STRIDE / NUM_TWO, DEFAULT_REPEAT_STRIDE);
105
- set_flag(PIPE_V, PIPE_MTE3, EVENT_ID1);
106
-
107
- wait_flag(PIPE_V, PIPE_MTE3, EVENT_ID1);
108
- copy_ubuf_to_gm(dst, src1, 0, 1, hiddenSize1 / ELE_NUM_FP16, 0, 0);
109
- }
110
-
111
- #if defined(__CCE_KT_TEST__) || (__CCE_AICORE__ == 220)
112
- template <>
113
- __aicore__ inline void CastF322QKDType<bfloat16_t>(__gm__ QK_DTYPE *dst, __ubuf__ QK_DTYPE *src1, __ubuf__ float *src,
114
- uint32_t repeatTimes, uint32_t hiddenSize1) {
115
- vconv_f322bf16r(src1, src, repeatTimes, 1, 1, DEFAULT_REPEAT_STRIDE / NUM_TWO, DEFAULT_REPEAT_STRIDE);
116
- set_flag(PIPE_V, PIPE_MTE3, EVENT_ID1);
117
-
118
- wait_flag(PIPE_V, PIPE_MTE3, EVENT_ID1);
119
- copy_ubuf_to_gm(dst, src1, 0, 1, hiddenSize1 / ELE_NUM_FP16, 0, 0);
120
- }
121
- #endif
122
-
123
-
124
- __aicore__ inline void Process(__gm__ uint8_t *extraGm) {
125
- if (this->tilingData_->cosFormat == 1) {
126
- pipe_barrier((PIPE_ALL));
127
- this->ExpandCosSin(qkfp32Ubuf_, this->cosGm_, (__gm__ COS_DTYPE *)extraGm);
128
- this->cosGm_ = (__gm__ COS_DTYPE *)extraGm;
129
- pipe_barrier((PIPE_ALL));
130
- this->ExpandCosSin(qkfp32Ubuf_, this->sinGm_,
131
- (__gm__ COS_DTYPE *)extraGm + this->tilingData_->ntokens * this->tilingData_->headDim);
132
- this->sinGm_ = (__gm__ COS_DTYPE *)extraGm + this->tilingData_->ntokens * this->tilingData_->headDim;
133
- extraGm =
134
- extraGm + this->tilingData_->ntokens * this->tilingData_->headDim * 4; // sizeof(uint8_t) * 2 = sizeof(half)
135
- pipe_barrier((PIPE_ALL));
136
- }
137
- uint32_t headNumTempQ = this->tilingData_->hiddenSizeQ > sliceSizeTmp_
138
- ? (sliceSizeTmp_ / this->tilingData_->headDim)
139
- : this->tilingData_->headNumQ;
140
- uint32_t dynamicSliceQ =
141
- this->tilingData_->hiddenSizeQ > sliceSizeTmp_ ? sliceSizeTmp_ : this->tilingData_->hiddenSizeQ;
142
- uint32_t headNumTempK = this->tilingData_->hiddenSizeK > sliceSizeTmp_
143
- ? (sliceSizeTmp_ / this->tilingData_->headDim)
144
- : this->tilingData_->headNumK;
145
- uint32_t dynamicSliceK =
146
- this->tilingData_->hiddenSizeK > sliceSizeTmp_ ? sliceSizeTmp_ : this->tilingData_->hiddenSizeK;
147
- uint32_t repeatTemp = (dynamicSliceQ + this->repeatSize_ - 1) / this->repeatSize_;
148
- this->ExpandNeg(qkfp32Ubuf_, posOneF32_, headNumTempQ, repeatTemp);
149
- for (uint32_t zz = 0; zz < this->dynamicRound_; ++zz) { // 每个核 核内只需拷贝一次cos sin(每个头cos sin都一样)
150
- this->CosSinBroadcast(extraGm, zz, qkfp32Ubuf_,
151
- dynamicSliceQ); // 一次放得下:hiddensize, 一次放不下:sliceSizeTmp
152
- for (uint32_t perSlice = 0; perSlice < sliceTimeQ_; ++perSlice) { // 核内每块
153
- uint32_t dynamicSliceQTemp = (perSlice == sliceTimeQ_ - 1) ? lastSliceSizeQ_ : sliceSizeTmp_;
154
- headNumTempQ = dynamicSliceQTemp / this->tilingData_->headDim;
155
- uint32_t repeatTimeOnce = (dynamicSliceQTemp + this->repeatSize_ - 1) / this->repeatSize_;
156
- this->QkComm(this->qGm_ + block_idx * this->nlCoreRun_ * this->tilingData_->hiddenSizeQ +
157
- zz * this->tilingData_->hiddenSizeQ + perSlice * sliceSizeTmp_,
158
- extraGm, dynamicSliceQTemp, commonUbuf_, headNumTempQ);
159
- if (this->alignRotary_ == 0) {
160
- pipe_barrier((PIPE_V));
161
- CastQKDType2F32<QK_DTYPE>(repeatTimeOnce);
162
-
163
- pipe_barrier((PIPE_V));
164
- this->CalcRopeAlign(qkfp32Ubuf_, repeatTimeOnce, oriPosF32_, removeBeforeF32_, resOutFp32_);
165
- } else {
166
- set_flag(PIPE_MTE2, PIPE_V, EVENT_ID1);
167
- wait_flag(PIPE_MTE2, PIPE_V, EVENT_ID1);
168
-
169
- CastQKDType2F32<QK_DTYPE>(repeatTimeOnce);
170
- pipe_barrier((PIPE_V));
171
- this->CalcRope(qkfp32Ubuf_, repeatTimeOnce, oriPosF32_, removeBeforeF32_, PadBeforeF32_, posOneF32_,
172
- resOutFp32_);
173
-
174
- } // 帶PIPE_V
175
- CastF322QKDType<QK_DTYPE>(this->outQGm_ + block_idx * this->nlCoreRun_ * this->tilingData_->hiddenSizeQ +
176
- zz * this->tilingData_->hiddenSizeQ + perSlice * sliceSizeTmp_,
177
- commonUbuf_ + resOut_, qkfp32Ubuf_ + resOutFp32_, repeatTimeOnce, dynamicSliceQTemp);
178
- pipe_barrier(PIPE_ALL);
179
- }
180
- for (uint32_t perSlice = 0; perSlice < sliceTimeK_; ++perSlice) { // 核内每块
181
- uint32_t dynamicSliceKTemp = (perSlice == sliceTimeK_ - 1) ? lastSliceSizeK_ : sliceSizeTmp_;
182
- headNumTempK = dynamicSliceKTemp / this->tilingData_->headDim;
183
- uint32_t repeatTimeOnce = (dynamicSliceKTemp + this->repeatSize_ - 1) / this->repeatSize_;
184
- this->QkComm(this->kGm_ + block_idx * this->nlCoreRun_ * this->tilingData_->hiddenSizeK +
185
- zz * this->tilingData_->hiddenSizeK + perSlice * sliceSizeTmp_,
186
- extraGm, dynamicSliceKTemp, commonUbuf_, headNumTempK);
187
- if (this->alignRotary_ == 0) {
188
- pipe_barrier((PIPE_V));
189
- CastQKDType2F32<QK_DTYPE>(repeatTimeOnce);
190
-
191
- pipe_barrier((PIPE_V));
192
- this->CalcRopeAlign(qkfp32Ubuf_, repeatTimeOnce, oriPosF32_, removeBeforeF32_, resOutFp32_);
193
- } else {
194
- set_flag(PIPE_MTE2, PIPE_V, EVENT_ID1);
195
- wait_flag(PIPE_MTE2, PIPE_V, EVENT_ID1);
196
- CastQKDType2F32<QK_DTYPE>(repeatTimeOnce);
197
-
198
- pipe_barrier((PIPE_V));
199
- this->CalcRope(qkfp32Ubuf_, repeatTimeOnce, oriPosF32_, removeBeforeF32_, PadBeforeF32_, posOneF32_,
200
- resOutFp32_);
201
- } // 帶PIPE_V
202
-
203
- CastF322QKDType<QK_DTYPE>(this->outKGm_ + block_idx * this->nlCoreRun_ * this->tilingData_->hiddenSizeK +
204
- zz * this->tilingData_->hiddenSizeK + perSlice * sliceSizeTmp_,
205
- commonUbuf_ + resOut_, qkfp32Ubuf_ + resOutFp32_, repeatTimeOnce, dynamicSliceKTemp);
206
- pipe_barrier(PIPE_ALL);
207
- }
208
- }
209
- }
210
-
211
- private:
212
- AscendC::TQue<AscendC::QuePosition::VECIN, 1> qkfp32QueueCO2_;
213
- AscendC::TQue<AscendC::QuePosition::VECIN, 1> outQueueCO2_;
214
- __ubuf__ QK_DTYPE *commonUbuf_{nullptr};
215
- __ubuf__ COS_DTYPE *qkfp32Ubuf_{nullptr};
216
- uint32_t oriPosF32_{0}; // fp32的buf中qk的位置
217
- uint32_t PadBeforeF32_{0}; // fp32的buf中保存qk[-x : hiddensize - x]
218
- uint32_t removeBeforeF32_{0}; // fp32的buf中保存qk[x : hiddensize + x]
219
- uint32_t posOneF32_{0}; // fp32的buf中0 0 0 1 1 1的位置
220
- uint32_t headDimAlign_; // 对齐的headDim
221
- uint32_t sliceTimeQ_; // 切分块的次数
222
- uint32_t lastSliceSizeQ_; // 最后一块的大小
223
- uint32_t sliceTimeK_;
224
- uint32_t lastSliceSizeK_;
225
- uint32_t sliceSizeTmp_;
226
- uint32_t resOut_;
227
- uint32_t resOutFp32_;
228
- };
229
-
230
- #endif
@@ -1,43 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ROPE_NZ_TILING_DATA_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_ROPE_NZ_TILING_DATA_H_
19
-
20
- #include <stdint.h>
21
-
22
- struct RopeTilingNzData {
23
- uint32_t hiddenSizeQ{16};
24
- uint32_t hiddenSizeK{16};
25
- uint32_t headDim{1}; // qk头长度的最大值
26
- uint32_t headNumQ{1};
27
- uint32_t headNumK{1};
28
- uint32_t rotaryCoeff{4}; // 旋转系数
29
- uint32_t ntokens{1}; // 总token数
30
- uint32_t realCore{0}; // 实际用到核数
31
- uint32_t cosFormat{0}; // 是否复用cos sin
32
- uint32_t batch{32}; // 几个batch
33
- uint32_t maxUbSize{0}; // 最大UB内存
34
- uint32_t tilingId{0};
35
-
36
- uint32_t seqLen;
37
- uint32_t broadCastCos{0};
38
- uint32_t posDtype;
39
- uint32_t posSize;
40
- uint32_t maxSeqLen;
41
- };
42
-
43
- #endif
@@ -1,27 +0,0 @@
1
- /**
2
- * Copyright (c) Huawei Technologies Co., Ltd. 2024. All rights reserved.
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef COMMON_NZ_VAL_H
17
- #define COMMON_NZ_VAL_H
18
- const constexpr uint32_t NUM_TWO = 2; // 2
19
- const constexpr uint32_t BLK_SIZE = 32; // 一个block字节数
20
- const constexpr uint32_t ELE_NUM_FP16 = 16; // 一个block fp16元素个数
21
- const constexpr uint32_t ELE_NUM_FP32 = 8; // 一个block字节数 fp32元素个数
22
- const constexpr uint32_t MAX_LEN_FP16 = 8192; // 非fp16情况下最大长度(hiddensize)
23
- const constexpr uint8_t DEFAULT_REPEAT_STRIDE = 8; // 默认stride, 8 * 32 = 256
24
- const constexpr int64_t REG_910B = 48; // 饱和模式寄存器位置
25
- const constexpr int64_t REG_310P = 53; // 饱和模式寄存器位置
26
- const constexpr int64_t SLICE_SIZE = 4096; // 切片大小
27
- #endif
@@ -1,74 +0,0 @@
1
- /**
2
- * Copyright 2023-2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASDOP_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_ASDOP_IMPL_H_
18
- #include "asdops/op_desc.h"
19
- #include "asdops/operation.h"
20
- #include "asdops/run_info.h"
21
- #include "asdops/tactic.h"
22
- #include "asdops/tensor.h"
23
- #include "internal_kernel.h"
24
- #include <unordered_map>
25
- namespace mindspore {
26
- namespace internal {
27
-
28
- class AsdOpsImpl : public InternelKernelImpl {
29
- public:
30
- AsdOpsImpl(const OpParamPtr &param) : InternelKernelImpl(param){};
31
- virtual ~AsdOpsImpl() = default;
32
- bool Init(const ValidateInfo &info) override;
33
- bool InitPagedAttention910(const ValidateInfo &info);
34
- void SetInputs(const std::vector<Tensor *> &inputs) override;
35
- void SetAsd910PagedAttentionC8Inputs(const std::vector<Tensor *> &inputs);
36
- void SetOutputs(const std::vector<Tensor *> &outputs) override;
37
- void SetWorkSpace(const std::vector<DeviceRawBuf> &workspace) override;
38
- void SetStream(const void *stream_ptr) override;
39
- void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) override;
40
- int Launch() override;
41
- size_t GetTilingBufSize() override;
42
- int Tiling(HostRawBuf &tilingBuf) override;
43
- std::vector<uint64_t> GetWorkSpaceSize() override;
44
- int InferShape(const std::vector<DIMS> &input_shapes, std::vector<DIMS> &output_shapes) override;
45
- std::string GetOpName() override { return tactic_->GetName(); }
46
- uint32_t GetLaunchCoreNum() override {
47
- auto &kernelInfo = cache_info_.run_info_.GetKernelInfo();
48
- return kernelInfo.GetBlockDim();
49
- }
50
- void UpdateParam(const OpParamPtr &param) override;
51
-
52
- private:
53
- AsdOps::Tactic *InitAndGetTactic();
54
-
55
- protected:
56
- AsdOps::Tactic *tactic_ = nullptr;
57
- AsdOps::Operation *op_ = nullptr;
58
- AsdOps::LaunchParam launch_param_;
59
- AsdOps::OpDesc op_desc_;
60
- bool validated_ = false;
61
- std::string soc_{"Ascend910B4"};
62
- };
63
-
64
- class AsdOps310PImpl : public AsdOpsImpl {
65
- public:
66
- AsdOps310PImpl(const OpParamPtr &param) : AsdOpsImpl(param){};
67
- virtual ~AsdOps310PImpl() = default;
68
- void SetInputs(const std::vector<Tensor *> &inputs) override;
69
- void SetOutputs(const std::vector<Tensor *> &outputs) override;
70
- };
71
-
72
- } // namespace internal
73
- } // namespace mindspore
74
- #endif
@@ -1,74 +0,0 @@
1
- /**
2
- * Copyright 2023-2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef BACKEND_PARAM_H_
17
- #define BACKEND_PARAM_H_
18
- namespace mindspore {
19
- namespace internal {
20
-
21
- struct HardwareInfo {
22
- uint32_t coreNum{0};
23
- uint32_t l2Size{0};
24
- uint32_t l1Size{0};
25
- uint32_t l0aSize{0};
26
- uint32_t l0bSize{0};
27
- uint32_t l0cSize{0};
28
- uint32_t hbmBandWidth{1};
29
- uint32_t l2BandWidth{5};
30
- uint32_t ubSize{0};
31
- };
32
-
33
- static void GetHardwareInfoPPMatmul910B1(HardwareInfo &hwInfo) {
34
- hwInfo.coreNum = 24;
35
- hwInfo.l2Size = 201326592;
36
- hwInfo.l1Size = 524288;
37
- hwInfo.l0aSize = 65536;
38
- hwInfo.l0bSize = 65536;
39
- hwInfo.l0cSize = 131072;
40
- hwInfo.ubSize = 196608;
41
- }
42
-
43
- static void GetHardwareInfoPPMatmul910B2(HardwareInfo &hwInfo) {
44
- hwInfo.coreNum = 24;
45
- hwInfo.l2Size = 201326592;
46
- hwInfo.l1Size = 524288;
47
- hwInfo.l0aSize = 65536;
48
- hwInfo.l0bSize = 65536;
49
- hwInfo.l0cSize = 131072;
50
- hwInfo.ubSize = 196608;
51
- }
52
-
53
- static void GetHardwareInfoPPMatmul910B3(HardwareInfo &hwInfo) {
54
- hwInfo.coreNum = 20;
55
- hwInfo.l2Size = 201326592;
56
- hwInfo.l1Size = 524288;
57
- hwInfo.l0aSize = 65536;
58
- hwInfo.l0bSize = 65536;
59
- hwInfo.l0cSize = 131072;
60
- hwInfo.ubSize = 196608;
61
- }
62
-
63
- static void GetHardwareInfoPPMatmul910B4(HardwareInfo &hwInfo) {
64
- hwInfo.coreNum = 20;
65
- hwInfo.l2Size = 100663296;
66
- hwInfo.l1Size = 524288;
67
- hwInfo.l0aSize = 65536;
68
- hwInfo.l0bSize = 65536;
69
- hwInfo.l0cSize = 131072;
70
- hwInfo.ubSize = 196608;
71
- }
72
- } // namespace internal
73
- } // namespace mindspore
74
- #endif
@@ -1,48 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_CAST_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_CAST_IMPL_H_
18
-
19
- #include <vector>
20
- #include "include/internal_kernel.h"
21
-
22
- namespace mindspore {
23
- namespace internal {
24
- class CastImpl : public InternelKernelImpl {
25
- public:
26
- CastImpl(const OpParamPtr &param) : InternelKernelImpl(param) {}
27
- virtual ~CastImpl() {}
28
- bool Init(const ValidateInfo &info) override;
29
- void SetStream(const void *stream_ptr) override;
30
- void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) override;
31
- int Launch() override;
32
- uint64_t GetTilingBufSize() override;
33
- int Tiling(HostRawBuf &tilingBuf) override;
34
- std::vector<uint64_t> GetWorkSpaceSize() override;
35
- int InferShape(const std::vector<DIMS> &input_shapes, std::vector<DIMS> &output_shapes) override;
36
-
37
- private:
38
- int32_t GetCastDType();
39
- int32_t GetMaxUbCount(uint32_t cast_type);
40
- void DoUbTiling(uint32_t factor, uint32_t total_num, uint32_t &ub_num, uint32_t &ub_loop, uint32_t &ub_tail);
41
-
42
- private:
43
- DeviceRawBuf tiling_buf_;
44
- void *stream_ptr_ = nullptr;
45
- };
46
- } // namespace internal
47
- } // namespace mindspore
48
- #endif // MS_KERNELS_INTERNAL_KERNEL_CAST_IMPL_H_
@@ -1,21 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_CAST_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_CAST_KERNEL_H_
19
- void cast_do(uint32_t block_dim, void *l2ctrl, void *stream, uint8_t *in, uint8_t *out, uint8_t *tiling,
20
- uint32_t cast_type);
21
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_CAST_KERNEL_H_
@@ -1,55 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_COMPARE_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_COMPARE_IMPL_H_
18
-
19
- #include <vector>
20
- #include "include/internal_kernel.h"
21
- #include "src/utils/elewise_utils.h"
22
-
23
- namespace mindspore {
24
- namespace internal {
25
- class CompareImpl : public InternelKernelImpl {
26
- public:
27
- CompareImpl(const OpParamPtr &param) : InternelKernelImpl(param) { GetCompareMode(); }
28
- virtual ~CompareImpl() {}
29
- bool Init(const ValidateInfo &info) override;
30
- void SetStream(const void *stream_ptr) override;
31
- void SetDeviceTilingBuf(const DeviceRawBuf &tilingBuf) override;
32
- int Launch() override;
33
- uint64_t GetTilingBufSize() override;
34
- int Tiling(HostRawBuf &tilingBuf) override;
35
- std::vector<uint64_t> GetWorkSpaceSize() override;
36
- int InferShape(const std::vector<DIMS> &input_shapes, std::vector<DIMS> &output_shapes) override;
37
- bool IsSupported() override;
38
-
39
- private:
40
- int32_t GetMaxUbCount(uint32_t in_dtype);
41
- void GetCompareMode();
42
-
43
- private:
44
- DeviceRawBuf tiling_buf_;
45
- void *stream_ptr_ = nullptr;
46
- uint32_t compare_mode_{0};
47
- uint32_t broadcast_mode_{0};
48
- size_t ndims_{0};
49
- int64_t in0_shape_[MAX_COMPARE_SHAPE_LEN];
50
- int64_t in1_shape_[MAX_COMPARE_SHAPE_LEN];
51
- int64_t out_shape_[MAX_COMPARE_SHAPE_LEN];
52
- };
53
- } // namespace internal
54
- } // namespace mindspore
55
- #endif // MS_KERNELS_INTERNAL_KERNEL_COMPARE_IMPL_H_
@@ -1,27 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_COMPARE_TILING_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_COMPARE_TILING_H_
19
- #include "utils/elewise_tiling.h"
20
- namespace mindspore::internal {
21
- struct CompareTilingData : public ElewiseTailTilingData {
22
- uint32_t input_dtype{0};
23
- uint32_t broadcast_mode{0};
24
- uint32_t compare_mode{0};
25
- };
26
- } // namespace mindspore::internal
27
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_COMPARE_TILING_H_
@@ -1,23 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
-
17
- #ifndef MS_KERNELS_INTERNAL_KERNEL_ASCENDC_COMPARE_KERNEL_H_
18
- #define MS_KERNELS_INTERNAL_KERNEL_ASCENDC_COMPARE_KERNEL_H_
19
- #include <stdint.h>
20
- #define BIT_SIZE 8
21
- void compare(uint32_t blockdim, void *l2ctrl, void *stream, uint8_t *in1, uint8_t *in2, uint8_t *out, uint8_t *tiling,
22
- uint32_t dtype, uint32_t broadcast_mode, uint32_t compare_mode);
23
- #endif // MS_KERNELS_INTERNAL_KERNEL_ASCENDC_NOT_EQUAL_KERNEL_H_
@@ -1,29 +0,0 @@
1
- /**
2
- * Copyright 2024 Huawei Technologies Co., Ltd
3
- *
4
- * Licensed under the Apache License, Version 2.0 (the "License");
5
- * you may not use this file except in compliance with the License.
6
- * You may obtain a copy of the License at
7
- *
8
- * http://www.apache.org/licenses/LICENSE-2.0
9
- *
10
- * Unless required by applicable law or agreed to in writing, software
11
- * distributed under the License is distributed on an "AS IS" BASIS,
12
- * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
- * See the License for the specific language governing permissions and
14
- * limitations under the License.
15
- */
16
- #ifndef MS_KERNELS_INTERNAL_KERNEL_AND_IMPL_H_
17
- #define MS_KERNELS_INTERNAL_KERNEL_AND_IMPL_H_
18
- #include "elewise_binary_impl.h"
19
- namespace mindspore {
20
- namespace internal {
21
- class AndImpl : public ElewiseBinaryImpl {
22
- public:
23
- AndImpl(const OpParamPtr &param) : ElewiseBinaryImpl(param) {}
24
- virtual ~AndImpl() {}
25
- int Launch() override;
26
- };
27
- } // namespace internal
28
- } // namespace mindspore
29
- #endif // MS_KERNELS_INTERNAL_KERNEL_AND_IMPL_H_