mindspore 2.4.10__cp311-cp311-win_amd64.whl → 2.5.0__cp311-cp311-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (366)
  1. mindspore/.commit_id +1 -1
  2. mindspore/__init__.py +8 -3
  3. mindspore/_c_dataengine.cp311-win_amd64.pyd +0 -0
  4. mindspore/_c_expression.cp311-win_amd64.pyd +0 -0
  5. mindspore/_c_mindrecord.cp311-win_amd64.pyd +0 -0
  6. mindspore/_checkparam.py +0 -5
  7. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  8. mindspore/_extends/parse/compile_config.py +64 -0
  9. mindspore/_extends/parse/deprecated/__init__.py +0 -0
  10. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +375 -0
  11. mindspore/_extends/parse/parser.py +23 -5
  12. mindspore/_extends/parse/standard_method.py +123 -27
  13. mindspore/_extends/pijit/pijit_func_white_list.py +1 -1
  14. mindspore/amp.py +7 -1
  15. mindspore/avcodec-59.dll +0 -0
  16. mindspore/avdevice-59.dll +0 -0
  17. mindspore/avfilter-8.dll +0 -0
  18. mindspore/avformat-59.dll +0 -0
  19. mindspore/avutil-57.dll +0 -0
  20. mindspore/boost/boost_cell_wrapper.py +136 -41
  21. mindspore/common/__init__.py +3 -1
  22. mindspore/common/_register_for_tensor.py +0 -1
  23. mindspore/common/_stub_tensor.py +25 -4
  24. mindspore/common/_tensor_cpp_method.py +17 -0
  25. mindspore/common/_tensor_docs.py +6132 -0
  26. mindspore/common/api.py +98 -21
  27. mindspore/common/dtype.py +34 -34
  28. mindspore/common/dump.py +2 -1
  29. mindspore/common/file_system.py +8 -3
  30. mindspore/common/generator.py +2 -0
  31. mindspore/common/hook_handle.py +3 -1
  32. mindspore/common/initializer.py +3 -4
  33. mindspore/common/lazy_inline.py +8 -2
  34. mindspore/common/mindir_util.py +10 -2
  35. mindspore/common/parameter.py +31 -15
  36. mindspore/common/tensor.py +713 -1337
  37. mindspore/communication/__init__.py +1 -1
  38. mindspore/communication/_comm_helper.py +5 -0
  39. mindspore/communication/comm_func.py +215 -173
  40. mindspore/communication/management.py +23 -20
  41. mindspore/context.py +285 -191
  42. mindspore/dataset/__init__.py +23 -19
  43. mindspore/dataset/callback/ds_callback.py +2 -1
  44. mindspore/dataset/core/config.py +84 -3
  45. mindspore/dataset/engine/cache_admin.py +3 -3
  46. mindspore/dataset/engine/cache_client.py +5 -4
  47. mindspore/dataset/engine/datasets.py +192 -149
  48. mindspore/dataset/engine/datasets_audio.py +14 -0
  49. mindspore/dataset/engine/datasets_standard_format.py +11 -11
  50. mindspore/dataset/engine/datasets_text.py +38 -1
  51. mindspore/dataset/engine/datasets_user_defined.py +100 -66
  52. mindspore/dataset/engine/datasets_vision.py +81 -8
  53. mindspore/dataset/engine/iterators.py +281 -63
  54. mindspore/dataset/engine/obs/util.py +8 -0
  55. mindspore/dataset/engine/queue.py +40 -0
  56. mindspore/dataset/engine/samplers.py +26 -2
  57. mindspore/dataset/engine/serializer_deserializer.py +1 -1
  58. mindspore/dataset/engine/validators.py +43 -11
  59. mindspore/dataset/transforms/py_transforms_util.py +17 -0
  60. mindspore/dataset/transforms/transforms.py +29 -12
  61. mindspore/dataset/vision/validators.py +1 -2
  62. mindspore/device_context/__init__.py +21 -0
  63. mindspore/device_context/ascend/__init__.py +25 -0
  64. mindspore/device_context/ascend/device.py +72 -0
  65. mindspore/device_context/ascend/op_debug.py +94 -0
  66. mindspore/device_context/ascend/op_precision.py +193 -0
  67. mindspore/device_context/ascend/op_tuning.py +127 -0
  68. mindspore/device_context/cpu/__init__.py +25 -0
  69. mindspore/device_context/cpu/device.py +62 -0
  70. mindspore/device_context/cpu/op_tuning.py +43 -0
  71. mindspore/device_context/gpu/__init__.py +21 -0
  72. mindspore/device_context/gpu/device.py +70 -0
  73. mindspore/device_context/gpu/op_precision.py +67 -0
  74. mindspore/device_context/gpu/op_tuning.py +175 -0
  75. mindspore/device_manager.py +134 -0
  76. mindspore/dnnl.dll +0 -0
  77. mindspore/experimental/llm_boost/__init__.py +1 -0
  78. mindspore/experimental/llm_boost/ascend_native/__init__.py +22 -0
  79. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +211 -0
  80. mindspore/experimental/llm_boost/ascend_native/llm_boost.py +52 -0
  81. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  82. mindspore/experimental/llm_boost/atb/llama_boost.py +6 -1
  83. mindspore/experimental/llm_boost/register.py +1 -0
  84. mindspore/experimental/optim/adadelta.py +26 -22
  85. mindspore/experimental/optim/adam.py +3 -0
  86. mindspore/experimental/optim/lr_scheduler.py +33 -24
  87. mindspore/experimental/optim/radam.py +33 -30
  88. mindspore/hal/device.py +28 -0
  89. mindspore/hal/event.py +17 -0
  90. mindspore/hal/memory.py +94 -3
  91. mindspore/hal/stream.py +91 -6
  92. mindspore/include/api/context.h +0 -1
  93. mindspore/jpeg62.dll +0 -0
  94. mindspore/log.py +12 -0
  95. mindspore/mindrecord/__init__.py +1 -1
  96. mindspore/mindrecord/config.py +17 -316
  97. mindspore/mindrecord/filereader.py +1 -9
  98. mindspore/mindrecord/filewriter.py +5 -15
  99. mindspore/mindrecord/mindpage.py +1 -9
  100. mindspore/mindspore_backend.dll +0 -0
  101. mindspore/mindspore_common.dll +0 -0
  102. mindspore/mindspore_core.dll +0 -0
  103. mindspore/mindspore_glog.dll +0 -0
  104. mindspore/mindspore_ops.dll +0 -0
  105. mindspore/mint/__init__.py +824 -218
  106. mindspore/mint/distributed/__init__.py +66 -4
  107. mindspore/mint/distributed/distributed.py +2594 -44
  108. mindspore/mint/linalg/__init__.py +6 -0
  109. mindspore/mint/nn/__init__.py +473 -14
  110. mindspore/mint/nn/functional.py +486 -11
  111. mindspore/mint/nn/layer/__init__.py +17 -4
  112. mindspore/mint/nn/layer/_functions.py +330 -0
  113. mindspore/mint/nn/layer/activation.py +169 -1
  114. mindspore/mint/nn/layer/basic.py +123 -0
  115. mindspore/mint/nn/layer/conv.py +727 -0
  116. mindspore/mint/nn/layer/normalization.py +215 -19
  117. mindspore/mint/nn/layer/padding.py +797 -0
  118. mindspore/mint/nn/layer/pooling.py +170 -0
  119. mindspore/mint/optim/__init__.py +2 -1
  120. mindspore/mint/optim/adam.py +223 -0
  121. mindspore/mint/optim/adamw.py +26 -19
  122. mindspore/mint/special/__init__.py +2 -1
  123. mindspore/multiprocessing/__init__.py +5 -0
  124. mindspore/nn/cell.py +126 -19
  125. mindspore/nn/dynamic_lr.py +2 -1
  126. mindspore/nn/layer/activation.py +6 -6
  127. mindspore/nn/layer/basic.py +35 -25
  128. mindspore/nn/layer/channel_shuffle.py +3 -3
  129. mindspore/nn/layer/embedding.py +3 -3
  130. mindspore/nn/layer/normalization.py +8 -7
  131. mindspore/nn/layer/padding.py +4 -3
  132. mindspore/nn/layer/pooling.py +47 -13
  133. mindspore/nn/layer/rnn_cells.py +1 -1
  134. mindspore/nn/layer/rnns.py +2 -1
  135. mindspore/nn/layer/timedistributed.py +5 -5
  136. mindspore/nn/layer/transformer.py +48 -26
  137. mindspore/nn/learning_rate_schedule.py +5 -3
  138. mindspore/nn/loss/loss.py +31 -36
  139. mindspore/nn/optim/ada_grad.py +1 -0
  140. mindspore/nn/optim/adadelta.py +2 -2
  141. mindspore/nn/optim/adam.py +1 -1
  142. mindspore/nn/optim/lars.py +1 -4
  143. mindspore/nn/optim/optimizer.py +1 -1
  144. mindspore/nn/optim/rprop.py +2 -2
  145. mindspore/nn/optim/thor.py +2 -1
  146. mindspore/nn/utils/init.py +13 -11
  147. mindspore/nn/wrap/cell_wrapper.py +4 -6
  148. mindspore/nn/wrap/loss_scale.py +3 -4
  149. mindspore/numpy/array_creations.py +60 -62
  150. mindspore/numpy/array_ops.py +148 -143
  151. mindspore/numpy/logic_ops.py +41 -42
  152. mindspore/numpy/math_ops.py +361 -359
  153. mindspore/numpy/utils.py +16 -16
  154. mindspore/numpy/utils_const.py +4 -4
  155. mindspore/opencv_core452.dll +0 -0
  156. mindspore/opencv_imgcodecs452.dll +0 -0
  157. mindspore/opencv_imgproc452.dll +0 -0
  158. mindspore/ops/__init__.py +2 -1
  159. mindspore/ops/_grad_experimental/grad_comm_ops.py +94 -13
  160. mindspore/ops/_grad_experimental/grad_debug_ops.py +6 -1
  161. mindspore/ops/_grad_experimental/grad_inner_ops.py +9 -0
  162. mindspore/ops/_grad_experimental/grad_math_ops.py +2 -1
  163. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  164. mindspore/ops/_op_impl/cpu/raise_op.py +28 -0
  165. mindspore/ops/_vmap/vmap_array_ops.py +20 -19
  166. mindspore/ops/_vmap/vmap_base.py +0 -2
  167. mindspore/ops/_vmap/vmap_grad_nn_ops.py +19 -13
  168. mindspore/ops/_vmap/vmap_math_ops.py +11 -9
  169. mindspore/ops/_vmap/vmap_nn_ops.py +20 -34
  170. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +149 -12
  171. mindspore/ops/auto_generate/gen_arg_handler.py +0 -61
  172. mindspore/ops/auto_generate/gen_extend_func.py +554 -60
  173. mindspore/ops/auto_generate/gen_ops_def.py +1621 -115
  174. mindspore/ops/auto_generate/gen_ops_prim.py +8024 -3409
  175. mindspore/ops/auto_generate/pyboost_inner_prim.py +183 -79
  176. mindspore/ops/composite/base.py +1 -1
  177. mindspore/ops/composite/multitype_ops/_compile_utils.py +229 -30
  178. mindspore/ops/composite/multitype_ops/pow_impl.py +0 -29
  179. mindspore/ops/function/__init__.py +12 -0
  180. mindspore/ops/function/array_func.py +561 -159
  181. mindspore/ops/function/clip_func.py +64 -0
  182. mindspore/ops/function/debug_func.py +28 -20
  183. mindspore/ops/function/image_func.py +1 -1
  184. mindspore/ops/function/linalg_func.py +5 -4
  185. mindspore/ops/function/math_func.py +1659 -290
  186. mindspore/ops/function/nn_func.py +988 -317
  187. mindspore/ops/function/parameter_func.py +3 -56
  188. mindspore/ops/function/random_func.py +243 -33
  189. mindspore/ops/function/sparse_unary_func.py +1 -1
  190. mindspore/ops/functional.py +18 -5
  191. mindspore/ops/functional_overload.py +897 -0
  192. mindspore/ops/operations/__init__.py +3 -2
  193. mindspore/ops/operations/_embedding_cache_ops.py +4 -4
  194. mindspore/ops/operations/_grad_ops.py +2 -34
  195. mindspore/ops/operations/_infer_ops.py +2 -1
  196. mindspore/ops/operations/_inner_ops.py +38 -8
  197. mindspore/ops/operations/array_ops.py +45 -303
  198. mindspore/ops/operations/comm_ops.py +19 -16
  199. mindspore/ops/operations/custom_ops.py +11 -55
  200. mindspore/ops/operations/debug_ops.py +42 -47
  201. mindspore/ops/operations/inner_ops.py +6 -4
  202. mindspore/ops/operations/linalg_ops.py +3 -2
  203. mindspore/ops/operations/manually_defined/ops_def.py +185 -104
  204. mindspore/ops/operations/math_ops.py +11 -216
  205. mindspore/ops/operations/nn_ops.py +146 -308
  206. mindspore/ops/primitive.py +23 -21
  207. mindspore/ops/tensor_method.py +1669 -0
  208. mindspore/ops_generate/aclnn_kernel_register_auto_cc_generator.py +110 -0
  209. mindspore/ops_generate/add_tensor_docs_generator.py +54 -0
  210. mindspore/ops_generate/arg_handler.py +0 -61
  211. mindspore/ops_generate/auto_grad_impl_cc_generator.py +135 -0
  212. mindspore/ops_generate/auto_grad_reg_cc_generator.py +93 -0
  213. mindspore/ops_generate/base_generator.py +11 -0
  214. mindspore/ops_generate/cpp_create_prim_instance_helper_generator.py +108 -0
  215. mindspore/ops_generate/functional_map_cpp_generator.py +491 -0
  216. mindspore/ops_generate/functional_overload_py_generator.py +110 -0
  217. mindspore/ops_generate/functions_cc_generator.py +233 -0
  218. mindspore/ops_generate/gen_aclnn_implement.py +110 -114
  219. mindspore/ops_generate/gen_constants.py +157 -3
  220. mindspore/ops_generate/gen_ops.py +245 -990
  221. mindspore/ops_generate/gen_pyboost_func.py +97 -998
  222. mindspore/ops_generate/gen_utils.py +119 -33
  223. mindspore/ops_generate/lite_ops_cpp_generator.py +155 -0
  224. mindspore/ops_generate/op_api_proto.py +206 -0
  225. mindspore/ops_generate/op_def_py_generator.py +131 -0
  226. mindspore/ops_generate/op_prim_py_generator.py +480 -0
  227. mindspore/ops_generate/op_proto.py +373 -108
  228. mindspore/ops_generate/op_template_parser.py +436 -0
  229. mindspore/ops_generate/ops_def_cc_generator.py +288 -0
  230. mindspore/ops_generate/ops_def_h_generator.py +74 -0
  231. mindspore/ops_generate/ops_name_h_generator.py +68 -0
  232. mindspore/ops_generate/ops_primitive_h_generator.py +81 -0
  233. mindspore/ops_generate/pyboost_functions_cpp_generator.py +370 -0
  234. mindspore/ops_generate/pyboost_functions_h_generator.py +68 -0
  235. mindspore/ops_generate/pyboost_functions_py_generator.py +148 -0
  236. mindspore/ops_generate/pyboost_grad_function_cpp_generator.py +154 -0
  237. mindspore/ops_generate/pyboost_inner_prim_generator.py +131 -0
  238. mindspore/ops_generate/pyboost_native_grad_functions_generator.py +268 -0
  239. mindspore/ops_generate/pyboost_op_cpp_code_generator.py +851 -0
  240. mindspore/ops_generate/pyboost_overload_functions_cpp_generator.py +344 -0
  241. mindspore/ops_generate/pyboost_utils.py +92 -33
  242. mindspore/ops_generate/template.py +294 -44
  243. mindspore/ops_generate/tensor_func_reg_cpp_generator.py +422 -0
  244. mindspore/parallel/__init__.py +3 -3
  245. mindspore/parallel/_auto_parallel_context.py +24 -33
  246. mindspore/parallel/_parallel_serialization.py +13 -2
  247. mindspore/parallel/_utils.py +4 -1
  248. mindspore/parallel/algo_parameter_config.py +1 -1
  249. mindspore/parallel/checkpoint_transform.py +44 -0
  250. mindspore/parallel/cluster/process_entity/_api.py +131 -37
  251. mindspore/parallel/cluster/process_entity/_utils.py +41 -6
  252. mindspore/parallel/cluster/run.py +20 -3
  253. mindspore/parallel/parameter_broadcast.py +1 -1
  254. mindspore/parallel/shard.py +3 -0
  255. mindspore/parallel/transform_safetensors.py +119 -253
  256. mindspore/profiler/__init__.py +17 -4
  257. mindspore/profiler/analysis/__init__.py +0 -0
  258. mindspore/profiler/analysis/parser/__init__.py +0 -0
  259. mindspore/profiler/analysis/parser/ascend_cann_parser.py +166 -0
  260. mindspore/profiler/analysis/parser/base_parser.py +158 -0
  261. mindspore/profiler/analysis/parser/framework_cann_relation_parser.py +45 -0
  262. mindspore/profiler/analysis/parser/ms_framework_parser.py +142 -0
  263. mindspore/profiler/analysis/parser/ms_minddata_parser.py +145 -0
  264. mindspore/profiler/analysis/parser/timeline_assembly_factory/__init__.py +0 -0
  265. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +261 -0
  266. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +40 -0
  267. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +84 -0
  268. mindspore/profiler/analysis/parser/timeline_creator/__init__.py +0 -0
  269. mindspore/profiler/analysis/parser/timeline_creator/base_timeline_creator.py +44 -0
  270. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +90 -0
  271. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +76 -0
  272. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +103 -0
  273. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +134 -0
  274. mindspore/profiler/analysis/parser/timeline_event/__init__.py +0 -0
  275. mindspore/profiler/analysis/parser/timeline_event/base_event.py +233 -0
  276. mindspore/profiler/analysis/parser/timeline_event/cpu_op_event.py +47 -0
  277. mindspore/profiler/analysis/parser/timeline_event/flow_event.py +36 -0
  278. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +260 -0
  279. mindspore/profiler/analysis/parser/timeline_event/msprof_event.py +73 -0
  280. mindspore/profiler/analysis/parser/timeline_event/scope_layer_event.py +53 -0
  281. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +146 -0
  282. mindspore/profiler/analysis/task_manager.py +131 -0
  283. mindspore/profiler/analysis/time_converter.py +84 -0
  284. mindspore/profiler/analysis/viewer/__init__.py +0 -0
  285. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +333 -0
  286. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +87 -0
  287. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +252 -0
  288. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +313 -0
  289. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +322 -0
  290. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +265 -0
  291. mindspore/profiler/analysis/viewer/ascend_timeline_viewer.py +58 -0
  292. mindspore/profiler/analysis/viewer/base_viewer.py +26 -0
  293. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +97 -0
  294. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +581 -0
  295. mindspore/profiler/analysis/work_flow.py +73 -0
  296. mindspore/profiler/common/ascend_msprof_exporter.py +138 -0
  297. mindspore/profiler/common/command_executor.py +90 -0
  298. mindspore/profiler/common/constant.py +174 -3
  299. mindspore/profiler/common/file_manager.py +208 -0
  300. mindspore/profiler/common/log.py +130 -0
  301. mindspore/profiler/common/msprof_cmd_tool.py +202 -0
  302. mindspore/profiler/common/path_manager.py +371 -0
  303. mindspore/profiler/common/process_bar.py +168 -0
  304. mindspore/profiler/common/process_pool.py +9 -3
  305. mindspore/profiler/common/profiler_context.py +476 -0
  306. mindspore/profiler/common/profiler_info.py +304 -0
  307. mindspore/profiler/common/profiler_output_path.py +284 -0
  308. mindspore/profiler/common/profiler_parameters.py +210 -0
  309. mindspore/profiler/common/profiler_path_manager.py +120 -0
  310. mindspore/profiler/common/record_function.py +76 -0
  311. mindspore/profiler/common/tlv_decoder.py +76 -0
  312. mindspore/profiler/common/util.py +75 -2
  313. mindspore/profiler/dynamic_profiler.py +270 -37
  314. mindspore/profiler/envprofiler.py +138 -0
  315. mindspore/profiler/mstx.py +199 -0
  316. mindspore/profiler/platform/__init__.py +21 -0
  317. mindspore/profiler/platform/base_profiler.py +40 -0
  318. mindspore/profiler/platform/cpu_profiler.py +124 -0
  319. mindspore/profiler/platform/gpu_profiler.py +74 -0
  320. mindspore/profiler/platform/npu_profiler.py +309 -0
  321. mindspore/profiler/profiler.py +580 -93
  322. mindspore/profiler/profiler_action_controller.py +187 -0
  323. mindspore/profiler/profiler_interface.py +114 -0
  324. mindspore/profiler/schedule.py +208 -0
  325. mindspore/rewrite/api/symbol_tree.py +1 -2
  326. mindspore/run_check/_check_version.py +2 -6
  327. mindspore/runtime/__init__.py +37 -0
  328. mindspore/runtime/device.py +27 -0
  329. mindspore/runtime/event.py +209 -0
  330. mindspore/runtime/executor.py +148 -0
  331. mindspore/runtime/memory.py +392 -0
  332. mindspore/runtime/stream.py +460 -0
  333. mindspore/runtime/thread_bind_core.py +401 -0
  334. mindspore/swresample-4.dll +0 -0
  335. mindspore/swscale-6.dll +0 -0
  336. mindspore/tinyxml2.dll +0 -0
  337. mindspore/train/__init__.py +2 -2
  338. mindspore/train/_utils.py +53 -18
  339. mindspore/train/amp.py +8 -4
  340. mindspore/train/callback/_checkpoint.py +32 -18
  341. mindspore/train/callback/_early_stop.py +1 -1
  342. mindspore/train/callback/_flops_collector.py +105 -69
  343. mindspore/train/callback/_history.py +1 -1
  344. mindspore/train/callback/_summary_collector.py +44 -6
  345. mindspore/train/callback/_tft_register.py +31 -10
  346. mindspore/train/dataset_helper.py +11 -11
  347. mindspore/train/metrics/precision.py +4 -5
  348. mindspore/train/mind_ir_pb2.py +167 -46
  349. mindspore/train/model.py +13 -15
  350. mindspore/train/serialization.py +462 -76
  351. mindspore/train/summary/summary_record.py +1 -2
  352. mindspore/train/train_thor/model_thor.py +1 -1
  353. mindspore/turbojpeg.dll +0 -0
  354. mindspore/utils/__init__.py +4 -2
  355. mindspore/utils/dryrun.py +138 -0
  356. mindspore/utils/runtime_execution_order_check.py +550 -0
  357. mindspore/version.py +1 -1
  358. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/METADATA +2 -3
  359. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/RECORD +362 -238
  360. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/entry_points.txt +1 -1
  361. mindspore/common/_tensor_overload.py +0 -139
  362. mindspore/mindspore_np_dtype.dll +0 -0
  363. mindspore/profiler/envprofiling.py +0 -254
  364. mindspore/profiler/profiling.py +0 -1926
  365. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/WHEEL +0 -0
  366. {mindspore-2.4.10.dist-info → mindspore-2.5.0.dist-info}/top_level.txt +0 -0
@@ -19,6 +19,7 @@ from __future__ import absolute_import
19
19
  import mindspore.numpy as mnp
20
20
  from mindspore.ops import operations as P
21
21
  from mindspore.ops import functional as F
22
+ from mindspore.ops import auto_generate as gen
22
23
  from mindspore.ops.auto_generate import MatMulExt
23
24
  from mindspore.ops.primitive import _primexpr
24
25
  from mindspore.common import Tensor
@@ -29,7 +30,7 @@ from mindspore.ops.primitive import Primitive
29
30
  from mindspore.ops.function import _VmapGeneralRule
30
31
  from mindspore.ops._vmap.vmap_base import vmap_rules_getters, vmap_general_preprocess, get_assign_vmap_rule, \
31
32
  get_unop_vmap_rule, _raise_value_error, _bdim_at_front, _broadcast_by_axis, _handle_broadcasting, \
32
- _vmap_clone_prim, _bdim_at_any, _get_reduce_batch_axis, _get_reduce_out_dim
33
+ _bdim_at_any, _get_reduce_batch_axis, _get_reduce_out_dim
33
34
  from mindspore.ops.operations.math_ops import Bernoulli, BesselI0, BesselI1, BesselJ0, BesselJ1, \
34
35
  BesselK0, BesselK0e, BesselY0, BesselY1, BesselK1, BesselK1e, Median
35
36
 
@@ -128,28 +129,29 @@ def get_addcxxx_vmap_rule(prim, axis_size):
128
129
  return vmap_rule
129
130
 
130
131
 
131
- @vmap_rules_getters.register(P.Cdist)
132
+ @vmap_rules_getters.register(gen.Cdist)
132
133
  def get_cdist_vmap_rule(prim, axis_size):
133
134
  """VmapRule for `cdist` operation."""
134
- if hasattr(prim, 'batch_rank'):
135
- batch_rank = prim.batch_rank + 1
135
+ if prim.has_label("batch_rank"):
136
+ batch_rank = prim.get_label("batch_rank") + 1
136
137
  else:
137
138
  batch_rank = 1
138
139
 
139
- batch_prim = _vmap_clone_prim(prim)
140
- batch_prim.add_prim_attr("batch_rank", batch_rank)
140
+ prim = prim.clone()
141
+ prim.set_label('batch_rank', batch_rank)
141
142
 
142
- def vmap_rule(x_bdim, y_bdim):
143
+ def vmap_rule(x_bdim, y_bdim, p_bdim):
143
144
  x, x_dim = x_bdim
144
145
  y, y_dim = y_bdim
146
+ p, _ = p_bdim
145
147
 
146
- if x_dim is None and y_dim is None:
148
+ if x_dim is None and y_dim is None and p is None:
147
149
  out = prim(x, y)
148
150
  return (out, None)
149
151
  x = _bdim_at_front(x, x_dim, axis_size)
150
152
  y = _bdim_at_front(y, y_dim, axis_size)
151
153
 
152
- out = batch_prim(x, y)
154
+ out = prim(x, y, p)
153
155
  return out, 0
154
156
 
155
157
  return vmap_rule
@@ -987,28 +987,16 @@ def get_kl_div_loss_grad_vmap_rule(prim, axis_size):
987
987
  @vmap_rules_getters.register(P.SmoothL1Loss)
988
988
  def get_smooth_l1_loss_vmap_rule(prim, axis_size):
989
989
  """VmapRule for `SmoothL1Loss` operation."""
990
- if isinstance(prim, str):
991
- prim = Primitive(prim)
992
- prim_beta = 1.0
993
- prim_reduction = 'none'
994
- else:
995
- prim_reduction = prim.reduction
996
- prim_beta = prim.beta
997
-
998
- smooth_l1_loss_op = P.SmoothL1Loss(prim_beta, 'none')
999
- if prim_reduction == 'mean':
1000
- reduce_op = P.ReduceMean()
1001
- elif prim_reduction == "sum":
1002
- reduce_op = P.ReduceSum()
1003
-
1004
- def vmap_rule(x_bdim, target_bdim):
990
+ def vmap_rule(x_bdim, target_bdim, beta_bdim, reduction_bdim):
1005
991
  is_all_none, result = vmap_general_preprocess(
1006
- prim, x_bdim, target_bdim)
992
+ prim, x_bdim, target_bdim, beta_bdim, reduction_bdim)
1007
993
  if is_all_none:
1008
994
  return result
1009
995
 
1010
996
  x, x_dim = x_bdim
1011
997
  target, target_dim = target_bdim
998
+ beta, _ = beta_bdim
999
+ reduction, _ = reduction_bdim
1012
1000
  x_ndim = F.rank(x)
1013
1001
  target_ndim = F.rank(target)
1014
1002
  max_rank = max(x_ndim, target_ndim)
@@ -1020,15 +1008,20 @@ def get_smooth_l1_loss_vmap_rule(prim, axis_size):
1020
1008
  reduce_indexes = tuple(range(1, max_rank))
1021
1009
 
1022
1010
  # elementwise style when reduction='none', otherwise reduce style
1023
- if prim_reduction == "none":
1024
- out = prim(x, target)
1025
- elif prim_reduction in ("mean", "sum"):
1026
- out = smooth_l1_loss_op(x, target)
1011
+ # reduction is number
1012
+ none_enum = handler.str_to_enum("SmoothL1Loss", "reduction", "none")
1013
+ mean_enum = handler.str_to_enum("SmoothL1Loss", "reduction", "mean")
1014
+ sum_enum = handler.str_to_enum("SmoothL1Loss", "reduction", "sum")
1015
+ if reduction in (none_enum, mean_enum, sum_enum):
1016
+ out = prim(x, target, beta, none_enum)
1027
1017
  if reduce_indexes is not None:
1028
- out = reduce_op(out, reduce_indexes)
1018
+ if reduction == mean_enum:
1019
+ out = P.ReduceMean()(out, reduce_indexes)
1020
+ elif reduction == sum_enum:
1021
+ out = P.ReduceSum()(out, reduce_indexes)
1029
1022
  else:
1030
1023
  raise RuntimeError("For SmoothL1Loss vmap, reduction should be one of "
1031
- "['none', 'mean', 'sum'], but got '{}'".format(prim_reduction))
1024
+ "['none', 'mean', 'sum'], but got '{}'".format(reduction))
1032
1025
  return out, 0
1033
1026
 
1034
1027
  return vmap_rule
@@ -1037,29 +1030,22 @@ def get_smooth_l1_loss_vmap_rule(prim, axis_size):
1037
1030
  @vmap_rules_getters.register(G.SmoothL1LossGrad)
1038
1031
  def get_smooth_l1_loss_grad_vmap_rule(prim, axis_size):
1039
1032
  """VmapRule for `SmoothL1LossGrad`."""
1040
- if isinstance(prim, str):
1041
- prim = Primitive(prim)
1042
- reduction = "none"
1043
- beta = 1.0
1044
- else:
1045
- reduction = prim.reduction
1046
- beta = prim.beta
1047
- smooth_l1_loss_grad = G.SmoothL1LossGrad(beta, reduction)
1048
-
1049
- def vmap_rule(x_bdim, target_bdim, dy_bdim):
1033
+ def vmap_rule(x_bdim, target_bdim, dy_bdim, beta_bdim, reduction_bdim):
1050
1034
  is_all_none, result = vmap_general_preprocess(
1051
- prim, dy_bdim, x_bdim, target_bdim)
1035
+ prim, dy_bdim, x_bdim, target_bdim, beta_bdim, reduction_bdim)
1052
1036
  if is_all_none:
1053
1037
  return result
1054
1038
 
1055
1039
  dy, dy_dim = dy_bdim
1056
1040
  x, x_dim = x_bdim
1057
1041
  target, target_dim = target_bdim
1042
+ beta, _ = beta_bdim
1043
+ reduction, _ = reduction_bdim
1058
1044
  dy = _bdim_at_front(dy, dy_dim, axis_size)
1059
1045
  x = _bdim_at_front(x, x_dim, axis_size)
1060
1046
  target = _bdim_at_front(target, target_dim, axis_size)
1061
1047
 
1062
- out = smooth_l1_loss_grad(x, target, dy)
1048
+ out = prim(x, target, dy, beta, reduction)
1063
1049
  return out, 0
1064
1050
 
1065
1051
  return vmap_rule
@@ -21,6 +21,11 @@ op_args_default_value = {
21
21
  "AdamW": {"amsgrad": False, "maximize": False},
22
22
  "AddExt": {"alpha": 1},
23
23
  "AddLayerNormV2": {"epsilon": 1e-5, "additionalOut": False},
24
+ "AddRmsNorm": {"epsilon": 1e-6},
25
+ "Addbmm": {"beta": 1, "alpha": 1},
26
+ "Addmm": {"beta": 1, "alpha": 1},
27
+ "Addmv": {"beta": 1, "alpha": 1},
28
+ "AllGatherMatmul": {"bias": None, "gather_index": 0, "gather_output": True, "comm_turn": 0, "trans_input": False, "trans_x2": False},
24
29
  "ApplyAdamW": {"max_grad_norm": None, "amsgrad": False, "maximize": False},
25
30
  "ApplyCamePart2": {"sum_r": None, "global_shape": None},
26
31
  "ApplyCamePart3": {"global_shape": None, "use_first_moment": False},
@@ -33,13 +38,18 @@ op_args_default_value = {
33
38
  "ArgMinExt": {"dim": None, "keepdim": False},
34
39
  "Argmin": {"axis": -1, "output_type": mstype.int32},
35
40
  "ArgMinWithValue": {"axis": 0, "keep_dims": False},
41
+ "ArgSort": {"dim": -1, "descending": False},
42
+ "AsStrided": {"storage_offset": 0},
43
+ "AvgPool1D": {"stride": None, "padding": 0, "ceil_mode": False, "count_include_pad": True},
36
44
  "AvgPool2DGrad": {"padding": 0, "ceil_mode": False, "count_include_pad": True, "divisor_override": None},
37
45
  "AvgPool2D": {"padding": 0, "ceil_mode": False, "count_include_pad": True, "divisor_override": None},
38
46
  "AvgPoolGrad": {"kernel_size": 1, "strides": 1, "pad_mode": 'VALID', "data_format": 'NCHW'},
39
47
  "AvgPool": {"kernel_size": 1, "strides": 1, "pad_mode": 'VALID', "data_format": 'NCHW'},
40
48
  "BatchMatMul": {"transpose_a": False, "transpose_b": False},
49
+ "BatchNormElemt": {"weight": None, "bias": None, "mean": None, "invstd": None, "eps": 1e-5},
41
50
  "BatchNormExt": {"running_mean": None, "runnning_var": None, "training": False, "momentum": 0.1, "epsilon": 1e-5},
42
- "BatchNormGradExt": {"running_mean": None, "running_var": None, "saved_mean": None, "saved_rstd": None, "training": False, "eps": 1e-5},
51
+ "BatchNormGatherStatsWithCounts": {"running_mean": None, "running_var": None, "momentum": 1e-1, "eps": 1e-5, "counts": None},
52
+ "BatchNormGradExt": {"running_mean": None, "running_var": None, "saved_mean": None, "saved_rstd": None, "training": False, "eps": 1e-5, "output_mask": (1, 1, 1)},
43
53
  "BatchNormGradGrad": {"is_training": False, "epsilon": 1e-5, "data_format": 'NCHW'},
44
54
  "BatchNormGrad": {"is_training": False, "epsilon": 1e-5, "data_format": 'NCHW'},
45
55
  "BatchNormGradWithActivation": {"is_training": False, "epsilon": 1e-5, "data_format": 'NCHW'},
@@ -52,6 +62,9 @@ op_args_default_value = {
52
62
  "BinaryCrossEntropy": {"weight": None, "reduction": 'mean'},
53
63
  "BinaryCrossEntropyWithLogitsBackward": {"weight": None, "posWeight": None, "reduction": 'mean'},
54
64
  "BCEWithLogitsLoss": {"weight": None, "posWeight": None, "reduction": 'mean'},
65
+ "BincountExt": {"weights": None, "minlength": 0},
66
+ "CdistGrad": {"p": 2.0},
67
+ "Cdist": {"p": 2.0},
55
68
  "CeLU": {"alpha": 1.0},
56
69
  "CholeskyInverse": {"upper": False},
57
70
  "Cholesky": {"upper": False},
@@ -62,8 +75,15 @@ op_args_default_value = {
62
75
  "Col2ImGrad": {"dilation": 1, "padding": 0, "stride": 1},
63
76
  "Concat": {"axis": 0},
64
77
  "ConstantPadND": {"value": 0.0},
65
- "ConvolutionGrad": {"bias": None, "stride": 1, "padding": 0, "dilation": 1, "transposed": False, "output_padding": 0, "groups": 1, "output_mask": ()},
78
+ "Conv2DExt": {"bias": None, "stride": 1, "padding": 0, "dilation": 1, "groups": 1},
79
+ "Conv2DPadding": {"bias": None, "stride": 1, "padding": 'valid', "dilation": 1, "groups": 1},
80
+ "Conv3DExt": {"bias": None, "stride": 1, "padding": 0, "dilation": 1, "groups": 1},
81
+ "Conv3DPadding": {"bias": None, "stride": 1, "padding": 'valid', "dilation": 1, "groups": 1},
82
+ "ConvTranspose2D": {"bias": None, "stride": 1, "padding": 0, "output_padding": 0, "groups": 1, "dilation": 1},
83
+ "ConvolutionGrad": {"bias": None, "stride": 1, "padding": 0, "dilation": (1, 1), "transposed": False, "output_padding": 0, "groups": 1, "output_mask": ()},
66
84
  "Convolution": {"bias": None, "stride": 1, "padding": 0, "dilation": 1, "transposed": False, "output_padding": 0, "groups": 1},
85
+ "ConvolutionStrGrad": {"bias": None, "stride": 1, "padding": 'valid', "dilation": 1, "transposed": False, "output_padding": 0, "groups": 1, "output_mask": ()},
86
+ "ConvolutionStr": {"bias": None, "stride": 1, "padding": 'valid', "dilation": 1, "transposed": False, "output_padding": 0, "groups": 1},
67
87
  "Correlate": {"mode": 'valid'},
68
88
  "CountNonZero": {"dim": None},
69
89
  "Cross": {"dim": -65530},
@@ -75,6 +95,7 @@ op_args_default_value = {
75
95
  "Dense": {"bias": None},
76
96
  "Diagonal": {"offset": 0, "dim1": 0, "dim2": 1},
77
97
  "DivMod": {"rounding_mode": None},
98
+ "DivMods": {"rounding_mode": None},
78
99
  "Dropout": {"keep_prob": 0.5, "Seed0": 0, "Seed1": 0},
79
100
  "Eig": {"compute_v": False},
80
101
  "EluExt": {"alpha": 1.0},
@@ -92,6 +113,8 @@ op_args_default_value = {
92
113
  "EmbeddingFeatureMappingImport": {"only_offset_flag": True, "num": 1},
93
114
  "Embedding": {"padding_idx": None, "max_norm": None, "norm_type": 2.0, "scale_grad_by_freq": False},
94
115
  "EmbeddingTableEvict": {"steps_to_live": 0},
116
+ "EmptyLike": {"dtype": None, "device": None},
117
+ "Empty": {"dtype": None, "device": None},
95
118
  "ExtractImagePatches": {"padding": 'VALID'},
96
119
  "FFNExt": {"expertTokens": None, "bias1": None, "bias2": None, "scale": None, "offset": None, "deqScale1": None, "deqScale2": None, "antiquant_scale1": None, "antiquant_scale2": None, "antiquant_offset1": None, "antiquant_offset2": None, "activation": 'fastgelu', "inner_precise": 0},
97
120
  "FFT2": {"s": None, "dim": (-2, -1), "norm": None},
@@ -106,14 +129,20 @@ op_args_default_value = {
106
129
  "FlashAttentionScoreGrad": {"pse_shift": None, "drop_mask": None, "padding_mask": None, "atten_mask": None, "softmax_max": None, "softmax_sum": None, "softmax_in": None, "attention_in": None, "prefix": None, "actual_seq_qlen": None, "actual_seq_kvlen": None, "keep_prob": 1.0, "scale_value": 1.0, "pre_tokens": 65536, "next_tokens": 65536, "inner_precise": 1, "input_layout": 'BSH', "sparse_mode": 0},
107
130
  "FlashAttentionScore": {"real_shift": None, "drop_mask": None, "padding_mask": None, "attn_mask": None, "prefix": None, "actual_seq_qlen": None, "actual_seq_kvlen": None, "keep_prob": 1.0, "scale_value": 1.0, "pre_tokens": 2147483647, "next_tokens": 2147483647, "inner_precise": 0, "input_layout": 'BSH', "sparse_mode": 0},
108
131
  "FlattenExt": {"start_dim": 0, "end_dim": -1},
132
+ "FullLike": {"dtype": None},
109
133
  "Gather": {"batch_dims": 0},
110
134
  "GenerateEodMaskV2": {"start": 0, "steps": 1, "error_mode": 'cycle', "flip_mode": 'bitflip', "multiply_factor": 0.0, "bit_pos": 0, "flip_probability": 0.0},
111
- "GridSampler2DGrad": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False},
135
+ "GLU": {"axis": -1},
136
+ "GmmBackward": {"group_list": None},
137
+ "GmmV2Backward": {"group_list": None, "group_list_type": 0},
138
+ "GridSampler2DGrad": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False, "output_mask": (1, 1)},
112
139
  "GridSampler2D": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False},
113
- "GridSampler3DGrad": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False},
140
+ "GridSampler3DGrad": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False, "output_mask": (1, 1)},
114
141
  "GridSampler3D": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False},
115
142
  "GroupNormGrad": {"dx_is_require": True, "dgamma_is_require": True, "dbeta_is_require": True},
116
143
  "GroupNorm": {"weight": None, "bias": None, "eps": 1e-5},
144
+ "HardtanhGrad": {"min_val": -1, "max_val": 1},
145
+ "Hardtanh": {"min_val": -1, "max_val": 1},
117
146
  "HFFT2": {"s": None, "dim": (-2, -1), "norm": None},
118
147
  "HFFT": {"n": None, "dim": -1, "norm": None},
119
148
  "HFFTN": {"s": None, "dim": None, "norm": None},
@@ -132,18 +161,30 @@ op_args_default_value = {
132
161
  "Im2ColExt": {"dilation": 1, "padding": 0, "stride": 1},
133
162
  "IncreFlashAttention": {"attn_mask": None, "actual_seq_lengths": None, "pse_shift": None, "dequant_scale1": None, "quant_scale1": None, "dequant_scale2": None, "quant_scale2": None, "quant_offset2": None, "antiquant_scale": None, "antiquant_offset": None, "block_table": None, "kv_padding_size": None, "num_heads": 1, "input_layout": 'BSH', "scale_value": 1.0, "num_key_value_heads": 0, "block_size": 0, "inner_precise": 1},
134
163
  "IndexAddExt": {"alpha": 1},
164
+ "InnerInplaceIndexPut": {"accumulate": False},
135
165
  "InplaceAddExt": {"alpha": 1},
136
166
  "InplaceAddmm": {"beta": 1, "alpha": 1},
137
167
  "InplaceAddsExt": {"alpha": 1},
168
+ "InplaceClampScalar": {"min": None, "max": None},
169
+ "InplaceClampTensor": {"min": None, "max": None},
170
+ "InplaceDivMod": {"rounding_mode": None},
171
+ "InplaceDivMods": {"rounding_mode": None},
172
+ "InplaceHardtanh": {"min_val": -1, "max_val": 1},
173
+ "InplaceIndexAddExt": {"alpha": 1},
174
+ "InplaceIndexPut": {"accumulate": False},
175
+ "InplaceRandom": {"from_": 0, "to": None, "seed": 0, "offset": 0},
176
+ "InplaceSubExt": {"alpha": 1},
177
+ "InplaceSubScalar": {"alpha": 1},
138
178
  "InsertGemV2InBackward": {"start": 0, "steps": 1, "error_mode": 'cycle', "flip_mode": 'bitflip', "multiply_factor": 0.0, "bit_pos": 0, "flip_probability": 0.0},
139
179
  "IRFFT2": {"s": None, "dim": (-2, -1), "norm": None},
140
180
  "IRFFTDouble": {"dim": -1},
141
181
  "IRFFT": {"n": None, "dim": -1, "norm": None},
142
182
  "IRFFTN": {"s": None, "dim": None, "norm": None},
143
- "IsClose": {"rtol": 1e-05, "atol": 1e-08, "equal_nan": True},
183
+ "IsClose": {"rtol": 1e-05, "atol": 1e-08, "equal_nan": False},
144
184
  "L1LossBackwardExt": {"reduction": 'mean'},
145
185
  "L1LossExt": {"reduction": 'mean'},
146
186
  "LayerNormExt": {"weight": None, "bias": None, "eps": 1e-5},
187
+ "LayerNormGradExt": {"output_mask": (1, 1, 1)},
147
188
  "LayerNormGradGrad": {"begin_norm_axis": 1, "begin_params_axis": 1},
148
189
  "LayerNormGrad": {"begin_norm_axis": 1, "begin_params_axis": 1},
149
190
  "LayerNormGradV3": {"begin_norm_axis": 1, "begin_params_axis": 1},
@@ -152,26 +193,38 @@ op_args_default_value = {
152
193
  "LeakyReLUExt": {"negative_slope": 0.01},
153
194
  "LeakyReLUGradExt": {"negative_slope": 0.01, "is_result": False},
154
195
  "LinSpaceExt": {"dtype": None},
196
+ "LinalgVectorNorm": {"ord": 2, "dim": None, "keepdim": False, "dtype": None},
155
197
  "LogSoftmaxExt": {"dim": None, "dtype": None},
156
198
  "LogSoftmaxGrad": {"axis": -1},
157
199
  "LogSoftmax": {"axis": -1},
158
200
  "LogitGrad": {"eps": -1.0},
159
201
  "Logit": {"eps": -1.0},
160
- "LpNormV2": {"p": 2.0, "dim": None, "keepdim": False, "epsilon": 1e-12},
202
+ "LogSumExp": {"keepdim": False},
203
+ "LpNormV2": {"p": 2, "dim": None, "keepdim": False, "epsilon": 1e-12},
161
204
  "LstsqV2": {"driver": None},
162
205
  "MatMul": {"transpose_a": False, "transpose_b": False},
206
+ "MatmulReduceScatter": {"reduce_op": 'sum', "bias": None, "comm_turn": 0, "trans_input": False, "trans_x2": False},
207
+ "MaxDim": {"keepdim": False},
163
208
  "MaxPoolGradWithIndices": {"strides": None, "pads": 0, "dilation": (1, 1), "ceil_mode": False, "argmax_type": mstype.int64},
164
209
  "MaxPoolGradWithMask": {"strides": None, "pads": 0, "dilation": (1, 1), "ceil_mode": False, "argmax_type": mstype.int64},
165
210
  "MaxPoolWithIndices": {"strides": None, "pads": 0, "dilation": (1, 1), "ceil_mode": False, "argmax_type": mstype.int64},
166
211
  "MaxPoolWithMask": {"strides": None, "pads": 0, "dilation": (1, 1), "ceil_mode": False, "argmax_type": mstype.int64},
212
+ "MaxUnpool2DExt": {"stride": None, "padding": 0, "output_size": None},
167
213
  "MaximumGradGrad": {"grad_x": True, "grad_y": True},
168
214
  "MaximumGrad": {"grad_x": True, "grad_y": True},
169
- "MeanExt": {"axis": None, "keep_dims": False, "dtype": None},
215
+ "MeanExt": {"dim": None, "keepdim": False, "dtype": None},
170
216
  "MedianDim": {"dim": -1, "keepdim": False},
217
+ "Meshgrid": {"indexing": 'xy'},
218
+ "MinDim": {"keepdim": False},
171
219
  "MinimumGrad": {"grad_x": True, "grad_y": True},
172
220
  "MSELossExt": {"reduction": 'mean'},
173
221
  "MSELossGradExt": {"reduction": 'mean'},
174
222
  "NanToNum": {"nan": None, "posinf": None, "neginf": None},
223
+ "Nansum": {"dim": None, "keepdim": False, "dtype": None},
224
+ "NewEmpty": {"dtype": None, "device": None},
225
+ "NewOnes": {"dtype": None},
226
+ "NewZeros": {"dtype": None},
227
+ "NLLLoss2d": {"reduction": 'mean', "ignore_index": -100},
175
228
  "NLLLossGrad": {"reduction": 'mean', "ignore_index": -100},
176
229
  "NLLLoss": {"reduction": 'mean', "ignore_index": -100},
177
230
  "Norm": {"p": 2.0, "dim": None, "keepdim": False, "dtype": None},
@@ -181,7 +234,8 @@ op_args_default_value = {
181
234
  "Ones": {"dtype": None},
182
235
  "PagedAttentionMask": {"antiquant_scale": None, "antiquant_offset": None, "alibi_mask": None, "kv_cache_quant_mode": 'DEFAULT'},
183
236
  "PagedAttention": {"antiquant_scale": None, "antiquant_offset": None, "attn_mask": None, "q_seq_lens": None, "kv_cache_quant_mode": 'DEFAULT'},
184
- "ProdExt": {"axis": None, "keep_dims": False, "dtype": None},
237
+ "ProdExt": {"dim": None, "keepdim": False, "dtype": None},
238
+ "PromptFlashAttention": {"attn_mask": None, "actual_seq_lengths": None, "actual_seq_lengths_kv": None, "pse_shift": None, "deq_scale1": None, "quant_scale1": None, "deq_scale2": None, "quant_scale2": None, "quant_offset2": None, "num_heads": 1, "scale_value": 1.0, "pre_tokens": 2147483647, "next_tokens": 0, "input_layout": 'BSH', "num_key_value_heads": 0, "sparse_mode": 0, "inner_precise": 1},
185
239
  "PromptKVCache": {"align_mode": 'LEFT'},
186
240
  "Qr": {"full_matrices": False},
187
241
  "RandExt": {"dtype": None},
@@ -222,6 +276,7 @@ op_args_default_value = {
222
276
  "Roll": {"axis": None},
223
277
  "RotaryPositionEmbeddingGrad": {"dx": None, "mode": 0},
224
278
  "RotaryPositionEmbedding": {"mode": 0},
279
+ "RotatedIou": {"trans": False, "mode": 0, "is_cross": True, "v_threshold": 0.0, "e_threshold": 0.0},
225
280
  "Round": {"decimals": 0},
226
281
  "ScalarToTensor": {"dtype": None},
227
282
  "Scatter": {"reduce": 'none'},
@@ -229,6 +284,9 @@ op_args_default_value = {
229
284
  "SearchSorted": {"sorter": None, "dtype": mstype.int64, "right": False},
230
285
  "SequenceConcat": {"axis": 0},
231
286
  "SilentCheckV2": {"c_min_steps": 7, "c_thresh_l1": 1000000.0, "c_coeff_l1": 100000.0, "c_thresh_l2": 10000.0, "c_coeff_l2": 5000.0, "npu_asd_detect": 1},
287
+ "SilentCheckV3": {"c_thresh_l1": 1000000.0, "c_thresh_l2": 10000.0, "beta1": 0.0, "npu_asd_detect": 1},
288
+ "SmoothL1LossGrad": {"beta": 1.0, "reduction": 'none'},
289
+ "SmoothL1Loss": {"beta": 1.0, "reduction": 'none'},
232
290
  "SoftmaxBackward": {"dim": -1},
233
291
  "Softmax": {"axis": -1},
234
292
  "SoftplusExt": {"beta": 1, "threshold": 20},
@@ -238,9 +296,12 @@ op_args_default_value = {
238
296
  "SolveTriangular": {"trans": 0, "lower": False, "unit_diagonal": False},
239
297
  "SortExt": {"dim": -1, "descending": False, "stable": False},
240
298
  "Split": {"axis": 0, "output_num": 1},
241
- "SplitTensor": {"axis": 0},
242
- "SplitWithSize": {"axis": 0},
299
+ "SplitTensor": {"dim": 0},
300
+ "SplitWithSize": {"dim": 0},
301
+ "Squeeze": {"axis": ()},
243
302
  "StackExt": {"dim": 0},
303
+ "StdMean": {"dim": None, "correction": 1, "keepdim": False},
304
+ "Std": {"dim": None, "correction": 1, "keepdim": False},
244
305
  "StridedSlice": {"begin_mask": 0, "end_mask": 0, "ellipsis_mask": 0, "new_axis_mask": 0, "shrink_axis_mask": 0},
245
306
  "SubExt": {"alpha": 1},
246
307
  "SumExt": {"dim": None, "keepdim": False, "dtype": None},
@@ -255,7 +316,8 @@ op_args_default_value = {
255
316
  "Triu": {"diagonal": 0},
256
317
  "TupleToTensor": {"dtype": None},
257
318
  "Unique2": {"sorted": True, "return_inverse": False, "return_counts": False},
258
- "UnstackExt": {"axis": 0},
319
+ "UniqueConsecutive": {"return_idx": False, "return_counts": False, "axis": None},
320
+ "UnstackExt": {"dim": 0},
259
321
  "UpsampleBicubic2DGrad": {"output_size": None, "scales": None, "align_corners": False},
260
322
  "UpsampleBicubic2D": {"output_size": None, "scales": None, "align_corners": False},
261
323
  "UpsampleBilinear2DGrad": {"output_size": None, "scales": None, "align_corners": False},
@@ -270,17 +332,59 @@ op_args_default_value = {
270
332
  "UpsampleNearest3D": {"output_size": None, "scales": None},
271
333
  "UpsampleTrilinear3DGrad": {"output_size": None, "scales": None, "align_corners": False},
272
334
  "UpsampleTrilinear3D": {"output_size": None, "scales": None, "align_corners": False},
335
+ "VarMean": {"dim": None, "correction": 1, "keepdim": False},
336
+ "Var": {"dim": None, "correction": 1, "keepdim": False},
273
337
  "ZerosLikeExt": {"dtype": None},
274
338
  "Zeros": {"dtype": None},
339
+ "AddRmsNormDynamicQuant": {"smooth_scale2": None, "epsilon": 1e-5},
275
340
  "AddRmsNormQuantV2": {"epsilon": 1e-5},
276
341
  "DynamicQuantExt": {"smooth_scales": None},
277
342
  "FusedInferAttentionScore": {"pse_shift": None, "attn_mask": None, "actual_seq_lengths": None, "actual_seq_lengths_kv": None, "dequant_scale1": None, "quant_scale1": None, "dequant_scale2": None, "quant_scale2": None, "quant_offset2": None, "antiquant_scale": None, "antiquant_offset": None, "block_table": None, "query_padding_size": None, "kv_padding_size": None, "scale_value": 1.0, "pre_tokens": 2147483647, "next_tokens": 2147483647, "input_layout": 'BSH', "num_key_value_heads": 0, "sparse_mode": 0, "inner_precise": 1, "block_size": 0, "antiquant_mode": 0, "softmax_lse_flag": False},
278
343
  "GroupedMatmul": {"bias": None, "scale": None, "offset": None, "antiquant_scale": None, "antiquant_offset": None, "group_list": None, "split_item": 0, "group_type": -1},
344
+ "GroupedMatmulV2": {"bias": None, "scale": None, "offset": None, "antiquant_scale": None, "antiquant_offset": None, "group_list": None, "split_item": 0, "group_type": -1},
345
+ "GroupedMatmulV4": {"bias": None, "scale": None, "offset": None, "antiquant_scale": None, "antiquant_offset": None, "pre_token_scale": None, "group_list": None, "activation_input": None, "activation_quant_scale": None, "activation_quant_offset": None, "split_item": 0, "group_type": -1, "group_list_type": 0, "act_type": 0},
279
346
  "KVCacheScatterUpdate": {"reduce": 'none'},
347
+ "MatmulAllReduceAddRmsNorm": {"reduce_op": 'sum', "comm_turn": 0, "stream_mode": 1},
280
348
  "MoeFinalizeRouting": {"x2": None, "bias": None, "scales": None, "expanded_row_idx": None, "expanded_expert_idx": None},
349
+ "MoeGatingTopKSoftmax": {"finished": None, "k": 1},
281
350
  "QuantBatchMatmul": {"offset": None, "bias": None, "pertokenScaleOptional": None, "transpose_x1": False, "transpose_x2": False, "dtype": mstype.float16},
282
351
  "QuantV2": {"sqrt_mode": False, "rounding_mode": 'ROUND', "dst_type": mstype.int8},
283
352
  "WeightQuantBatchMatmul": {"antiquant_offset": None, "quant_scale": None, "quant_offset": None, "bias": None, "transpose_x": False, "transpose_weight": False, "antiquant_group_size": 0},
353
+ "DeprecatedAddbmm": {"beta": 1, "alpha": 1},
354
+ "DeprecatedAddmm": {"beta": 1, "alpha": 1},
355
+ "DeprecatedAddmv": {"beta": 1, "alpha": 1},
356
+ "DeprecatedReduceAll": {"dim": None, "keepdim": False},
357
+ "DeprecatedAllclose": {"rtol": 1e-05, "atol": 1e-08, "equal_nan": False},
358
+ "DeprecatedReduceAny": {"axis": None, "keep_dims": False},
359
+ "DeprecatedAny": {"dim": None, "keepdim": False},
360
+ "DeprecatedArgmax": {"axis": -1, "keepdims": False},
361
+ "DeprecatedArgmin": {"axis": None, "keepdims": False},
362
+ "DeprecatedArgsort": {"axis": -1, "descending": False},
363
+ "DeprecatedBincount": {"weights": None, "minlength": 0},
364
+ "DeprecatedChunk": {"axis": 0},
365
+ "DeprecatedCumsum": {"axis": None, "dtype": None},
366
+ "DeprecatedDiv": {"rounding_mode": None},
367
+ "DeprecatedFlatten": {"order": 'C', "start_dim": 0, "end_dim": -1},
368
+ "DeprecatedGather": {"batch_dims": 0},
369
+ "DeprecatedHistc": {"bins": 100, "min": 0, "max": 0},
370
+ "DeprecatedIsclose": {"rtol": 1e-05, "atol": 1e-08, "equal_nan": False},
371
+ "DeprecatedMax": {"axis": None, "keepdims": False, "initial": None, "where": True, "return_indices": False},
372
+ "DeprecatedMean": {"axis": None, "keep_dims": False},
373
+ "DeprecatedMedian": {"axis": -1, "keepdims": False},
374
+ "DeprecatedMin": {"axis": None, "keepdims": False, "initial": None, "where": True, "return_indices": False},
375
+ "DeprecatedNansum": {"axis": None, "keepdims": False, "dtype": None},
376
+ "DeprecatedProd": {"dim": None, "keepdim": False, "dtype": None},
377
+ "DeprecatedRepeatInterleave": {"dim": None},
378
+ "DeprecatedSort": {"axis": -1, "descending": False},
379
+ "DeprecatedSplit": {"axis": 0},
380
+ "DeprecatedStd": {"axis": None, "ddof": 0, "keepdims": False},
381
+ "DeprecatedSum": {"axis": None, "dtype": None, "keepdims": False, "initial": None},
382
+ "DeprecatedTopk": {"dim": None, "largest": True, "sorted": True},
383
+ "DeprecatedTranspose": {"axes": None},
384
+ "DeprecatedTril": {"diagonal": 0},
385
+ "DeprecatedUnstack": {"dim": 0},
386
+ "DeprecatedUnique": {"sorted": True, "return_inverse": False, "return_counts": False, "dim": None},
387
+ "DeprecatedVar": {"axis": None, "ddof": 0, "keepdims": False},
284
388
  }
285
389
 
286
390
  op_labels = {
@@ -289,8 +393,12 @@ op_labels = {
289
393
  "ApplyAdamW": {"side_effect_mem": True},
290
394
  "AssignAdd": {"side_effect_mem": True},
291
395
  "Assign": {"side_effect_mem": True},
292
- "CopyExt": {"side_effect_mem": True},
396
+ "AssignSub": {"side_effect_mem": True},
397
+ "BatchNormElemt": {"side_effect_mem": True},
398
+ "BatchNormGatherStatsWithCounts": {"side_effect_mem": True},
293
399
  "DecoderKVCache": {"side_effect_mem": True},
400
+ "DistCommAllReduce": {"side_effect_mem": True},
401
+ "DistCommReduce": {"side_effect_mem": True},
294
402
  "DropoutExt": {"side_effect_hidden": True},
295
403
  "DropoutGenMaskExt": {"side_effect_hidden": True},
296
404
  "Dropout": {"side_effect_hidden": True},
@@ -303,13 +411,42 @@ op_labels = {
303
411
  "Embedding": {"side_effect_mem": True},
304
412
  "EmbeddingTableEvict": {"_process_node_engine_id": 'PS'},
305
413
  "Generator": {"side_effect_mem": True},
414
+ "InnerInplaceIndexPut": {"side_effect_mem": True},
306
415
  "InplaceAddExt": {"side_effect_mem": True},
307
416
  "InplaceAddmm": {"side_effect_mem": True},
308
417
  "InplaceAddsExt": {"side_effect_mem": True},
418
+ "InplaceCopy": {"side_effect_mem": True},
419
+ "InplaceDiv": {"side_effect_mem": True},
420
+ "InplaceDivMod": {"side_effect_mem": True},
421
+ "InplaceDivMods": {"side_effect_mem": True},
422
+ "InplaceDivs": {"side_effect_mem": True},
423
+ "InplaceExp": {"side_effect_mem": True},
424
+ "InplaceFillScalar": {"side_effect_mem": True},
425
+ "InplaceFillTensor": {"side_effect_mem": True},
426
+ "InplaceFloor": {"side_effect_mem": True},
427
+ "InplaceHardtanh": {"side_effect_mem": True},
428
+ "InplaceIndexAddExt": {"side_effect_mem": True},
429
+ "InplaceIndexPut": {"side_effect_mem": True},
430
+ "InplaceMaskedFillScalar": {"side_effect_mem": True},
431
+ "InplaceMaskedFillTensor": {"side_effect_mem": True},
432
+ "InplaceMul": {"side_effect_mem": True},
433
+ "InplaceMuls": {"side_effect_mem": True},
434
+ "InplaceNormal": {"side_effect_mem": True},
435
+ "InplaceRandom": {"side_effect_mem": True},
436
+ "InplaceReLU": {"side_effect_mem": True},
437
+ "InplaceScatterAdd": {"side_effect_mem": True},
438
+ "InplaceScatterSrc": {"side_effect_mem": True},
439
+ "InplaceScatterSrcReduce": {"side_effect_mem": True},
440
+ "InplaceScatterValue": {"side_effect_mem": True},
441
+ "InplaceScatterValueReduce": {"side_effect_mem": True},
442
+ "InplaceSubExt": {"side_effect_mem": True},
443
+ "InplaceSubScalar": {"side_effect_mem": True},
444
+ "InplaceTanh": {"side_effect_mem": True},
309
445
  "Log": {"cust_aicpu": 'Log', "base": -1.0, "scale": 1.0, "shift": 0.0},
310
446
  "PromptKVCache": {"side_effect_mem": True},
311
447
  "ReshapeAndCache": {"side_effect_mem": True},
312
448
  "ResizeD": {"mode": 'linear'},
313
449
  "SilentCheckV2": {"side_effect_mem": True},
450
+ "SilentCheckV3": {"side_effect_mem": True},
314
451
  "KVCacheScatterUpdate": {"side_effect_mem": True},
315
452
  }
@@ -116,67 +116,6 @@ def to_2d_paddings(op_name, arg_name, pad):
116
116
  raise ValueError(arg_invalid_info(op_name, arg_name, pad))
117
117
 
118
118
 
119
- def to_paddings(op_name, arg_name, pad):
120
- """
121
- convert paddings: int -> tuple[int*4].
122
- """
123
- if isinstance(pad, int):
124
- return (pad,) * 4
125
- if isinstance(pad, (tuple, list)):
126
- return pad
127
- raise ValueError(arg_invalid_info(op_name, arg_name, pad))
128
-
129
-
130
- def to_3d_kernel_size(op_name, arg_name, kernel_size):
131
- """
132
- convert 3d kernel_size: int/tuple[int*6] -> tuple[int*3].
133
- """
134
- if isinstance(kernel_size, int):
135
- return (kernel_size, kernel_size, kernel_size)
136
- if isinstance(kernel_size, (tuple, list)):
137
- if len(kernel_size) == 5:
138
- return (kernel_size[2], kernel_size[3], kernel_size[4])
139
- return kernel_size
140
- raise ValueError(arg_invalid_info(op_name, arg_name, kernel_size))
141
-
142
-
143
- def to_3d_strides(op_name, arg_name, stride):
144
- """
145
- convert 3d stride: int/tuple[int*6] -> tuple[int*3].
146
- """
147
- if isinstance(stride, int):
148
- return (stride, stride, stride)
149
- if isinstance(stride, (tuple, list)):
150
- if len(stride) == 5:
151
- return (stride[2], stride[3], stride[4])
152
- return stride
153
- raise ValueError(arg_invalid_info(op_name, arg_name, stride))
154
-
155
-
156
- def to_3d_dilations(op_name, arg_name, dilation):
157
- """
158
- convert 3d dilation: int/tuple[int*6] -> tuple[int*3].
159
- """
160
- if isinstance(dilation, int):
161
- return (dilation, dilation, dilation)
162
- if isinstance(dilation, (tuple, list)):
163
- if len(dilation) == 5:
164
- return (dilation[2], dilation[3], dilation[4])
165
- return dilation
166
- raise ValueError(arg_invalid_info(op_name, arg_name, dilation))
167
-
168
-
169
- def to_3d_paddings(op_name, arg_name, pad):
170
- """
171
- convert 3d paddings: int -> tuple[int*6].
172
- """
173
- if isinstance(pad, int):
174
- return (pad,) * 6
175
- if isinstance(pad, (tuple, list)):
176
- return pad
177
- raise ValueError(arg_invalid_info(op_name, arg_name, pad))
178
-
179
-
180
119
  def generator_handler(op_name, arg_name, inputs):
181
120
  """
182
121
  convert constant value in tuple to tensor