mindspore 2.6.0rc1__cp311-cp311-win_amd64.whl → 2.7.0__cp311-cp311-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (458)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
  3. mindspore/Newtonsoft.Json.dll +0 -0
  4. mindspore/__init__.py +2 -2
  5. mindspore/_c_dataengine.cp311-win_amd64.pyd +0 -0
  6. mindspore/_c_expression.cp311-win_amd64.pyd +0 -0
  7. mindspore/_c_mindrecord.cp311-win_amd64.pyd +0 -0
  8. mindspore/_checkparam.py +42 -11
  9. mindspore/_extends/builtin_operations.py +3 -3
  10. mindspore/{_deprecated → _extends/optimize}/__init__.py +9 -3
  11. mindspore/_extends/optimize/cell_utils.py +96 -0
  12. mindspore/_extends/parallel_compile/akg_compiler/custom.py +1109 -0
  13. mindspore/_extends/parallel_compile/akg_compiler/gen_custom_op_files.py +1 -1
  14. mindspore/_extends/parse/__init__.py +3 -3
  15. mindspore/_extends/parse/compile_config.py +44 -22
  16. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +1 -2
  17. mindspore/_extends/parse/parser.py +65 -84
  18. mindspore/_extends/parse/resources.py +39 -0
  19. mindspore/_extends/parse/standard_method.py +58 -14
  20. mindspore/_extends/parse/trope.py +8 -1
  21. mindspore/_extends/pijit/__init__.py +1 -2
  22. mindspore/_extends/pijit/pijit_func_white_list.py +2 -5
  23. mindspore/amp.py +4 -22
  24. mindspore/atlprov.dll +0 -0
  25. mindspore/avcodec-59.dll +0 -0
  26. mindspore/avdevice-59.dll +0 -0
  27. mindspore/avfilter-8.dll +0 -0
  28. mindspore/avformat-59.dll +0 -0
  29. mindspore/avutil-57.dll +0 -0
  30. mindspore/boost/adasum.py +1 -1
  31. mindspore/boost/boost_cell_wrapper.py +4 -4
  32. mindspore/c1.dll +0 -0
  33. mindspore/c1xx.dll +0 -0
  34. mindspore/c2.dll +0 -0
  35. mindspore/common/__init__.py +43 -12
  36. mindspore/common/_grad_function.py +2 -1
  37. mindspore/common/_pijit_context.py +28 -7
  38. mindspore/common/_stub_tensor.py +1 -209
  39. mindspore/common/_tensor_cpp_method.py +1 -1
  40. mindspore/common/_tensor_docs.py +178 -53
  41. mindspore/common/_utils.py +9 -1
  42. mindspore/common/api.py +377 -203
  43. mindspore/common/dtype.py +108 -57
  44. mindspore/common/dump.py +11 -16
  45. mindspore/common/dynamic_shape/__init__.py +0 -0
  46. mindspore/common/{auto_dynamic_shape.py → dynamic_shape/auto_dynamic_shape.py} +17 -23
  47. mindspore/common/dynamic_shape/enable_dynamic.py +197 -0
  48. mindspore/common/file_system.py +59 -9
  49. mindspore/common/generator.py +5 -3
  50. mindspore/common/hook_handle.py +33 -5
  51. mindspore/common/jit_config.py +1 -1
  52. mindspore/common/jit_trace.py +84 -105
  53. mindspore/common/np_dtype.py +3 -3
  54. mindspore/common/parameter.py +27 -29
  55. mindspore/common/recompute.py +5 -7
  56. mindspore/common/sparse_tensor.py +0 -3
  57. mindspore/common/symbol.py +0 -1
  58. mindspore/common/tensor.py +117 -131
  59. mindspore/communication/_comm_helper.py +46 -4
  60. mindspore/communication/management.py +79 -7
  61. mindspore/context.py +67 -55
  62. mindspore/dataset/__init__.py +1 -1
  63. mindspore/dataset/audio/transforms.py +1 -1
  64. mindspore/dataset/core/config.py +38 -4
  65. mindspore/dataset/engine/datasets.py +350 -322
  66. mindspore/dataset/engine/datasets_user_defined.py +70 -24
  67. mindspore/dataset/engine/iterators.py +2 -2
  68. mindspore/dataset/engine/obs/config_loader.py +2 -2
  69. mindspore/dataset/engine/obs/obs_mindrecord_dataset.py +8 -0
  70. mindspore/dataset/transforms/c_transforms.py +2 -2
  71. mindspore/dataset/transforms/py_transforms.py +7 -3
  72. mindspore/dataset/transforms/transforms.py +10 -6
  73. mindspore/dataset/vision/__init__.py +1 -1
  74. mindspore/dataset/vision/py_transforms.py +8 -8
  75. mindspore/dataset/vision/transforms.py +17 -5
  76. mindspore/dataset/vision/utils.py +632 -21
  77. mindspore/dataset/vision/validators.py +1 -0
  78. mindspore/device_context/ascend/device.py +1 -1
  79. mindspore/device_context/ascend/op_tuning.py +35 -1
  80. mindspore/device_context/gpu/__init__.py +2 -2
  81. mindspore/device_context/gpu/device.py +1 -1
  82. mindspore/device_context/gpu/op_precision.py +4 -2
  83. mindspore/device_context/gpu/op_tuning.py +6 -3
  84. mindspore/device_manager.py +16 -9
  85. mindspore/dnnl.dll +0 -0
  86. mindspore/dpcmi.dll +0 -0
  87. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +3 -4
  88. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  89. mindspore/experimental/optim/adadelta.py +13 -20
  90. mindspore/experimental/optim/adagrad.py +15 -22
  91. mindspore/experimental/optim/adam.py +17 -24
  92. mindspore/experimental/optim/adamax.py +14 -22
  93. mindspore/experimental/optim/adamw.py +28 -34
  94. mindspore/experimental/optim/asgd.py +15 -25
  95. mindspore/experimental/optim/lr_scheduler.py +27 -45
  96. mindspore/experimental/optim/nadam.py +14 -24
  97. mindspore/experimental/optim/optimizer.py +13 -23
  98. mindspore/experimental/optim/radam.py +18 -24
  99. mindspore/experimental/optim/rmsprop.py +14 -25
  100. mindspore/experimental/optim/rprop.py +15 -26
  101. mindspore/experimental/optim/sgd.py +9 -19
  102. mindspore/hal/__init__.py +4 -4
  103. mindspore/hal/contiguous_tensors_handle.py +2 -2
  104. mindspore/hal/memory.py +27 -7
  105. mindspore/include/api/cell.h +65 -5
  106. mindspore/include/api/cfg.h +24 -7
  107. mindspore/include/api/context.h +1 -0
  108. mindspore/include/api/delegate.h +10 -2
  109. mindspore/include/api/dual_abi_helper.h +100 -19
  110. mindspore/include/api/graph.h +14 -1
  111. mindspore/include/api/kernel.h +16 -3
  112. mindspore/include/api/kernel_api.h +9 -1
  113. mindspore/include/api/metrics/accuracy.h +9 -0
  114. mindspore/include/api/model.h +8 -1
  115. mindspore/include/api/model_group.h +4 -0
  116. mindspore/include/api/model_parallel_runner.h +2 -0
  117. mindspore/include/api/status.h +48 -10
  118. mindspore/include/api/types.h +8 -3
  119. mindspore/include/c_api/model_c.h +0 -58
  120. mindspore/include/c_api/tensor_c.h +0 -26
  121. mindspore/include/dataset/constants.h +9 -0
  122. mindspore/include/dataset/vision_ascend.h +1 -1
  123. mindspore/jpeg62.dll +0 -0
  124. mindspore/mindrecord/tools/cifar10.py +61 -11
  125. mindspore/mindrecord/tools/cifar10_to_mr.py +5 -0
  126. mindspore/mindspore_backend_common.dll +0 -0
  127. mindspore/mindspore_backend_manager.dll +0 -0
  128. mindspore/mindspore_common.dll +0 -0
  129. mindspore/mindspore_core.dll +0 -0
  130. mindspore/mindspore_cpu_res_manager.dll +0 -0
  131. mindspore/mindspore_dump.dll +0 -0
  132. mindspore/mindspore_frontend.dll +0 -0
  133. mindspore/mindspore_glog.dll +0 -0
  134. mindspore/mindspore_memory_pool.dll +0 -0
  135. mindspore/mindspore_ms_backend.dll +0 -0
  136. mindspore/mindspore_ops.dll +0 -0
  137. mindspore/mindspore_ops_host.dll +0 -0
  138. mindspore/mindspore_ops_kernel_common.dll +0 -0
  139. mindspore/mindspore_profiler.dll +0 -0
  140. mindspore/mindspore_pyboost.dll +0 -0
  141. mindspore/mindspore_pynative.dll +0 -0
  142. mindspore/mindspore_res_manager.dll +0 -0
  143. mindspore/mindspore_runtime_pipeline.dll +0 -0
  144. mindspore/mint/__init__.py +6 -46
  145. mindspore/mint/distributed/__init__.py +5 -0
  146. mindspore/mint/distributed/distributed.py +429 -23
  147. mindspore/mint/nn/__init__.py +1 -1
  148. mindspore/mint/nn/functional.py +53 -6
  149. mindspore/mint/nn/layer/_functions.py +163 -294
  150. mindspore/mint/nn/layer/activation.py +8 -6
  151. mindspore/mint/nn/layer/conv.py +140 -104
  152. mindspore/mint/nn/layer/normalization.py +11 -25
  153. mindspore/mint/optim/adam.py +19 -18
  154. mindspore/mint/optim/adamw.py +14 -8
  155. mindspore/mint/optim/sgd.py +5 -5
  156. mindspore/msobj140.dll +0 -0
  157. mindspore/mspdb140.dll +0 -0
  158. mindspore/mspdbcore.dll +0 -0
  159. mindspore/mspdbst.dll +0 -0
  160. mindspore/mspft140.dll +0 -0
  161. mindspore/msvcdis140.dll +0 -0
  162. mindspore/msvcp140_1.dll +0 -0
  163. mindspore/msvcp140_2.dll +0 -0
  164. mindspore/msvcp140_atomic_wait.dll +0 -0
  165. mindspore/msvcp140_codecvt_ids.dll +0 -0
  166. mindspore/nn/cell.py +491 -623
  167. mindspore/nn/grad/cell_grad.py +11 -12
  168. mindspore/nn/layer/activation.py +36 -36
  169. mindspore/nn/layer/basic.py +74 -77
  170. mindspore/nn/layer/channel_shuffle.py +4 -4
  171. mindspore/nn/layer/combined.py +4 -2
  172. mindspore/nn/layer/conv.py +117 -110
  173. mindspore/nn/layer/dense.py +9 -7
  174. mindspore/nn/layer/embedding.py +50 -52
  175. mindspore/nn/layer/image.py +38 -40
  176. mindspore/nn/layer/math.py +111 -112
  177. mindspore/nn/layer/normalization.py +56 -44
  178. mindspore/nn/layer/pooling.py +58 -63
  179. mindspore/nn/layer/rnn_cells.py +33 -33
  180. mindspore/nn/layer/rnns.py +56 -56
  181. mindspore/nn/layer/thor_layer.py +74 -73
  182. mindspore/nn/layer/transformer.py +11 -1
  183. mindspore/nn/learning_rate_schedule.py +20 -20
  184. mindspore/nn/loss/loss.py +79 -81
  185. mindspore/nn/optim/adam.py +4 -6
  186. mindspore/nn/optim/adasum.py +2 -2
  187. mindspore/nn/optim/asgd.py +2 -0
  188. mindspore/nn/optim/lamb.py +1 -3
  189. mindspore/nn/optim/optimizer.py +1 -1
  190. mindspore/nn/optim/tft_wrapper.py +2 -3
  191. mindspore/nn/optim/thor.py +2 -2
  192. mindspore/nn/probability/distribution/_utils/utils.py +2 -2
  193. mindspore/nn/probability/distribution/exponential.py +2 -1
  194. mindspore/nn/probability/distribution/poisson.py +2 -1
  195. mindspore/nn/sparse/sparse.py +3 -3
  196. mindspore/nn/wrap/cell_wrapper.py +73 -42
  197. mindspore/nn/wrap/grad_reducer.py +37 -52
  198. mindspore/nn/wrap/loss_scale.py +72 -74
  199. mindspore/numpy/array_creations.py +7 -7
  200. mindspore/numpy/fft.py +1 -1
  201. mindspore/numpy/math_ops.py +5 -5
  202. mindspore/numpy/utils_const.py +1 -1
  203. mindspore/opencv_core452.dll +0 -0
  204. mindspore/opencv_imgcodecs452.dll +0 -0
  205. mindspore/opencv_imgproc452.dll +0 -0
  206. mindspore/ops/_grad_experimental/grad_comm_ops.py +51 -13
  207. mindspore/ops/_grad_experimental/grad_debug_ops.py +14 -0
  208. mindspore/ops/_grad_experimental/grad_inner_ops.py +0 -9
  209. mindspore/ops/_op_impl/cpu/__init__.py +1 -0
  210. mindspore/{experimental/es/__init__.py → ops/_op_impl/cpu/joinedstr_op.py} +12 -6
  211. mindspore/ops/_vmap/vmap_array_ops.py +31 -13
  212. mindspore/ops/_vmap/vmap_nn_ops.py +8 -16
  213. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +54 -13
  214. mindspore/ops/auto_generate/gen_extend_func.py +27 -145
  215. mindspore/ops/auto_generate/gen_ops_def.py +1027 -347
  216. mindspore/ops/auto_generate/gen_ops_prim.py +2341 -1117
  217. mindspore/ops/auto_generate/pyboost_inner_prim.py +31 -1
  218. mindspore/ops/composite/__init__.py +10 -0
  219. mindspore/ops/composite/base.py +9 -5
  220. mindspore/ops/composite/multitype_ops/__init__.py +12 -1
  221. mindspore/ops/composite/multitype_ops/_compile_utils.py +133 -109
  222. mindspore/ops/composite/multitype_ops/_constexpr_utils.py +1 -1
  223. mindspore/ops/composite/multitype_ops/add_impl.py +70 -2
  224. mindspore/ops/composite/multitype_ops/div_impl.py +49 -0
  225. mindspore/ops/composite/multitype_ops/floordiv_impl.py +29 -0
  226. mindspore/ops/composite/multitype_ops/getitem_impl.py +11 -0
  227. mindspore/ops/composite/multitype_ops/mod_impl.py +5 -3
  228. mindspore/ops/composite/multitype_ops/mul_impl.py +49 -0
  229. mindspore/ops/composite/multitype_ops/setitem_impl.py +57 -0
  230. mindspore/ops/composite/multitype_ops/sub_impl.py +34 -0
  231. mindspore/ops/composite/multitype_ops/zeros_like_impl.py +14 -0
  232. mindspore/ops/function/__init__.py +4 -1
  233. mindspore/ops/function/_add_attr_func.py +11 -6
  234. mindspore/ops/function/array_func.py +19 -102
  235. mindspore/ops/function/debug_func.py +8 -5
  236. mindspore/ops/function/grad/grad_func.py +5 -13
  237. mindspore/ops/function/math_func.py +77 -572
  238. mindspore/ops/function/nn_func.py +46 -94
  239. mindspore/ops/function/other_func.py +4 -1
  240. mindspore/ops/function/random_func.py +44 -5
  241. mindspore/ops/function/vmap_func.py +2 -1
  242. mindspore/ops/functional.py +4 -4
  243. mindspore/ops/functional_overload.py +594 -18
  244. mindspore/ops/op_info_register.py +21 -0
  245. mindspore/ops/operations/__init__.py +16 -11
  246. mindspore/ops/operations/_custom_ops_utils.py +689 -34
  247. mindspore/ops/operations/_inner_ops.py +14 -18
  248. mindspore/ops/operations/_sequence_ops.py +1 -1
  249. mindspore/ops/operations/array_ops.py +5 -51
  250. mindspore/ops/operations/comm_ops.py +186 -41
  251. mindspore/ops/operations/custom_ops.py +303 -177
  252. mindspore/ops/operations/debug_ops.py +59 -4
  253. mindspore/ops/operations/image_ops.py +13 -13
  254. mindspore/ops/operations/manually_defined/ops_def.py +27 -28
  255. mindspore/ops/operations/math_ops.py +8 -9
  256. mindspore/ops/operations/nn_ops.py +8 -40
  257. mindspore/ops/primitive.py +9 -20
  258. mindspore/ops/tensor_method.py +63 -15
  259. mindspore/ops_generate/api/cpp_create_prim_instance_helper_generator.py +1 -1
  260. mindspore/ops_generate/api/functional_map_cpp_generator.py +10 -9
  261. mindspore/ops_generate/api/functions_cc_generator.py +58 -10
  262. mindspore/ops_generate/api/tensor_func_reg_cpp_generator.py +1 -1
  263. mindspore/ops_generate/common/base_generator.py +14 -0
  264. mindspore/ops_generate/common/gen_constants.py +8 -3
  265. mindspore/ops_generate/common/gen_utils.py +0 -19
  266. mindspore/ops_generate/common/op_proto.py +11 -4
  267. mindspore/ops_generate/common/template.py +88 -11
  268. mindspore/ops_generate/gen_ops.py +1 -1
  269. mindspore/ops_generate/op_def/lite_ops_cpp_generator.py +4 -4
  270. mindspore/ops_generate/op_def/ops_def_cc_generator.py +0 -3
  271. mindspore/ops_generate/op_def/ops_name_h_generator.py +0 -3
  272. mindspore/ops_generate/op_def/ops_primitive_h_generator.py +0 -4
  273. mindspore/ops_generate/op_def_py/op_prim_py_generator.py +5 -2
  274. mindspore/ops_generate/pyboost/auto_grad_impl_cc_generator.py +49 -8
  275. mindspore/ops_generate/pyboost/auto_grad_reg_cc_generator.py +2 -2
  276. mindspore/ops_generate/pyboost/gen_pyboost_func.py +31 -16
  277. mindspore/ops_generate/pyboost/op_template_parser.py +98 -72
  278. mindspore/ops_generate/pyboost/pyboost_functions_cpp_generator.py +70 -273
  279. mindspore/ops_generate/pyboost/pyboost_functions_h_generator.py +14 -6
  280. mindspore/ops_generate/pyboost/pyboost_functions_impl_cpp_generator.py +316 -0
  281. mindspore/ops_generate/pyboost/pyboost_functions_py_generator.py +1 -1
  282. mindspore/ops_generate/pyboost/pyboost_grad_function_cpp_generator.py +5 -3
  283. mindspore/ops_generate/pyboost/pyboost_inner_prim_generator.py +1 -1
  284. mindspore/ops_generate/pyboost/pyboost_internal_functions_cpp_generator.py +76 -0
  285. mindspore/ops_generate/pyboost/pyboost_internal_functions_h_generator.py +76 -0
  286. mindspore/ops_generate/pyboost/pyboost_internal_kernel_info_adapter_generator.py +125 -0
  287. mindspore/ops_generate/pyboost/pyboost_native_grad_functions_generator.py +4 -3
  288. mindspore/ops_generate/pyboost/pyboost_op_cpp_code_generator.py +348 -61
  289. mindspore/ops_generate/pyboost/pyboost_overload_functions_cpp_generator.py +1 -1
  290. mindspore/ops_generate/pyboost/pyboost_utils.py +118 -9
  291. mindspore/ops_generate/tensor_py_cc_generator.py +1 -24
  292. mindspore/parallel/_auto_parallel_context.py +16 -23
  293. mindspore/parallel/_cell_wrapper.py +113 -45
  294. mindspore/parallel/_parallel_serialization.py +4 -3
  295. mindspore/parallel/_ps_context.py +4 -6
  296. mindspore/parallel/_tensor.py +167 -12
  297. mindspore/parallel/_transformer/moe.py +1 -1
  298. mindspore/parallel/_transformer/transformer.py +17 -12
  299. mindspore/parallel/_utils.py +5 -11
  300. mindspore/parallel/auto_parallel.py +35 -14
  301. mindspore/parallel/checkpoint_convert.py +3 -3
  302. mindspore/parallel/checkpoint_transform.py +13 -7
  303. mindspore/parallel/cluster/process_entity/_api.py +88 -49
  304. mindspore/parallel/cluster/process_entity/_utils.py +95 -7
  305. mindspore/parallel/cluster/run.py +48 -7
  306. mindspore/parallel/function/__init__.py +8 -1
  307. mindspore/parallel/function/reshard_func.py +12 -12
  308. mindspore/parallel/nn/__init__.py +15 -2
  309. mindspore/parallel/nn/parallel_cell_wrapper.py +50 -14
  310. mindspore/parallel/nn/parallel_grad_reducer.py +7 -14
  311. mindspore/parallel/shard.py +10 -25
  312. mindspore/parallel/transform_safetensors.py +469 -174
  313. mindspore/pgodb140.dll +0 -0
  314. mindspore/pgort140.dll +0 -0
  315. mindspore/profiler/__init__.py +2 -1
  316. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +7 -7
  317. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +3 -0
  318. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +12 -6
  319. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +3 -3
  320. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +3 -3
  321. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +4 -4
  322. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +3 -3
  323. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +4 -1
  324. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +2 -1
  325. mindspore/profiler/analysis/task_manager.py +1 -1
  326. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +5 -1
  327. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +2 -1
  328. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +10 -9
  329. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +43 -23
  330. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +3 -2
  331. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +9 -5
  332. mindspore/profiler/analysis/viewer/ms_operator_details_viewer.py +132 -0
  333. mindspore/profiler/common/constant.py +16 -0
  334. mindspore/profiler/common/msprof_cmd_tool.py +2 -2
  335. mindspore/profiler/common/path_manager.py +9 -0
  336. mindspore/profiler/common/profiler_context.py +50 -29
  337. mindspore/profiler/common/profiler_info.py +0 -16
  338. mindspore/profiler/common/profiler_meta_data.py +1 -0
  339. mindspore/profiler/common/profiler_op_analyse.py +239 -0
  340. mindspore/profiler/common/profiler_output_path.py +23 -8
  341. mindspore/profiler/common/profiler_parameters.py +128 -35
  342. mindspore/profiler/dynamic_profile/__init__.py +0 -0
  343. mindspore/profiler/dynamic_profile/dynamic_monitor_proxy.py +39 -0
  344. mindspore/profiler/dynamic_profile/dynamic_profiler_config_context.py +666 -0
  345. mindspore/profiler/dynamic_profile/dynamic_profiler_utils.py +62 -0
  346. mindspore/profiler/dynamic_profiler.py +374 -338
  347. mindspore/profiler/envprofiler.py +42 -12
  348. mindspore/profiler/experimental_config.py +112 -7
  349. mindspore/profiler/mstx.py +33 -12
  350. mindspore/profiler/platform/__init__.py +2 -3
  351. mindspore/profiler/platform/cpu_profiler.py +10 -4
  352. mindspore/profiler/platform/npu_profiler.py +30 -20
  353. mindspore/profiler/profiler.py +218 -154
  354. mindspore/profiler/profiler_action_controller.py +65 -77
  355. mindspore/profiler/profiler_interface.py +2 -2
  356. mindspore/profiler/schedule.py +10 -4
  357. mindspore/rewrite/common/config.py +1 -0
  358. mindspore/rewrite/common/namer.py +1 -0
  359. mindspore/rewrite/common/namespace.py +1 -0
  360. mindspore/rewrite/node/node.py +31 -11
  361. mindspore/rewrite/parsers/assign_parser.py +1 -1
  362. mindspore/rewrite/symbol_tree/symbol_tree.py +2 -2
  363. mindspore/run_check/_check_version.py +7 -10
  364. mindspore/runtime/__init__.py +8 -6
  365. mindspore/runtime/event.py +10 -4
  366. mindspore/runtime/executor.py +87 -45
  367. mindspore/runtime/memory.py +31 -32
  368. mindspore/runtime/thread_bind_core.py +299 -165
  369. mindspore/safeguard/rewrite_obfuscation.py +12 -13
  370. mindspore/swresample-4.dll +0 -0
  371. mindspore/swscale-6.dll +0 -0
  372. mindspore/tbbmalloc.dll +0 -0
  373. mindspore/tinyxml2.dll +0 -0
  374. mindspore/train/_utils.py +17 -7
  375. mindspore/train/amp.py +43 -23
  376. mindspore/train/callback/__init__.py +5 -5
  377. mindspore/train/callback/_callback.py +2 -1
  378. mindspore/train/callback/_checkpoint.py +4 -14
  379. mindspore/train/callback/_flops_collector.py +11 -7
  380. mindspore/train/callback/_landscape.py +0 -1
  381. mindspore/train/callback/_train_fault_tolerance.py +98 -21
  382. mindspore/train/data_sink.py +15 -6
  383. mindspore/train/dataset_helper.py +14 -5
  384. mindspore/train/model.py +133 -69
  385. mindspore/train/serialization.py +168 -126
  386. mindspore/train/summary/summary_record.py +13 -2
  387. mindspore/train/train_thor/model_thor.py +2 -2
  388. mindspore/turbojpeg.dll +0 -0
  389. mindspore/utils/__init__.py +3 -2
  390. mindspore/utils/dryrun.py +0 -6
  391. mindspore/utils/runtime_execution_order_check.py +163 -77
  392. mindspore/utils/sdc_detect.py +68 -0
  393. mindspore/utils/utils.py +14 -17
  394. mindspore/vcmeta.dll +0 -0
  395. mindspore/vcruntime140.dll +0 -0
  396. mindspore/vcruntime140_1.dll +0 -0
  397. mindspore/version.py +1 -1
  398. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0.dist-info}/METADATA +5 -4
  399. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0.dist-info}/RECORD +403 -442
  400. mindspore/_deprecated/jit.py +0 -198
  401. mindspore/_extends/remote/kernel_build_server_ascend.py +0 -75
  402. mindspore/communication/_hccl_management.py +0 -297
  403. mindspore/experimental/es/embedding_service.py +0 -891
  404. mindspore/experimental/es/embedding_service_layer.py +0 -581
  405. mindspore/profiler/common/validator/__init__.py +0 -14
  406. mindspore/profiler/common/validator/validate_path.py +0 -84
  407. mindspore/profiler/parser/__init__.py +0 -14
  408. mindspore/profiler/parser/aicpu_data_parser.py +0 -272
  409. mindspore/profiler/parser/ascend_analysis/__init__.py +0 -14
  410. mindspore/profiler/parser/ascend_analysis/constant.py +0 -71
  411. mindspore/profiler/parser/ascend_analysis/file_manager.py +0 -180
  412. mindspore/profiler/parser/ascend_analysis/function_event.py +0 -185
  413. mindspore/profiler/parser/ascend_analysis/fwk_cann_parser.py +0 -136
  414. mindspore/profiler/parser/ascend_analysis/fwk_file_parser.py +0 -131
  415. mindspore/profiler/parser/ascend_analysis/msprof_timeline_parser.py +0 -104
  416. mindspore/profiler/parser/ascend_analysis/path_manager.py +0 -313
  417. mindspore/profiler/parser/ascend_analysis/profiler_info_parser.py +0 -123
  418. mindspore/profiler/parser/ascend_analysis/tlv_decoder.py +0 -86
  419. mindspore/profiler/parser/ascend_analysis/trace_event_manager.py +0 -75
  420. mindspore/profiler/parser/ascend_cluster_generator.py +0 -116
  421. mindspore/profiler/parser/ascend_communicate_generator.py +0 -314
  422. mindspore/profiler/parser/ascend_flops_generator.py +0 -116
  423. mindspore/profiler/parser/ascend_fpbp_generator.py +0 -82
  424. mindspore/profiler/parser/ascend_hccl_generator.py +0 -271
  425. mindspore/profiler/parser/ascend_integrate_generator.py +0 -42
  426. mindspore/profiler/parser/ascend_memory_generator.py +0 -185
  427. mindspore/profiler/parser/ascend_msprof_exporter.py +0 -282
  428. mindspore/profiler/parser/ascend_msprof_generator.py +0 -187
  429. mindspore/profiler/parser/ascend_op_generator.py +0 -334
  430. mindspore/profiler/parser/ascend_steptrace_generator.py +0 -94
  431. mindspore/profiler/parser/ascend_timeline_generator.py +0 -545
  432. mindspore/profiler/parser/base_timeline_generator.py +0 -483
  433. mindspore/profiler/parser/container.py +0 -229
  434. mindspore/profiler/parser/cpu_gpu_timeline_generator.py +0 -697
  435. mindspore/profiler/parser/flops_parser.py +0 -531
  436. mindspore/profiler/parser/framework_enum.py +0 -111
  437. mindspore/profiler/parser/framework_parser.py +0 -464
  438. mindspore/profiler/parser/framework_struct.py +0 -61
  439. mindspore/profiler/parser/gpu_analysis/__init__.py +0 -14
  440. mindspore/profiler/parser/gpu_analysis/function_event.py +0 -44
  441. mindspore/profiler/parser/gpu_analysis/fwk_file_parser.py +0 -89
  442. mindspore/profiler/parser/gpu_analysis/profiler_info_parser.py +0 -72
  443. mindspore/profiler/parser/hccl_parser.py +0 -573
  444. mindspore/profiler/parser/hwts_log_parser.py +0 -122
  445. mindspore/profiler/parser/integrator.py +0 -526
  446. mindspore/profiler/parser/memory_usage_parser.py +0 -277
  447. mindspore/profiler/parser/minddata_analyzer.py +0 -800
  448. mindspore/profiler/parser/minddata_parser.py +0 -186
  449. mindspore/profiler/parser/minddata_pipeline_parser.py +0 -299
  450. mindspore/profiler/parser/op_intermediate_parser.py +0 -149
  451. mindspore/profiler/parser/optime_parser.py +0 -250
  452. mindspore/profiler/parser/profiler_info.py +0 -213
  453. mindspore/profiler/parser/step_trace_parser.py +0 -666
  454. mindspore/utils/hooks.py +0 -81
  455. mindspore/common/{_auto_dynamic.py → dynamic_shape/_auto_dynamic.py} +0 -0
  456. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0.dist-info}/WHEEL +0 -0
  457. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0.dist-info}/entry_points.txt +0 -0
  458. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0.dist-info}/top_level.txt +0 -0
@@ -214,6 +214,31 @@ def get_transpose_vmap_rule(prim, axis_size):
214
214
  return vmap_rule
215
215
 
216
216
 
217
+ @vmap_rules_getters.register("TransposeExtView")
218
+ def get_transpose_ext_vmap_rule(prim, axis_size):
219
+ """VmapRule for `TransposeExtView` operation."""
220
+ if isinstance(prim, str):
221
+ prim = Primitive(prim)
222
+
223
+ def vmap_rule(x_bdim, dim1_bdim, dim2_bdim):
224
+ is_all_none, result = vmap_general_preprocess(prim, x_bdim, dim1_bdim, dim2_bdim)
225
+ if is_all_none:
226
+ return result
227
+
228
+ x, dim = x_bdim
229
+ dim1, dim1_dim = dim1_bdim
230
+ dim2, dim2_dim = dim2_bdim
231
+ if dim1_dim is not None or dim2_dim is not None:
232
+ _raise_value_error("The source axis of dim1_dim and dim2_dim in `TransposeExtView` must be None, "
233
+ "but got {} and {}.".format(dim1_dim, dim2_dim))
234
+ batch_dim1 = dim1 if dim1 < dim else dim1 + 1
235
+ batch_dim2 = dim2 if dim2 < dim else dim2 + 1
236
+ out = prim(x, batch_dim1, batch_dim2)
237
+ return out, dim
238
+
239
+ return vmap_rule
240
+
241
+
217
242
  @vmap_rules_getters.register("Tile")
218
243
  def get_tile_vmap_rule(prim, axis_size):
219
244
  """VmapRule for `P.Tile` operation."""
@@ -1502,14 +1527,13 @@ def get_meshgrid_vmap_rule(prim, axis_size):
1502
1527
 
1503
1528
  if not isinstance(inputs_bdim, (tuple)):
1504
1529
  _raise_value_error("The inputs of P.Meshgrid is not tuple.")
1505
- args = inputs_bdim
1506
- if len(args) <= 1:
1530
+ if len(inputs_bdim) <= 1:
1507
1531
  _raise_value_error(
1508
1532
  "The input number of P.Meshgrid must be greater than 1.")
1509
1533
 
1510
1534
  output_shape = []
1511
1535
  ones_shape = []
1512
- for each_arg in args:
1536
+ for each_arg in inputs_bdim:
1513
1537
  x, bdim = each_arg
1514
1538
  if bdim is None:
1515
1539
  _raise_value_error(
@@ -1523,22 +1547,16 @@ def get_meshgrid_vmap_rule(prim, axis_size):
1523
1547
  output_shape.insert(0, axis_size)
1524
1548
  ones_shape.insert(0, axis_size)
1525
1549
 
1526
- indexing, _ = indexing_bdim
1527
-
1528
- if indexing == Indexing.xy.value:
1550
+ if indexing_bdim[0] == Indexing.xy.value:
1529
1551
  output_shape[1], output_shape[2] = output_shape[2], output_shape[1]
1530
- shape = tuple(output_shape)
1531
-
1532
- input_0, _ = args[0]
1533
- dtype = F.dtype(input_0)
1534
- ones_tensor = F.fill(dtype, shape, 1)
1552
+ ones_tensor = F.fill(F.dtype(inputs_bdim[0][0]), tuple(output_shape), 1)
1535
1553
 
1536
1554
  index = 0
1537
1555
  vals_out_tuple = ()
1538
- for each_arg in args:
1556
+ for each_arg in inputs_bdim:
1539
1557
  x, bdim = each_arg
1540
1558
  x = _bdim_at_front(x, bdim, axis_size)
1541
- shape_index = (1 - index) if (index <= 1 and indexing == Indexing.xy.value) else index
1559
+ shape_index = (1 - index) if (index <= 1 and indexing_bdim[0] == Indexing.xy.value) else index
1542
1560
  ones_shape[shape_index + 1] = output_shape[shape_index + 1]
1543
1561
  x = P.Reshape()(x, tuple(ones_shape))
1544
1562
  output = P.Mul()(x, ones_tensor)
@@ -2068,14 +2068,15 @@ def get_sparse_apply_adagrad_vmap_rule(prim, axis_size):
2068
2068
  indices, indices_dim = indices_bdim
2069
2069
  if var_dim is None:
2070
2070
  if any(dim is not None for dim in [accum_dim, grad_dim, indices_dim]):
2071
- ValueError("The source axis of `var` is None, but the source "
2072
- "axis of `accum/grad/indices` is not None. The execution order of "
2073
- "operator `{}` cannot be guaranteed.".format(prim_name))
2071
+ _raise_value_error("The source axis of `var` is None, but the source "
2072
+ "axis of `accum/grad/indices` is not None. The execution "
2073
+ "order of operator `{}` cannot be guaranteed.".format(prim_name))
2074
2074
  var, accum = prim(var, accum, grad, indices, u_monad)
2075
2075
  return (var, None), (accum, None)
2076
2076
  if var_dim != 0 or accum_dim != var_dim:
2077
- ValueError("For `{}`, the source axis of `var` must be equal to `accum`, and not equal to 0, "
2078
- "but got the source axis of `var`: {}, `accum`: {}.".format(prim_name, var_dim, accum_dim))
2077
+ _raise_value_error("For `{}`, the source axis of `var` must be equal to `accum`, "
2078
+ "and not equal to 0, but got the source axis of `var`: {}, "
2079
+ "`accum`: {}.".format(prim_name, var_dim, accum_dim))
2079
2080
 
2080
2081
  grad = _bdim_at_front(grad, grad_dim, axis_size)
2081
2082
  indices = _bdim_at_front(indices, indices_dim, axis_size)
@@ -2094,27 +2095,18 @@ def get_sparse_apply_ftrl_vmap_rule(prim, axis_size):
2094
2095
  else:
2095
2096
  batch_rank = 1
2096
2097
 
2097
- prim_name = prim.name
2098
2098
  batch_prim = _vmap_clone_prim(prim)
2099
2099
  batch_prim.add_prim_attr('batch_rank', batch_rank)
2100
2100
 
2101
2101
  def vmap_rule(var_bdim, accum_bdim, linear_bdim, grad_bdim, indices_bdim, u_monad):
2102
2102
  var, var_dim = var_bdim
2103
- accum, accum_dim = accum_bdim
2104
- linear, linear_dim = linear_bdim
2103
+ accum, _ = accum_bdim
2104
+ linear, _ = linear_bdim
2105
2105
  grad, grad_dim = grad_bdim
2106
2106
  indices, indices_dim = indices_bdim
2107
2107
  if var_dim is None:
2108
- if any(dim is not None for dim in [accum_dim, linear_dim, grad_dim, indices_dim]):
2109
- ValueError("The source axis of `var` is None, but the source "
2110
- "axis of `accum/linear/grad/indices` is not None. The execution order of "
2111
- "operator `{}` cannot be guaranteed.".format(prim_name))
2112
2108
  var, accum, linear = prim(var, accum, linear, grad, indices, u_monad)
2113
2109
  return (var, None), (accum, None), (linear, None)
2114
- if var_dim != 0 or accum_dim != var_dim or linear_dim != var_dim:
2115
- ValueError("For `{}`, the source axis of `var`, `accum` and `linear` must be equal, and "
2116
- "not equal to 0, but got the source axis of `var`: {}, `accum`: {}, "
2117
- "`linear`:{}.".format(prim_name, var_dim, accum_dim, linear_dim))
2118
2110
 
2119
2111
  grad = _bdim_at_front(grad, grad_dim, axis_size)
2120
2112
  indices = _bdim_at_front(indices, indices_dim, axis_size)
@@ -53,9 +53,9 @@ op_args_default_value = {
53
53
  "Baddbmm": {"beta": 1, "alpha": 1},
54
54
  "BatchMatMul": {"transpose_a": False, "transpose_b": False},
55
55
  "BatchNormElemt": {"weight": None, "bias": None, "mean": None, "invstd": None, "eps": 1e-5},
56
- "BatchNormExt": {"running_mean": None, "runnning_var": None, "training": False, "momentum": 0.1, "epsilon": 1e-5},
56
+ "BatchNormExt": {"weight": None, "bias": None, "running_mean": None, "runnning_var": None, "training": False, "momentum": 0.1, "epsilon": 1e-5},
57
57
  "BatchNormGatherStatsWithCounts": {"running_mean": None, "running_var": None, "momentum": 1e-1, "eps": 1e-5, "counts": None},
58
- "BatchNormGradExt": {"running_mean": None, "running_var": None, "saved_mean": None, "saved_rstd": None, "training": False, "eps": 1e-5, "output_mask": (1, 1, 1)},
58
+ "BatchNormGradExt": {"weight": None, "running_mean": None, "running_var": None, "saved_mean": None, "saved_rstd": None, "training": False, "eps": 1e-5, "output_mask": (1, 1, 1)},
59
59
  "BatchNormGradGrad": {"is_training": False, "epsilon": 1e-5, "data_format": 'NCHW'},
60
60
  "BatchNormGrad": {"is_training": False, "epsilon": 1e-5, "data_format": 'NCHW'},
61
61
  "BatchNormGradWithActivation": {"is_training": False, "epsilon": 1e-5, "data_format": 'NCHW'},
@@ -76,6 +76,7 @@ op_args_default_value = {
76
76
  "CholeskyInverse": {"upper": False},
77
77
  "Cholesky": {"upper": False},
78
78
  "Chunk": {"dim": 0},
79
+ "ChunkView": {"dim": 0},
79
80
  "ClampScalar": {"min": None, "max": None},
80
81
  "ClampTensor": {"min": None, "max": None},
81
82
  "Col2ImExt": {"dilation": 1, "padding": 0, "stride": 1},
@@ -95,6 +96,8 @@ op_args_default_value = {
95
96
  "ConvTranspose2D": {"bias": None, "stride": 1, "padding": 0, "output_padding": 0, "groups": 1, "dilation": 1},
96
97
  "Correlate": {"pad_mode": 'valid'},
97
98
  "CountNonZero": {"dim": None},
99
+ "CrossEntropyLossGrad": {"weight": None, "grad_zloss": None, "lse_for_zloss": None, "reduction": 'mean', "ignore_index": -100, "label_smoothing": 0.0, "lse_square_scale_for_zloss": 0.0},
100
+ "CrossEntropyLoss": {"weight": None, "reduction": 'mean', "ignore_index": -100, "label_smoothing": 0.0, "lse_square_scale_for_zloss": 0.0, "return_zloss": False},
98
101
  "Cross": {"dim": -65530},
99
102
  "CumsumExt": {"dtype": None},
100
103
  "CumProd": {"exclusive": False, "reverse": False},
@@ -103,6 +106,7 @@ op_args_default_value = {
103
106
  "DCT": {"type": 2, "n": None, "axis": -1, "norm": None},
104
107
  "Dense": {"bias": None},
105
108
  "Diagonal": {"offset": 0, "dim1": 0, "dim2": 1},
109
+ "DiagonalView": {"offset": 0, "dim1": 0, "dim2": 1},
106
110
  "DiagExt": {"diagonal": 0},
107
111
  "DivMods": {"rounding_mode": None},
108
112
  "DivMod": {"rounding_mode": None},
@@ -140,13 +144,12 @@ op_args_default_value = {
140
144
  "FlashAttentionScore": {"real_shift": None, "drop_mask": None, "padding_mask": None, "attn_mask": None, "prefix": None, "actual_seq_qlen": None, "actual_seq_kvlen": None, "keep_prob": 1.0, "scale_value": 1.0, "pre_tokens": 2147483647, "next_tokens": 2147483647, "inner_precise": 0, "input_layout": 'BSH', "sparse_mode": 0},
141
145
  "FlattenExt": {"start_dim": 0, "end_dim": -1},
142
146
  "FullLike": {"dtype": None},
147
+ "FusedAddTopKDiv": {"activate_type": 0, "is_norm": True, "scale": 2.5, "mapping_num": None, "mapping_table": None, "enable_expert_mapping": False},
143
148
  "Gather": {"batch_dims": 0},
144
149
  "GeluExt": {"approximate": 'none'},
145
150
  "GeluGradExt": {"approximate": 'none'},
146
151
  "GenerateEodMaskV2": {"start": 0, "steps": 1, "error_mode": 'cycle', "flip_mode": 'bitflip', "multiply_factor": 0.0, "bit_pos": 0, "flip_probability": 0.0},
147
152
  "GLU": {"axis": -1},
148
- "GmmBackward": {"group_list": None},
149
- "GmmV2Backward": {"group_list": None, "group_list_type": 0},
150
153
  "GridSampler2DGrad": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False, "output_mask": (1, 1)},
151
154
  "GridSampler2D": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False},
152
155
  "GridSampler3DGrad": {"interpolation_mode": 'bilinear', "padding_mode": 'zeros', "align_corners": False, "output_mask": (1, 1)},
@@ -175,11 +178,13 @@ op_args_default_value = {
175
178
  "IncreFlashAttention": {"attn_mask": None, "actual_seq_lengths": None, "pse_shift": None, "dequant_scale1": None, "quant_scale1": None, "dequant_scale2": None, "quant_scale2": None, "quant_offset2": None, "antiquant_scale": None, "antiquant_offset": None, "block_table": None, "kv_padding_size": None, "num_heads": 1, "input_layout": 'BSH', "scale_value": 1.0, "num_key_value_heads": 0, "block_size": 0, "inner_precise": 1},
176
179
  "IndexAddExt": {"alpha": 1},
177
180
  "InnerInplaceIndexPut": {"accumulate": False},
181
+ "InnerMoeTokenUnpermute": {"probs": None, "padded_mode": False, "restore_shape": None},
178
182
  "InplaceAddmm": {"beta": 1, "alpha": 1},
179
183
  "InplaceAddsExt": {"alpha": 1},
180
184
  "InplaceAddExt": {"alpha": 1},
181
185
  "InplaceClampScalar": {"min": None, "max": None},
182
186
  "InplaceClampTensor": {"min": None, "max": None},
187
+ "InplaceCopy": {"non_blocking": False},
183
188
  "InplaceDivMods": {"rounding_mode": None},
184
189
  "InplaceDivMod": {"rounding_mode": None},
185
190
  "InplaceElu": {"alpha": 1.0},
@@ -237,15 +242,19 @@ op_args_default_value = {
237
242
  "Meshgrid": {"indexing": 'xy'},
238
243
  "MinimumGrad": {"grad_x": True, "grad_y": True},
239
244
  "MinDim": {"keepdim": False},
245
+ "Mla": {"attn_mask": None, "deq_scale_qk": None, "deq_scale_pv": None, "q_seq_lens": None, "context_lens": None, "head_num": 32, "scale_value": 0.0, "kv_head_num": 1, "mask_mode": 'MASK_NONE', "is_ring": 0},
246
+ "MlaPreprocess": {"param_cache_mode": 0},
247
+ "MoeDistributeCombine": {"tp_send_counts": None, "x_active_mask": None, "activate_scale": None, "weight_scale": None, "group_list": None, "expand_scales": None, "group_ep": None, "group_tp": None, "tp_world_size": 0, "tp_rank_id": 0, "expert_shard_type": 0, "shared_expert_num": 0, "shared_export_rank_num": 0, "global_bs": 0, "out_dtype": 0, "common_quant_mode": 0, "group_list_type": 0},
248
+ "MoeDistributeDispatch": {"expert_scales": None, "scales": None, "x_active_mask": None, "group_ep": None, "group_tp": None, "tp_world_size": 0, "tp_rank_id": 0, "expert_shard_type": 0, "shared_expert_num": 0, "shared_expert_rank_num": 0, "quant_mode": 0, "global_bs": 0, "expert_token_nums_type": 0},
240
249
  "MoeTokenPermuteGrad": {"num_topk": 1, "padded_mode": False},
241
250
  "MoeTokenPermute": {"num_out_tokens": None, "padded_mode": False},
242
251
  "MoeTokenUnpermuteGrad": {"probs": None, "padded_mode": False, "restore_shape": None},
243
- "MoeTokenUnpermute": {"probs": None, "padded_mode": False, "restore_shape": None},
244
252
  "MSELossExt": {"reduction": 'mean'},
245
253
  "MSELossGradExt": {"reduction": 'mean'},
246
254
  "Nansum": {"dim": None, "keepdim": False, "dtype": None},
247
255
  "NanToNum": {"nan": None, "posinf": None, "neginf": None},
248
256
  "NewEmpty": {"dtype": None, "device": None},
257
+ "NewFull": {"dtype": None},
249
258
  "NewOnes": {"dtype": None},
250
259
  "NewZeros": {"dtype": None},
251
260
  "NLLLoss2d": {"reduction": 'mean', "ignore_index": -100},
@@ -257,10 +266,9 @@ op_args_default_value = {
257
266
  "OneHotExt": {"axis": -1},
258
267
  "OneHot": {"axis": -1},
259
268
  "PagedAttentionMask": {"antiquant_scale": None, "antiquant_offset": None, "alibi_mask": None, "kv_cache_quant_mode": 'DEFAULT'},
260
- "PagedAttention": {"antiquant_scale": None, "antiquant_offset": None, "attn_mask": None, "q_seq_lens": None, "alibi_mask": None, "kv_cache_quant_mode": 'DEFAULT', "mask_mode": 'MASK_DEFAULT', "mla_v_dim": 0},
269
+ "PagedAttention": {"value_cache": None, "block_tables": None, "context_lens": None, "antiquant_scale": None, "antiquant_offset": None, "attn_mask": None, "q_seq_lens": None, "alibi_mask": None, "kv_cache_quant_mode": 'DEFAULT', "mask_mode": 'MASK_DEFAULT', "mla_v_dim": 0},
261
270
  "ProdExt": {"dim": None, "keepdim": False, "dtype": None},
262
271
  "PromptFlashAttention": {"attn_mask": None, "actual_seq_lengths": None, "actual_seq_lengths_kv": None, "pse_shift": None, "deq_scale1": None, "quant_scale1": None, "deq_scale2": None, "quant_scale2": None, "quant_offset2": None, "num_heads": 1, "scale_value": 1.0, "pre_tokens": 2147483647, "next_tokens": 0, "input_layout": 'BSH', "num_key_value_heads": 0, "sparse_mode": 0, "inner_precise": 1},
263
- "PromptKVCache": {"align_mode": 'LEFT'},
264
272
  "Qr": {"full_matrices": False},
265
273
  "RandIntLike": {"dtype": None},
266
274
  "RandInt": {"dtype": None},
@@ -297,6 +305,7 @@ op_args_default_value = {
297
305
  "RFFTFreq": {"d": 1.0, "dtype": None},
298
306
  "RFFTN": {"s": None, "dim": None, "norm": None},
299
307
  "RFFT": {"n": None, "dim": -1, "norm": None},
308
+ "RingAttentionUpdate": {"actual_seq_qlen": None, "layout": 'SBH'},
300
309
  "RmsNorm": {"epsilon": 1e-6},
301
310
  "Roll": {"dims": None},
302
311
  "RotaryPositionEmbeddingGrad": {"dx": None, "mode": 0},
@@ -326,7 +335,9 @@ op_args_default_value = {
326
335
  "SpeedFusionAttention": {"pse": None, "padding_mask": None, "atten_mask": None, "scale": 1.0, "keep_prob": 1.0, "pre_tokens": 2147483647, "next_tokens": 2147483647, "inner_precise": 0, "prefix": None, "actual_seq_qlen": None, "actual_seq_kvlen": None, "sparse_mode": 0, "gen_mask_parallel": True, "sync": False, "pse_type": 1, "q_start_idx": None, "kv_start_idx": None},
327
336
  "Split": {"axis": 0, "output_num": 1},
328
337
  "SplitTensor": {"dim": 0},
338
+ "SplitTensorView": {"dim": 0},
329
339
  "SplitWithSize": {"dim": 0},
340
+ "SplitWithSizeView": {"dim": 0},
330
341
  "Squeeze": {"axis": ()},
331
342
  "StackExt": {"dim": 0},
332
343
  "StdMean": {"dim": None, "correction": 1, "keepdim": False},
@@ -341,6 +352,7 @@ op_args_default_value = {
341
352
  "TensorScatterElements": {"axis": 0, "reduce": 'none'},
342
353
  "TopKRouter": {"drop_type": 0},
343
354
  "TopkExt": {"dim": -1, "largest": True, "sorted": True},
355
+ "TopPRouter": {"drop_type": 0, "threshold": 0.0, "router_prob": 0.0},
344
356
  "TraceV2Grad": {"offset": 0, "axis1": 1, "axis2": 0},
345
357
  "TraceV2": {"offset": 0, "axis1": 1, "axis2": 0, "dtype": None},
346
358
  "TriangularSolve": {"upper": True, "transpose": False, "unitriangular": False},
@@ -349,7 +361,7 @@ op_args_default_value = {
349
361
  "TupleToTensor": {"dtype": None},
350
362
  "Unique2": {"sorted": True, "return_inverse": False, "return_counts": False},
351
363
  "UniqueConsecutive": {"return_inverse": False, "return_counts": False, "dim": None},
352
- "UnstackExt": {"dim": 0},
364
+ "UnstackExtView": {"dim": 0},
353
365
  "UpsampleBicubic2DGrad": {"output_size": None, "scales": None, "align_corners": False},
354
366
  "UpsampleBicubic2D": {"output_size": None, "scales": None, "align_corners": False},
355
367
  "UpsampleBilinear2DGrad": {"output_size": None, "scales": None, "align_corners": False},
@@ -370,6 +382,7 @@ op_args_default_value = {
370
382
  "Zeros": {"dtype": None},
371
383
  "AddRmsNormDynamicQuant": {"smooth_scale2": None, "epsilon": 1e-5},
372
384
  "AddRmsNormQuantV2": {"epsilon": 1e-5},
385
+ "DynamicNTK": {"dtype": mstype.float16},
373
386
  "DynamicQuantExt": {"smooth_scales": None},
374
387
  "FusedInferAttentionScore": {"pse_shift": None, "attn_mask": None, "actual_seq_lengths": None, "actual_seq_lengths_kv": None, "dequant_scale1": None, "quant_scale1": None, "dequant_scale2": None, "quant_scale2": None, "quant_offset2": None, "antiquant_scale": None, "antiquant_offset": None, "block_table": None, "query_padding_size": None, "kv_padding_size": None, "key_antiquant_scale": None, "key_antiquant_offset": None, "value_antiquant_scale": None, "value_antiquant_offset": None, "key_shared_prefix": None, "value_shared_prefix": None, "actual_shared_prefix_len": None, "num_heads": 1, "scale_value": 1.0, "pre_tokens": 2147483647, "next_tokens": 2147483647, "input_layout": 'BSH', "num_key_value_heads": 0, "sparse_mode": 0, "inner_precise": 1, "block_size": 0, "antiquant_mode": 0, "softmax_lse_flag": False, "key_antiquant_mode": 0, "value_antiquant_mode": 0},
375
388
  "GroupedMatmul": {"bias": None, "scale": None, "offset": None, "antiquant_scale": None, "antiquant_offset": None, "group_list": None, "split_item": 0, "group_type": -1, "transpose_a": False, "transpose_b": False},
@@ -379,25 +392,35 @@ op_args_default_value = {
379
392
  "MatmulAllReduceAddRmsNorm": {"reduce_op": 'sum', "comm_turn": 0, "stream_mode": 1},
380
393
  "MoeFinalizeRouting": {"x2": None, "bias": None, "scales": None, "expanded_row_idx": None, "expanded_expert_idx": None},
381
394
  "MoeGatingTopKSoftmax": {"finished": None, "k": 1},
395
+ "MoeInitRoutingQuantV2": {"scale": None, "offset": None},
382
396
  "QuantBatchMatmul": {"offset": None, "bias": None, "pertokenScaleOptional": None, "transpose_x1": False, "transpose_x2": False, "dtype": mstype.float16},
397
+ "QuantMatmul": {"offset": None, "pertoken_scale": None, "bias": None, "output_dtype": None, "x1_dtype": None, "x2_dtype": None, "pertoken_scale_dtype": None, "scale_dtype": None, "group_sizes": None},
383
398
  "QuantV2": {"sqrt_mode": False, "rounding_mode": 'ROUND', "dst_type": mstype.int8},
384
399
  "RmsNormQuant": {"beta": None, "epsilon": 1e-6},
400
+ "SwiGLUDynamicQuant": {"smooth_scale": None},
385
401
  "TransposeBatchMatmulTranspose": {"transpose_a": False, "transpose_b": False},
386
402
  "WeightQuantBatchMatmul": {"antiquant_offset": None, "quant_scale": None, "quant_offset": None, "bias": None, "transpose_x": False, "transpose_weight": False, "antiquant_group_size": 0},
403
+ "AnyExt": {"keepdim": False},
404
+ "FuncMaxPool2D": {"stride": None, "padding": 0, "dilation": (1, 1), "ceil_mode": False, "return_indices": False},
405
+ "GmmBackwardFusion": {"group_list": None, "group_list_type": 0},
406
+ "GmmBackward": {"group_list": None, "group_list_type": 0},
407
+ "Gmm": {"bias": None, "group_list": None, "group_type": 0, "group_list_type": 0},
408
+ "GmmV2BackwardFusion": {"group_list": None, "group_list_type": 0},
409
+ "GmmV2Backward": {"group_list": None, "group_list_type": 0},
410
+ "GmmV2": {"bias": None, "group_list": None, "group_type": 0, "group_list_type": 0},
411
+ "MoeTokenUnpermute": {"probs": None, "padded_mode": False, "restore_shape": None},
387
412
  "DeprecatedAddbmm": {"beta": 1, "alpha": 1},
388
413
  "DeprecatedAddmm": {"beta": 1, "alpha": 1},
389
414
  "DeprecatedAddmv": {"beta": 1, "alpha": 1},
390
415
  "DeprecatedReduceAll": {"dim": None, "keepdim": False},
391
416
  "DeprecatedAllclose": {"rtol": 1e-05, "atol": 1e-08, "equal_nan": False},
392
417
  "DeprecatedReduceAny": {"axis": None, "keep_dims": False},
393
- "DeprecatedAny": {"dim": None, "keepdim": False},
394
418
  "DeprecatedArgmax": {"axis": -1, "keepdims": False},
395
419
  "DeprecatedArgmin": {"axis": None, "keepdims": False},
396
420
  "DeprecatedArgsort": {"axis": -1, "descending": False},
397
421
  "DeprecatedBaddbmm": {"beta": 1, "alpha": 1},
398
422
  "DeprecatedBincount": {"weights": None, "minlength": 0},
399
423
  "DeprecatedChunk": {"axis": 0},
400
- "DeprecatedInplaceCopy": {"non_blocking": False},
401
424
  "DeprecatedCountNonzero": {"axis": (), "keep_dims": False, "dtype": None},
402
425
  "DeprecatedCumsum": {"axis": None, "dtype": None},
403
426
  "DeprecatedDiv": {"rounding_mode": None},
@@ -437,7 +460,9 @@ op_labels = {
437
460
  "AssignSub": {"side_effect_mem": True},
438
461
  "BatchNormElemt": {"side_effect_mem": True},
439
462
  "BatchNormGatherStatsWithCounts": {"side_effect_mem": True},
440
- "DecoderKVCache": {"side_effect_mem": True},
463
+ "BroadcastToView": {"side_effect_mem": True},
464
+ "ChunkView": {"side_effect_mem": True},
465
+ "DiagonalView": {"side_effect_mem": True},
441
466
  "DistCommAllReduce": {"side_effect_mem": True},
442
467
  "DistCommReduce": {"side_effect_mem": True},
443
468
  "DropoutExt": {"side_effect_hidden": True},
@@ -451,12 +476,15 @@ op_labels = {
451
476
  "EmbeddingApplySgd": {"_process_node_engine_id": 'PS'},
452
477
  "Embedding": {"side_effect_mem": True},
453
478
  "EmbeddingTableEvict": {"_process_node_engine_id": 'PS'},
479
+ "ExpandDimsView": {"side_effect_mem": True},
454
480
  "Generator": {"side_effect_mem": True},
455
481
  "GroupTopk": {"side_effect_mem": True},
456
482
  "InnerInplaceIndexPut": {"side_effect_mem": True},
457
483
  "InplaceAddmm": {"side_effect_mem": True},
458
484
  "InplaceAddsExt": {"side_effect_mem": True},
459
485
  "InplaceAddExt": {"side_effect_mem": True},
486
+ "InplaceBernoulliScalar": {"side_effect_mem": True},
487
+ "InplaceBernoulliTensor": {"side_effect_mem": True},
460
488
  "InplaceCopy": {"side_effect_mem": True},
461
489
  "InplaceDivMods": {"side_effect_mem": True},
462
490
  "InplaceDivMod": {"side_effect_mem": True},
@@ -478,28 +506,41 @@ op_labels = {
478
506
  "InplaceLog": {"side_effect_mem": True},
479
507
  "InplaceMaskedFillScalar": {"side_effect_mem": True},
480
508
  "InplaceMaskedFillTensor": {"side_effect_mem": True},
509
+ "InplaceMatmulAdd": {"side_effect_mem": True},
481
510
  "InplaceMuls": {"side_effect_mem": True},
482
511
  "InplaceMul": {"side_effect_mem": True},
483
512
  "InplaceNormal": {"side_effect_mem": True},
484
513
  "InplacePut": {"side_effect_mem": True},
485
514
  "InplaceRandom": {"side_effect_mem": True},
486
515
  "InplaceReLU": {"side_effect_mem": True},
516
+ "InplaceRemainderTensorScalar": {"side_effect_mem": True},
517
+ "InplaceRemainderTensorTensor": {"side_effect_mem": True},
487
518
  "InplaceScatterAdd": {"side_effect_mem": True},
488
519
  "InplaceScatterSrc": {"side_effect_mem": True},
489
520
  "InplaceScatterSrcReduce": {"side_effect_mem": True},
490
521
  "InplaceScatterValue": {"side_effect_mem": True},
491
522
  "InplaceScatterValueReduce": {"side_effect_mem": True},
523
+ "InplaceSiLU": {"side_effect_mem": True},
492
524
  "InplaceSubExt": {"side_effect_mem": True},
493
525
  "InplaceSubScalar": {"side_effect_mem": True},
494
526
  "InplaceTanh": {"side_effect_mem": True},
495
527
  "InplaceThreshold": {"side_effect_mem": True},
496
528
  "InplaceUniform": {"side_effect_mem": True},
529
+ "KvScaleCache": {"side_effect_mem": True},
497
530
  "Log": {"cust_aicpu": 'Log', "base": -1.0, "scale": 1.0, "shift": 0.0},
498
- "PromptKVCache": {"side_effect_mem": True},
531
+ "MlaPreprocess": {"side_effect_mem": True},
532
+ "NarrowView": {"side_effect_mem": True},
499
533
  "ReshapeAndCache": {"side_effect_mem": True},
500
534
  "ResizeD": {"mode": 'linear'},
535
+ "SelectExtView": {"side_effect_mem": True},
501
536
  "SilentCheckV2": {"side_effect_mem": True},
502
537
  "SilentCheckV3": {"side_effect_mem": True},
538
+ "SliceExtView": {"side_effect_mem": True},
539
+ "SplitTensorView": {"side_effect_mem": True},
540
+ "SplitWithSizeView": {"side_effect_mem": True},
541
+ "TransposeExtView": {"side_effect_mem": True},
542
+ "TransposeView": {"side_effect_mem": True},
543
+ "UnstackExtView": {"side_effect_mem": True},
503
544
  "KVCacheScatterUpdate": {"side_effect_mem": True},
504
- "DeprecatedInplaceCopy": {"side_effect_mem": True},
545
+ "InplaceExponential": {"side_effect_mem": True},
505
546
  }