mindspore 2.5.0__cp39-cp39-win_amd64.whl → 2.6.0rc1__cp39-cp39-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. Click here for more details.

Files changed (491)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
  3. mindspore/Newtonsoft.Json.dll +0 -0
  4. mindspore/__init__.py +6 -4
  5. mindspore/_c_dataengine.cp39-win_amd64.pyd +0 -0
  6. mindspore/_c_expression.cp39-win_amd64.pyd +0 -0
  7. mindspore/_c_mindrecord.cp39-win_amd64.pyd +0 -0
  8. mindspore/_check_jit_forbidden_api.py +3 -0
  9. mindspore/_checkparam.py +3 -33
  10. mindspore/_deprecated/__init__.py +17 -0
  11. mindspore/_deprecated/jit.py +198 -0
  12. mindspore/_extends/builtin_operations.py +1 -1
  13. mindspore/_extends/parse/__init__.py +6 -7
  14. mindspore/_extends/parse/compile_config.py +19 -0
  15. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +22 -3
  16. mindspore/_extends/parse/jit_fallback_modules/__init__.py +0 -0
  17. mindspore/_extends/parse/jit_fallback_modules/check_utils.py +123 -0
  18. mindspore/_extends/parse/jit_fallback_modules/third_party_modules.py +50 -0
  19. mindspore/_extends/parse/parser.py +24 -193
  20. mindspore/_extends/parse/resources.py +1 -5
  21. mindspore/_extends/parse/standard_method.py +97 -74
  22. mindspore/_extends/pijit/__init__.py +2 -2
  23. mindspore/_extends/pijit/pijit_func_white_list.py +16 -11
  24. mindspore/_extends/pijit/tensor_func_list.py +27 -0
  25. mindspore/_extends/utils.py +1 -1
  26. mindspore/amp.py +4 -4
  27. mindspore/atlprov.dll +0 -0
  28. mindspore/avcodec-59.dll +0 -0
  29. mindspore/avdevice-59.dll +0 -0
  30. mindspore/avfilter-8.dll +0 -0
  31. mindspore/avformat-59.dll +0 -0
  32. mindspore/avutil-57.dll +0 -0
  33. mindspore/boost/__init__.py +2 -2
  34. mindspore/boost/base.py +3 -7
  35. mindspore/boost/boost_cell_wrapper.py +2 -2
  36. mindspore/c1.dll +0 -0
  37. mindspore/c1xx.dll +0 -0
  38. mindspore/c2.dll +0 -0
  39. mindspore/common/__init__.py +4 -3
  40. mindspore/common/_grad_function.py +56 -0
  41. mindspore/common/_pijit_context.py +14 -5
  42. mindspore/common/_register_for_tensor.py +1 -1
  43. mindspore/common/_stub_tensor.py +5 -10
  44. mindspore/common/_tensor_cpp_method.py +1 -1
  45. mindspore/common/_tensor_docs.py +1915 -3287
  46. mindspore/common/api.py +341 -354
  47. mindspore/common/auto_dynamic_shape.py +41 -44
  48. mindspore/common/dtype.py +5 -2
  49. mindspore/common/dump.py +7 -5
  50. mindspore/common/file_system.py +3 -0
  51. mindspore/common/hook_handle.py +5 -3
  52. mindspore/common/initializer.py +10 -6
  53. mindspore/common/jit_begin_end.py +94 -0
  54. mindspore/common/jit_config.py +6 -1
  55. mindspore/common/jit_context.py +76 -0
  56. mindspore/common/jit_trace.py +378 -0
  57. mindspore/common/lazy_inline.py +2 -2
  58. mindspore/common/mutable.py +5 -4
  59. mindspore/common/parameter.py +106 -39
  60. mindspore/common/seed.py +2 -2
  61. mindspore/common/sparse_tensor.py +23 -17
  62. mindspore/common/tensor.py +297 -714
  63. mindspore/communication/__init__.py +7 -5
  64. mindspore/communication/_comm_helper.py +47 -2
  65. mindspore/communication/comm_func.py +70 -53
  66. mindspore/communication/management.py +83 -17
  67. mindspore/context.py +214 -560
  68. mindspore/dataset/__init__.py +44 -20
  69. mindspore/dataset/audio/__init__.py +2 -8
  70. mindspore/dataset/audio/transforms.py +3 -17
  71. mindspore/dataset/core/config.py +3 -3
  72. mindspore/dataset/engine/cache_client.py +1 -1
  73. mindspore/dataset/engine/datasets.py +102 -120
  74. mindspore/dataset/engine/datasets_audio.py +22 -22
  75. mindspore/dataset/engine/datasets_standard_format.py +43 -24
  76. mindspore/dataset/engine/datasets_text.py +78 -85
  77. mindspore/dataset/engine/datasets_user_defined.py +108 -76
  78. mindspore/dataset/engine/datasets_vision.py +111 -108
  79. mindspore/dataset/engine/iterators.py +5 -3
  80. mindspore/dataset/engine/obs/obs_mindrecord_dataset.py +1 -1
  81. mindspore/dataset/engine/samplers.py +279 -57
  82. mindspore/dataset/engine/serializer_deserializer.py +2 -1
  83. mindspore/dataset/engine/validators.py +10 -0
  84. mindspore/dataset/text/__init__.py +7 -6
  85. mindspore/dataset/text/transforms.py +6 -5
  86. mindspore/dataset/text/utils.py +3 -3
  87. mindspore/dataset/transforms/__init__.py +0 -9
  88. mindspore/dataset/transforms/transforms.py +3 -3
  89. mindspore/dataset/utils/browse_dataset.py +1 -1
  90. mindspore/dataset/vision/__init__.py +2 -9
  91. mindspore/dataset/vision/transforms.py +202 -158
  92. mindspore/dataset/vision/utils.py +7 -5
  93. mindspore/device_context/ascend/op_debug.py +60 -1
  94. mindspore/device_context/ascend/op_tuning.py +0 -4
  95. mindspore/device_manager.py +39 -3
  96. mindspore/dnnl.dll +0 -0
  97. mindspore/dpcmi.dll +0 -0
  98. mindspore/experimental/es/embedding_service.py +35 -27
  99. mindspore/experimental/map_parameter.py +4 -4
  100. mindspore/experimental/optim/adadelta.py +22 -26
  101. mindspore/experimental/optim/adagrad.py +4 -4
  102. mindspore/experimental/optim/adam.py +4 -0
  103. mindspore/experimental/optim/adamax.py +4 -4
  104. mindspore/experimental/optim/adamw.py +4 -0
  105. mindspore/experimental/optim/asgd.py +1 -1
  106. mindspore/experimental/optim/lr_scheduler.py +40 -22
  107. mindspore/experimental/optim/radam.py +5 -5
  108. mindspore/experimental/optim/rprop.py +1 -1
  109. mindspore/experimental/optim/sgd.py +1 -1
  110. mindspore/hal/contiguous_tensors_handle.py +6 -10
  111. mindspore/hal/device.py +55 -81
  112. mindspore/hal/event.py +38 -55
  113. mindspore/hal/memory.py +93 -144
  114. mindspore/hal/stream.py +81 -125
  115. mindspore/include/dataset/constants.h +7 -4
  116. mindspore/include/dataset/execute.h +2 -2
  117. mindspore/jpeg62.dll +0 -0
  118. mindspore/log.py +40 -2
  119. mindspore/mindrecord/__init__.py +20 -7
  120. mindspore/mindspore_backend_common.dll +0 -0
  121. mindspore/mindspore_backend_manager.dll +0 -0
  122. mindspore/mindspore_common.dll +0 -0
  123. mindspore/mindspore_core.dll +0 -0
  124. mindspore/mindspore_dump.dll +0 -0
  125. mindspore/mindspore_frontend.dll +0 -0
  126. mindspore/mindspore_glog.dll +0 -0
  127. mindspore/mindspore_memory_pool.dll +0 -0
  128. mindspore/mindspore_ms_backend.dll +0 -0
  129. mindspore/mindspore_ops.dll +0 -0
  130. mindspore/{mindspore_backend.dll → mindspore_ops_host.dll} +0 -0
  131. mindspore/mindspore_ops_kernel_common.dll +0 -0
  132. mindspore/mindspore_profiler.dll +0 -0
  133. mindspore/mindspore_pyboost.dll +0 -0
  134. mindspore/mindspore_pynative.dll +0 -0
  135. mindspore/mindspore_res_manager.dll +0 -0
  136. mindspore/mindspore_runtime_pipeline.dll +0 -0
  137. mindspore/mint/__init__.py +131 -700
  138. mindspore/mint/distributed/__init__.py +5 -1
  139. mindspore/mint/distributed/distributed.py +194 -109
  140. mindspore/mint/linalg/__init__.py +2 -0
  141. mindspore/mint/nn/__init__.py +280 -18
  142. mindspore/mint/nn/functional.py +282 -64
  143. mindspore/mint/nn/layer/__init__.py +4 -0
  144. mindspore/mint/nn/layer/_functions.py +7 -3
  145. mindspore/mint/nn/layer/activation.py +120 -13
  146. mindspore/mint/nn/layer/conv.py +218 -24
  147. mindspore/mint/nn/layer/normalization.py +15 -16
  148. mindspore/mint/nn/layer/padding.py +1 -1
  149. mindspore/mint/nn/layer/pooling.py +66 -1
  150. mindspore/mint/optim/__init__.py +2 -1
  151. mindspore/mint/optim/sgd.py +171 -0
  152. mindspore/msobj140.dll +0 -0
  153. mindspore/mspdb140.dll +0 -0
  154. mindspore/mspdbcore.dll +0 -0
  155. mindspore/mspdbst.dll +0 -0
  156. mindspore/mspft140.dll +0 -0
  157. mindspore/msvcdis140.dll +0 -0
  158. mindspore/msvcp140_1.dll +0 -0
  159. mindspore/msvcp140_2.dll +0 -0
  160. mindspore/msvcp140_atomic_wait.dll +0 -0
  161. mindspore/msvcp140_codecvt_ids.dll +0 -0
  162. mindspore/nn/__init__.py +4 -1
  163. mindspore/nn/cell.py +1250 -176
  164. mindspore/nn/layer/activation.py +23 -21
  165. mindspore/nn/layer/basic.py +22 -16
  166. mindspore/nn/layer/container.py +1 -1
  167. mindspore/nn/layer/conv.py +22 -17
  168. mindspore/nn/layer/embedding.py +9 -8
  169. mindspore/nn/layer/normalization.py +48 -42
  170. mindspore/nn/layer/pooling.py +75 -31
  171. mindspore/nn/layer/transformer.py +11 -10
  172. mindspore/nn/learning_rate_schedule.py +4 -2
  173. mindspore/nn/loss/loss.py +27 -19
  174. mindspore/nn/optim/ada_grad.py +6 -5
  175. mindspore/nn/optim/adadelta.py +9 -7
  176. mindspore/nn/optim/adafactor.py +1 -1
  177. mindspore/nn/optim/adam.py +16 -12
  178. mindspore/nn/optim/adamax.py +8 -7
  179. mindspore/nn/optim/adasum.py +5 -5
  180. mindspore/nn/optim/asgd.py +1 -1
  181. mindspore/nn/optim/ftrl.py +11 -9
  182. mindspore/nn/optim/lamb.py +1 -1
  183. mindspore/nn/optim/lazyadam.py +12 -10
  184. mindspore/nn/optim/momentum.py +7 -6
  185. mindspore/nn/optim/optimizer.py +2 -2
  186. mindspore/nn/optim/proximal_ada_grad.py +12 -10
  187. mindspore/nn/optim/rmsprop.py +13 -12
  188. mindspore/nn/optim/rprop.py +9 -7
  189. mindspore/nn/optim/sgd.py +9 -6
  190. mindspore/nn/optim/tft_wrapper.py +5 -2
  191. mindspore/nn/probability/bijector/bijector.py +17 -11
  192. mindspore/nn/probability/bijector/gumbel_cdf.py +5 -5
  193. mindspore/nn/probability/bijector/invert.py +2 -2
  194. mindspore/nn/probability/bijector/scalar_affine.py +3 -3
  195. mindspore/nn/probability/bijector/softplus.py +3 -2
  196. mindspore/nn/probability/distribution/beta.py +3 -3
  197. mindspore/nn/probability/distribution/categorical.py +1 -1
  198. mindspore/nn/probability/distribution/cauchy.py +4 -2
  199. mindspore/nn/probability/distribution/exponential.py +6 -7
  200. mindspore/nn/probability/distribution/gamma.py +2 -2
  201. mindspore/nn/probability/distribution/gumbel.py +2 -2
  202. mindspore/nn/probability/distribution/half_normal.py +5 -3
  203. mindspore/nn/probability/distribution/logistic.py +5 -3
  204. mindspore/nn/probability/distribution/poisson.py +1 -1
  205. mindspore/nn/probability/distribution/uniform.py +5 -3
  206. mindspore/nn/reinforcement/_tensors_queue.py +1 -1
  207. mindspore/nn/reinforcement/tensor_array.py +1 -1
  208. mindspore/nn/wrap/__init__.py +6 -6
  209. mindspore/nn/wrap/cell_wrapper.py +178 -117
  210. mindspore/nn/wrap/grad_reducer.py +45 -36
  211. mindspore/nn/wrap/loss_scale.py +3 -3
  212. mindspore/numpy/array_creations.py +3 -3
  213. mindspore/numpy/array_ops.py +1 -1
  214. mindspore/numpy/math_ops.py +4 -4
  215. mindspore/numpy/utils.py +1 -2
  216. mindspore/numpy/utils_const.py +1 -2
  217. mindspore/opencv_core452.dll +0 -0
  218. mindspore/opencv_imgcodecs452.dll +0 -0
  219. mindspore/opencv_imgproc452.dll +0 -0
  220. mindspore/ops/__init__.py +3 -2
  221. mindspore/ops/_grad_experimental/grad_comm_ops.py +18 -3
  222. mindspore/ops/_grad_experimental/grad_debug_ops.py +8 -1
  223. mindspore/ops/_grad_experimental/taylor_rule.py +29 -0
  224. mindspore/ops/_register_for_op.py +0 -11
  225. mindspore/{ops_generate → ops/_utils}/arg_dtype_cast.py +123 -4
  226. mindspore/{ops_generate → ops/_utils}/arg_handler.py +3 -4
  227. mindspore/ops/_vmap/vmap_array_ops.py +7 -6
  228. mindspore/ops/_vmap/vmap_grad_nn_ops.py +2 -1
  229. mindspore/ops/_vmap/vmap_math_ops.py +4 -7
  230. mindspore/ops/_vmap/vmap_nn_ops.py +9 -8
  231. mindspore/ops/auto_generate/__init__.py +4 -3
  232. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +102 -49
  233. mindspore/ops/auto_generate/gen_extend_func.py +281 -135
  234. mindspore/ops/auto_generate/gen_ops_def.py +2574 -2326
  235. mindspore/ops/auto_generate/gen_ops_prim.py +8566 -2755
  236. mindspore/ops/auto_generate/pyboost_inner_prim.py +106 -76
  237. mindspore/ops/composite/__init__.py +2 -1
  238. mindspore/ops/composite/base.py +19 -24
  239. mindspore/ops/composite/math_ops.py +6 -16
  240. mindspore/ops/composite/multitype_ops/__init__.py +5 -2
  241. mindspore/ops/composite/multitype_ops/_compile_utils.py +2 -3
  242. mindspore/ops/composite/multitype_ops/_constexpr_utils.py +1 -2
  243. mindspore/ops/composite/multitype_ops/add_impl.py +2 -1
  244. mindspore/ops/composite/multitype_ops/bitwise_and_impl.py +2 -1
  245. mindspore/ops/composite/multitype_ops/bitwise_or_impl.py +2 -1
  246. mindspore/ops/composite/multitype_ops/bitwise_xor_impl.py +2 -1
  247. mindspore/ops/composite/multitype_ops/div_impl.py +6 -4
  248. mindspore/ops/composite/multitype_ops/equal_impl.py +4 -3
  249. mindspore/ops/composite/multitype_ops/floordiv_impl.py +2 -1
  250. mindspore/ops/composite/multitype_ops/getitem_impl.py +3 -2
  251. mindspore/ops/composite/multitype_ops/greater_equal_impl.py +4 -3
  252. mindspore/ops/composite/multitype_ops/greater_impl.py +4 -3
  253. mindspore/ops/composite/multitype_ops/in_impl.py +2 -1
  254. mindspore/ops/composite/multitype_ops/invert_impl.py +50 -0
  255. mindspore/ops/composite/multitype_ops/left_shift_impl.py +2 -1
  256. mindspore/ops/composite/multitype_ops/less_equal_impl.py +4 -3
  257. mindspore/ops/composite/multitype_ops/less_impl.py +4 -3
  258. mindspore/ops/composite/multitype_ops/logic_not_impl.py +3 -2
  259. mindspore/ops/composite/multitype_ops/logical_and_impl.py +2 -1
  260. mindspore/ops/composite/multitype_ops/logical_or_impl.py +2 -1
  261. mindspore/ops/composite/multitype_ops/mod_impl.py +2 -1
  262. mindspore/ops/composite/multitype_ops/mul_impl.py +3 -2
  263. mindspore/ops/composite/multitype_ops/negative_impl.py +2 -1
  264. mindspore/ops/composite/multitype_ops/not_equal_impl.py +2 -1
  265. mindspore/ops/composite/multitype_ops/not_in_impl.py +2 -1
  266. mindspore/ops/composite/multitype_ops/ones_like_impl.py +18 -0
  267. mindspore/ops/composite/multitype_ops/pow_impl.py +2 -1
  268. mindspore/ops/composite/multitype_ops/right_shift_impl.py +2 -1
  269. mindspore/ops/composite/multitype_ops/setitem_impl.py +2 -1
  270. mindspore/ops/composite/multitype_ops/sub_impl.py +2 -1
  271. mindspore/ops/function/__init__.py +28 -2
  272. mindspore/ops/function/_add_attr_func.py +58 -0
  273. mindspore/ops/function/array_func.py +1629 -2345
  274. mindspore/ops/function/clip_func.py +38 -45
  275. mindspore/ops/function/debug_func.py +36 -44
  276. mindspore/ops/function/grad/__init__.py +1 -0
  277. mindspore/ops/function/grad/grad_func.py +104 -71
  278. mindspore/ops/function/image_func.py +1 -1
  279. mindspore/ops/function/linalg_func.py +46 -78
  280. mindspore/ops/function/math_func.py +3035 -3705
  281. mindspore/ops/function/nn_func.py +676 -241
  282. mindspore/ops/function/other_func.py +159 -1
  283. mindspore/ops/function/parameter_func.py +17 -30
  284. mindspore/ops/function/random_func.py +204 -361
  285. mindspore/ops/function/reshard_func.py +4 -70
  286. mindspore/ops/function/sparse_func.py +3 -3
  287. mindspore/ops/function/sparse_unary_func.py +5 -5
  288. mindspore/ops/function/spectral_func.py +25 -58
  289. mindspore/ops/function/vmap_func.py +24 -17
  290. mindspore/ops/functional.py +6 -4
  291. mindspore/ops/functional_overload.py +547 -4
  292. mindspore/ops/op_info_register.py +32 -244
  293. mindspore/ops/operations/__init__.py +10 -5
  294. mindspore/ops/operations/_custom_ops_utils.py +247 -0
  295. mindspore/ops/operations/_grad_ops.py +1 -10
  296. mindspore/ops/operations/_inner_ops.py +5 -76
  297. mindspore/ops/operations/_ms_kernel.py +4 -10
  298. mindspore/ops/operations/_rl_inner_ops.py +1 -1
  299. mindspore/ops/operations/_scalar_ops.py +3 -2
  300. mindspore/ops/operations/_sequence_ops.py +1 -1
  301. mindspore/ops/operations/_tensor_array.py +1 -1
  302. mindspore/ops/operations/array_ops.py +37 -22
  303. mindspore/ops/operations/comm_ops.py +150 -107
  304. mindspore/ops/operations/custom_ops.py +221 -23
  305. mindspore/ops/operations/debug_ops.py +115 -16
  306. mindspore/ops/operations/inner_ops.py +1 -1
  307. mindspore/ops/operations/linalg_ops.py +1 -58
  308. mindspore/ops/operations/manually_defined/_inner.py +1 -1
  309. mindspore/ops/operations/manually_defined/ops_def.py +746 -79
  310. mindspore/ops/operations/math_ops.py +21 -18
  311. mindspore/ops/operations/nn_ops.py +65 -191
  312. mindspore/ops/operations/other_ops.py +62 -9
  313. mindspore/ops/operations/random_ops.py +13 -7
  314. mindspore/ops/operations/reshard_ops.py +1 -1
  315. mindspore/ops/operations/sparse_ops.py +2 -2
  316. mindspore/ops/primitive.py +43 -32
  317. mindspore/ops/tensor_method.py +232 -13
  318. mindspore/ops_generate/__init__.py +0 -5
  319. mindspore/ops_generate/aclnn/__init__.py +0 -0
  320. mindspore/ops_generate/{aclnn_kernel_register_auto_cc_generator.py → aclnn/aclnn_kernel_register_auto_cc_generator.py} +43 -18
  321. mindspore/ops_generate/{gen_aclnn_implement.py → aclnn/gen_aclnn_implement.py} +49 -51
  322. mindspore/ops_generate/api/__init__.py +0 -0
  323. mindspore/ops_generate/{add_tensor_docs_generator.py → api/add_tensor_docs_generator.py} +9 -7
  324. mindspore/ops_generate/{cpp_create_prim_instance_helper_generator.py → api/cpp_create_prim_instance_helper_generator.py} +6 -9
  325. mindspore/ops_generate/{functional_map_cpp_generator.py → api/functional_map_cpp_generator.py} +25 -12
  326. mindspore/ops_generate/{functional_overload_py_generator.py → api/functional_overload_py_generator.py} +8 -6
  327. mindspore/ops_generate/{functions_cc_generator.py → api/functions_cc_generator.py} +14 -10
  328. mindspore/ops_generate/api/gen_api.py +103 -0
  329. mindspore/ops_generate/{op_api_proto.py → api/op_api_proto.py} +98 -69
  330. mindspore/ops_generate/{tensor_func_reg_cpp_generator.py → api/tensor_func_reg_cpp_generator.py} +82 -43
  331. mindspore/ops_generate/common/__init__.py +0 -0
  332. mindspore/ops_generate/common/gen_constants.py +91 -0
  333. mindspore/ops_generate/{gen_utils.py → common/gen_utils.py} +72 -19
  334. mindspore/ops_generate/{op_proto.py → common/op_proto.py} +64 -1
  335. mindspore/ops_generate/{template.py → common/template.py} +96 -84
  336. mindspore/ops_generate/gen_ops.py +23 -325
  337. mindspore/ops_generate/op_def/__init__.py +0 -0
  338. mindspore/ops_generate/op_def/gen_op_def.py +90 -0
  339. mindspore/ops_generate/{lite_ops_cpp_generator.py → op_def/lite_ops_cpp_generator.py} +47 -11
  340. mindspore/ops_generate/{ops_def_cc_generator.py → op_def/ops_def_cc_generator.py} +18 -7
  341. mindspore/ops_generate/{ops_def_h_generator.py → op_def/ops_def_h_generator.py} +5 -5
  342. mindspore/ops_generate/{ops_name_h_generator.py → op_def/ops_name_h_generator.py} +30 -15
  343. mindspore/ops_generate/op_def/ops_primitive_h_generator.py +125 -0
  344. mindspore/ops_generate/op_def_py/__init__.py +0 -0
  345. mindspore/ops_generate/op_def_py/gen_op_def_py.py +47 -0
  346. mindspore/ops_generate/{op_def_py_generator.py → op_def_py/op_def_py_generator.py} +6 -5
  347. mindspore/ops_generate/{op_prim_py_generator.py → op_def_py/op_prim_py_generator.py} +24 -15
  348. mindspore/ops_generate/pyboost/__init__.py +0 -0
  349. mindspore/ops_generate/{auto_grad_impl_cc_generator.py → pyboost/auto_grad_impl_cc_generator.py} +11 -7
  350. mindspore/ops_generate/{auto_grad_reg_cc_generator.py → pyboost/auto_grad_reg_cc_generator.py} +7 -7
  351. mindspore/ops_generate/{gen_pyboost_func.py → pyboost/gen_pyboost_func.py} +40 -16
  352. mindspore/ops_generate/{op_template_parser.py → pyboost/op_template_parser.py} +105 -24
  353. mindspore/ops_generate/{pyboost_functions_cpp_generator.py → pyboost/pyboost_functions_cpp_generator.py} +55 -18
  354. mindspore/ops_generate/{pyboost_functions_h_generator.py → pyboost/pyboost_functions_h_generator.py} +42 -10
  355. mindspore/ops_generate/{pyboost_functions_py_generator.py → pyboost/pyboost_functions_py_generator.py} +6 -6
  356. mindspore/ops_generate/{pyboost_grad_function_cpp_generator.py → pyboost/pyboost_grad_function_cpp_generator.py} +11 -10
  357. mindspore/ops_generate/{pyboost_inner_prim_generator.py → pyboost/pyboost_inner_prim_generator.py} +8 -7
  358. mindspore/ops_generate/{pyboost_native_grad_functions_generator.py → pyboost/pyboost_native_grad_functions_generator.py} +14 -10
  359. mindspore/ops_generate/{pyboost_op_cpp_code_generator.py → pyboost/pyboost_op_cpp_code_generator.py} +140 -53
  360. mindspore/ops_generate/{pyboost_overload_functions_cpp_generator.py → pyboost/pyboost_overload_functions_cpp_generator.py} +28 -15
  361. mindspore/ops_generate/{pyboost_utils.py → pyboost/pyboost_utils.py} +88 -4
  362. mindspore/ops_generate/resources/__init__.py +0 -0
  363. mindspore/ops_generate/resources/resource_list.py +30 -0
  364. mindspore/ops_generate/resources/resource_loader.py +36 -0
  365. mindspore/ops_generate/resources/resource_manager.py +64 -0
  366. mindspore/ops_generate/resources/yaml_loader.py +88 -0
  367. mindspore/ops_generate/tensor_py_cc_generator.py +122 -0
  368. mindspore/parallel/__init__.py +6 -2
  369. mindspore/parallel/_auto_parallel_context.py +133 -6
  370. mindspore/parallel/_cell_wrapper.py +130 -15
  371. mindspore/parallel/_parallel_serialization.py +95 -4
  372. mindspore/parallel/_ps_context.py +1 -1
  373. mindspore/parallel/_recovery_context.py +7 -2
  374. mindspore/parallel/_tensor.py +142 -18
  375. mindspore/parallel/_utils.py +198 -25
  376. mindspore/parallel/algo_parameter_config.py +3 -3
  377. mindspore/parallel/auto_parallel.py +732 -0
  378. mindspore/parallel/checkpoint_convert.py +159 -0
  379. mindspore/parallel/checkpoint_transform.py +656 -37
  380. mindspore/parallel/cluster/process_entity/_api.py +151 -19
  381. mindspore/parallel/cluster/run.py +1 -1
  382. mindspore/parallel/function/__init__.py +24 -0
  383. mindspore/parallel/function/reshard_func.py +259 -0
  384. mindspore/parallel/nn/__init__.py +25 -0
  385. mindspore/parallel/nn/parallel_cell_wrapper.py +263 -0
  386. mindspore/parallel/nn/parallel_grad_reducer.py +169 -0
  387. mindspore/parallel/parameter_broadcast.py +24 -13
  388. mindspore/parallel/shard.py +137 -61
  389. mindspore/parallel/transform_safetensors.py +287 -95
  390. mindspore/pgodb140.dll +0 -0
  391. mindspore/pgort140.dll +0 -0
  392. mindspore/profiler/__init__.py +9 -5
  393. mindspore/profiler/analysis/parser/ascend_cann_parser.py +6 -2
  394. mindspore/profiler/analysis/parser/ms_framework_parser.py +4 -4
  395. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +7 -4
  396. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +22 -0
  397. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +3 -3
  398. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +241 -86
  399. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +41 -2
  400. mindspore/profiler/analysis/viewer/ascend_kernel_details_viewer.py +33 -35
  401. mindspore/profiler/analysis/viewer/ascend_memory_viewer.py +7 -0
  402. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +8 -3
  403. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +141 -30
  404. mindspore/profiler/analysis/viewer/ms_dataset_viewer.py +5 -6
  405. mindspore/profiler/common/ascend_msprof_exporter.py +5 -4
  406. mindspore/profiler/common/constant.py +12 -0
  407. mindspore/profiler/common/msprof_cmd_tool.py +42 -23
  408. mindspore/profiler/common/path_manager.py +24 -0
  409. mindspore/profiler/common/profiler_context.py +26 -2
  410. mindspore/profiler/common/profiler_meta_data.py +74 -0
  411. mindspore/profiler/common/profiler_parameters.py +59 -18
  412. mindspore/profiler/common/profiler_path_manager.py +66 -7
  413. mindspore/profiler/dynamic_profiler.py +112 -79
  414. mindspore/profiler/envprofiler.py +26 -1
  415. mindspore/profiler/experimental_config.py +197 -0
  416. mindspore/profiler/mstx.py +57 -14
  417. mindspore/profiler/platform/npu_profiler.py +33 -7
  418. mindspore/profiler/profiler.py +541 -45
  419. mindspore/profiler/profiler_action_controller.py +1 -1
  420. mindspore/profiler/profiler_interface.py +4 -0
  421. mindspore/profiler/schedule.py +57 -22
  422. mindspore/rewrite/api/node.py +15 -13
  423. mindspore/rewrite/api/symbol_tree.py +1 -1
  424. mindspore/run_check/_check_version.py +25 -14
  425. mindspore/run_check/run_check.py +1 -1
  426. mindspore/runtime/__init__.py +2 -2
  427. mindspore/runtime/executor.py +40 -11
  428. mindspore/runtime/memory.py +25 -8
  429. mindspore/safeguard/rewrite_obfuscation.py +12 -9
  430. mindspore/swresample-4.dll +0 -0
  431. mindspore/swscale-6.dll +0 -0
  432. mindspore/tbbmalloc.dll +0 -0
  433. mindspore/tinyxml2.dll +0 -0
  434. mindspore/train/__init__.py +8 -8
  435. mindspore/train/_utils.py +35 -7
  436. mindspore/train/amp.py +1 -1
  437. mindspore/train/callback/__init__.py +2 -2
  438. mindspore/train/callback/_callback.py +2 -16
  439. mindspore/train/callback/_checkpoint.py +24 -40
  440. mindspore/train/callback/_cluster_monitor.py +14 -18
  441. mindspore/train/callback/_flops_collector.py +2 -3
  442. mindspore/train/callback/_history.py +7 -4
  443. mindspore/train/callback/_lambda_callback.py +2 -2
  444. mindspore/train/callback/_landscape.py +0 -3
  445. mindspore/train/callback/_loss_monitor.py +2 -1
  446. mindspore/train/callback/_on_request_exit.py +6 -5
  447. mindspore/train/callback/_reduce_lr_on_plateau.py +11 -6
  448. mindspore/train/callback/_summary_collector.py +8 -13
  449. mindspore/train/callback/_time_monitor.py +2 -1
  450. mindspore/train/callback/{_tft_register.py → _train_fault_tolerance.py} +179 -103
  451. mindspore/train/data_sink.py +25 -2
  452. mindspore/train/dataset_helper.py +4 -5
  453. mindspore/train/loss_scale_manager.py +8 -7
  454. mindspore/train/metrics/accuracy.py +3 -3
  455. mindspore/train/metrics/confusion_matrix.py +9 -9
  456. mindspore/train/metrics/error.py +3 -3
  457. mindspore/train/metrics/hausdorff_distance.py +4 -4
  458. mindspore/train/metrics/mean_surface_distance.py +3 -3
  459. mindspore/train/metrics/metric.py +0 -12
  460. mindspore/train/metrics/occlusion_sensitivity.py +4 -2
  461. mindspore/train/metrics/precision.py +8 -6
  462. mindspore/train/metrics/recall.py +9 -9
  463. mindspore/train/metrics/root_mean_square_surface_distance.py +2 -2
  464. mindspore/train/mind_ir_pb2.py +19 -12
  465. mindspore/train/model.py +176 -103
  466. mindspore/train/serialization.py +246 -988
  467. mindspore/train/summary/_summary_adapter.py +2 -2
  468. mindspore/train/summary/summary_record.py +1 -1
  469. mindspore/turbojpeg.dll +0 -0
  470. mindspore/utils/__init__.py +3 -2
  471. mindspore/utils/dryrun.py +4 -2
  472. mindspore/utils/hooks.py +81 -0
  473. mindspore/utils/utils.py +138 -4
  474. mindspore/vcmeta.dll +0 -0
  475. mindspore/vcruntime140.dll +0 -0
  476. mindspore/vcruntime140_1.dll +0 -0
  477. mindspore/version.py +1 -1
  478. {mindspore-2.5.0.dist-info → mindspore-2.6.0rc1.dist-info}/METADATA +2 -1
  479. {mindspore-2.5.0.dist-info → mindspore-2.6.0rc1.dist-info}/RECORD +483 -438
  480. mindspore/_install_custom.py +0 -43
  481. mindspore/common/_register_for_adapter.py +0 -74
  482. mindspore/ops/auto_generate/gen_arg_dtype_cast.py +0 -252
  483. mindspore/ops/auto_generate/gen_arg_handler.py +0 -136
  484. mindspore/ops/operations/_opaque_predicate_registry.py +0 -41
  485. mindspore/ops_generate/gen_constants.py +0 -190
  486. mindspore/ops_generate/gen_ops_inner_prim.py +0 -131
  487. mindspore/ops_generate/ops_primitive_h_generator.py +0 -81
  488. mindspore/ops_generate/{base_generator.py → common/base_generator.py} +0 -0
  489. {mindspore-2.5.0.dist-info → mindspore-2.6.0rc1.dist-info}/WHEEL +0 -0
  490. {mindspore-2.5.0.dist-info → mindspore-2.6.0rc1.dist-info}/entry_points.txt +0 -0
  491. {mindspore-2.5.0.dist-info → mindspore-2.6.0rc1.dist-info}/top_level.txt +0 -0
@@ -19,15 +19,18 @@ import sys
19
19
  import signal
20
20
  import subprocess
21
21
  import socket
22
+ import psutil
22
23
  import mindspore.log as logger
23
- from ._utils import _generate_cmd_args_list, _generate_cmd_args_list_with_core, _generate_url,\
24
- _is_local_ip, _convert_addr_to_ip, _send_scale_num, _get_local_ip
24
+ from ._utils import _generate_cmd_args_list, _generate_cmd_args_list_with_core, _generate_url, \
25
+ _is_local_ip, _convert_addr_to_ip, _send_scale_num, _get_local_ip
26
+
25
27
 
26
28
  class _Node:
27
29
  """
28
30
  Base class for dynamic networking nodes.
29
31
 
30
32
  """
33
+
31
34
  def __init__(self, worker_num, sched_host, sched_port, timeout, args_list, output_file, tail_worker_log,
32
35
  join, is_simulation):
33
36
  self.worker_num = worker_num
@@ -40,24 +43,26 @@ class _Node:
40
43
  self.join = join
41
44
  self.is_simulation = is_simulation
42
45
 
43
-
44
46
  def run(self):
45
47
  """
46
48
  Runs the node by setting environment variables and executing the entrypoint command or script.
47
49
 
48
50
  """
49
51
  os.environ["MS_WORKER_NUM"] = str(self.worker_num)
50
- # If simulation level is set, environment variables for dynamic networking will not be set and scheduler will not be started.
52
+ # If simulation level is set, environment variables for dynamic networking will not be set,
53
+ # and scheduler will not be started.
51
54
  if not self.is_simulation:
52
55
  os.environ["MS_SCHED_HOST"] = self.sched_host
53
56
  os.environ["MS_SCHED_PORT"] = str(self.sched_port)
54
57
  os.environ["MS_TOPO_TIMEOUT"] = str(self.timeout)
55
58
 
59
+
56
60
  class _MetaServerNode(_Node):
57
61
  """
58
62
  Scheduler node for dynamic networking. Inherits from the Node class.
59
63
 
60
64
  """
65
+
61
66
  def run(self):
62
67
  """
63
68
  Runs the MetaServerNode by setting environment variables, setting the MS_ROLE variable to
@@ -68,17 +73,18 @@ class _MetaServerNode(_Node):
68
73
  with open(self.output_file, "w") as file_handle:
69
74
  return subprocess.Popen(self.args_list, stdout=file_handle, stderr=subprocess.STDOUT)
70
75
 
76
+
71
77
  class _ComputeGraphNode(_Node):
72
78
  """
73
79
  Worker node for dynamic networking. Inherits from the Node class.
74
80
  """
81
+
75
82
  def __init__(self, worker_num, sched_host, sched_port, timeout, node_id, args_list, output_file,
76
83
  tail_worker_log, join, is_simulation):
77
84
  super().__init__(worker_num, sched_host, sched_port, timeout, args_list, output_file,
78
85
  tail_worker_log, join, is_simulation)
79
86
  self.node_id = node_id
80
87
 
81
-
82
88
  def run(self):
83
89
  """
84
90
  Runs the ComputeGraphNode by setting environment variables, setting the MS_NODE_ID variable
@@ -127,6 +133,7 @@ class _ProcessManager:
127
133
  training
128
134
 
129
135
  """
136
+
130
137
  def __init__(self, args):
131
138
  """
132
139
  Initializes a ProcessManager object.
@@ -198,6 +205,21 @@ class _ProcessManager:
198
205
  finally:
199
206
  os.umask(origin_mask)
200
207
 
208
+ self.proc_rank_map = {}
209
+ self.enable_mindx = False
210
+ tft_env = os.getenv("MS_ENABLE_TFT", "")
211
+ if ("TTP:1" in tft_env) or ("UCE:1" in tft_env) or ("ARF:1" in tft_env):
212
+ try:
213
+ from taskd.python.framework.agent.ms_mgr.msrun_plugin import MSRunPlugin
214
+ self.msmgr = MSRunPlugin()
215
+ self.msmgr.register_callbacks("KILL_WORKER", self.kill_workers)
216
+ self.msmgr.register_callbacks("START_ALL_WORKER", self.start_all_workers)
217
+ self.msmgr.register_callbacks("MONITOR", self.monitor_rank_status)
218
+ self.enable_mindx = True
219
+ os.environ["MS_ENABLE_RECOVERY"] = str(1)
220
+ except Exception as e: # pylint: disable=broad-except
221
+ logger.warning(f"mindx is not installed, using original mindspore recovery strategy.: {str(e)}")
222
+
201
223
  def run(self):
202
224
  """
203
225
  Runs the process manager.
@@ -218,11 +240,13 @@ class _ProcessManager:
218
240
  else:
219
241
  if self.is_master and not self.is_simulation:
220
242
  self.start_scheduler()
221
- self.start_workers()
222
-
223
- if self.join:
224
- logger.warning("Distributed job is spawned. Waiting all processes to exit...")
225
- self.join_processes()
243
+ if self.enable_mindx:
244
+ self.msmgr.start()
245
+ else:
246
+ self.start_workers()
247
+ if self.join:
248
+ logger.warning("Distributed job is spawned. Waiting all processes to exit...")
249
+ self.join_processes()
226
250
 
227
251
  def start_scheduler(self):
228
252
  """
@@ -262,17 +286,17 @@ class _ProcessManager:
262
286
  # If node_id is generated in '_get_node_id_and_log_path' method, export 'RANK_ID' environment variable.
263
287
  # This is for rank_table method's compatibility consideration.
264
288
  os.environ["RANK_ID"] = str(node_id)
265
- logger.warning(f"Start worker process with rank id:{node_id}, log file:{log_name}. "
266
- "Environment variable [RANK_ID] is exported.")
289
+ print(f"Start worker process with rank id:{node_id}, log file:{log_name}. "
290
+ f"Environment variable [RANK_ID={node_id}] is exported.", flush=True)
267
291
  if self.is_simulation and (self.sim_rank_id != -1):
268
292
  # Reset RANK_ID env to sim_rank_id if sim_rank_id is set.
269
293
  os.environ["RANK_ID"] = str(self.sim_rank_id)
270
294
  logger.warning(f"In dryrun case, RANK_ID is assigned to {self.sim_rank_id}.")
271
295
 
272
- cpu_num = subprocess.getoutput("cat /proc/cpuinfo|grep processor|wc -l")
273
- if not cpu_num.isdigit():
274
- raise RuntimeError("Fail to get cpu number from /proc/cpuinfo.")
275
296
  if self.bind_core:
297
+ cpu_num = subprocess.getoutput("cat /proc/cpuinfo|grep processor|wc -l")
298
+ if not cpu_num.isdigit():
299
+ raise RuntimeError(f"Got cpu number from '/proc/cpuinfo' is {cpu_num}, failed to bind core.")
276
300
  avg = int(cpu_num) // self.local_worker_num
277
301
  cpu_start = avg * i
278
302
  cpu_end = cpu_start + avg - 1
@@ -284,7 +308,7 @@ class _ProcessManager:
284
308
  process, tail_process = cgn.run()
285
309
  self.cgn_processes.append(process)
286
310
  self.tail_cgn_processes.append(tail_process)
287
-
311
+ self.proc_rank_map[i] = process
288
312
 
289
313
  def join_processes(self):
290
314
  """
@@ -292,6 +316,7 @@ class _ProcessManager:
292
316
  If there's any process does not exit normally, logs will be analyzed
293
317
  so that understandable root cause of exception could be returned.
294
318
  """
319
+
295
320
  def signal_handler(sig, frame):
296
321
  logger.warning("msrun process received SIGNIN (Ctrl+C), terminating all workers.")
297
322
  self.kill_all_processes()
@@ -331,7 +356,7 @@ class _ProcessManager:
331
356
  logger.error(f"Scheduler process {self.msn_process.pid} exit with exception.")
332
357
 
333
358
  if has_exception:
334
- logger.warning("Analyzing exception log...")
359
+ logger.info("Analyzing exception log...")
335
360
  self._analyze_log()
336
361
  raise RuntimeError("Distributed job exited with exception. Please check logs in "
337
362
  f"directory: {self.log_dir}.")
@@ -388,6 +413,115 @@ class _ProcessManager:
388
413
  self.start_scheduler()
389
414
  self.start_workers()
390
415
 
416
def kill_all_workers(self):
    """
    Kill every worker process that is still running, plus all tail processes.

    A worker is only signalled when its ``poll()`` still returns None. Entries of
    ``self.tail_cgn_processes`` that are None are skipped. Both lists are emptied afterwards.

    Args:
        NA.
    """
    for worker in self.cgn_processes:
        if worker.poll() is not None:
            # Already exited, nothing to kill.
            continue
        worker.kill()
    self.cgn_processes.clear()

    for tail_worker in self.tail_cgn_processes:
        if tail_worker is None:
            continue
        tail_worker.kill()
    self.tail_cgn_processes.clear()
432
+
433
def kill_single_worker(self, pid):
    """
    Kill the running worker process whose pid equals ``pid``.

    The matching entry is removed from ``self.cgn_processes`` and the entry at the same index is
    removed from ``self.tail_cgn_processes`` (after being killed when it is not None). A warning is
    logged when no running worker has the given pid.

    Args:
        pid: Worker process' pid.
    """
    for index, worker in enumerate(self.cgn_processes):
        if worker.pid != pid or worker.poll() is not None:
            continue
        worker.kill()
        del self.cgn_processes[index]
        # The tail process list is kept index-aligned with the worker list.
        tail_worker = self.tail_cgn_processes[index]
        if tail_worker is not None:
            tail_worker.kill()
        del self.tail_cgn_processes[index]
        return
    logger.warning(f"There's no active worker with pid: {pid}")
454
+
455
def kill_workers(self, pids):
    """
    Kill the worker processes whose pid is listed in ``pids``.

    Args:
        pids(list): a list of worker process pids. When pids contains -1, all worker processes are killed.

    Returns:
        int, always 0.
    """
    if -1 not in pids:
        for worker_pid in pids:
            self.kill_single_worker(worker_pid)
        return 0
    self.kill_all_workers()
    return 0
468
+
469
def monitor_rank_status(self, local_ranks):
    """
    Collect the status of the workers whose local rank is listed in ``local_ranks``.

    Args:
        local_ranks(list): a list of local worker ranks. When local_ranks contains -1,
            the status of all ``self.local_worker_num`` workers is collected.

    Returns:
        dict, maps each local rank to the non-empty status returned by ``monitor_single_rank``.
        Ranks for which an empty status is returned are left out.
    """
    ranks_to_check = list(range(self.local_worker_num)) if -1 in local_ranks else local_ranks
    collected = {}
    for local_rank in ranks_to_check:
        rank_info = self.monitor_single_rank(local_rank)
        if not rank_info:
            continue
        collected[local_rank] = rank_info
    return collected
485
+
486
def monitor_single_rank(self, rank_id):
    """
    Report the status of the single worker with local rank ``rank_id``.

    Args:
        rank_id: worker process's local rank, which is also device_id.

    Returns:
        dict. Empty when ``rank_id`` is outside ``[0, self.local_worker_num)``. Otherwise it holds
        the keys "pid", "status" and "global_rank". "status" is the result of the process'
        ``poll()``, replaced by 300 when the pid no longer exists and the result is not 0.
        When no process is recorded for the rank, "pid" is None and "status" is 200.
    """
    if not 0 <= rank_id < self.local_worker_num:
        logger.warning("Invalid rank id!")
        return {}

    if self.node_rank >= 0:
        global_rank_id = self.node_rank * self.local_worker_num + rank_id
    else:
        global_rank_id = rank_id
    try:
        worker = self.proc_rank_map[rank_id]
        exit_status = worker.poll()
        pid_alive = psutil.pid_exists(worker.pid)
        if not pid_alive and exit_status != 0:
            exit_status = 300
        return {"pid": worker.pid, "status": exit_status, "global_rank": global_rank_id}
    except KeyError:
        logger.info(f"Process rank {rank_id} has not been initialized.")
        return {"pid": None, "status": 200, "global_rank": global_rank_id}
509
+
510
def start_all_workers(self):
    """
    Start all worker processes after killing any workers that are still tracked.

    Args:
        NA.

    Returns:
        int, 0 when every local rank reports a status of None right after start-up,
        1 when at least one rank already reports any other status.
    """
    if self.cgn_processes:
        self.kill_all_workers()
    self.start_workers()
    worker_status = self.monitor_rank_status([-1])
    # None is a singleton, so test it by identity instead of `!= None`.
    all_running = all(worker_status[rank]["status"] is None for rank in range(self.local_worker_num))
    return 0 if all_running else 1
391
525
 
392
526
  def _get_node_id_and_log_path(self, index):
393
527
  """
@@ -410,7 +544,6 @@ class _ProcessManager:
410
544
  log_name = os.path.join(self.log_dir, formatted_log_name + "_" + str(index) + ".log")
411
545
  return node_id, log_name
412
546
 
413
-
414
547
  def _analyze_log(self):
415
548
  """
416
549
  Analyze exception logs.
@@ -432,7 +565,6 @@ class _ProcessManager:
432
565
 
433
566
  os.system(f"grep -rn -E 'ERROR|CRITICAL|Traceback|Error' -C 5 {self.log_dir}")
434
567
 
435
-
436
568
  def format_worker_log_name(self):
437
569
  """
438
570
  Format worker log files' name.
@@ -85,7 +85,7 @@ def get_args():
85
85
  "--sim_level",
86
86
  default=-1,
87
87
  type=int,
88
- choices=[0, 1],
88
+ choices=[0, 1, 2, 3],
89
89
  help="specifies simulation level. When this argument is set, msrun only spawns one process "
90
90
  "but export RANK_SIZE with value worker_num and RANK_ID with value sim_rank_id."
91
91
  )
@@ -0,0 +1,24 @@
1
+ # Copyright 2025 Huawei Technologies Co., Ltd
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+ # ============================================================================
15
+
16
+ """
17
+ Parallel function operator
18
+ """
19
+
20
# Import the submodule by name so that `reshard_func.__all__` below does not rely on the implicit
# binding that `from ...reshard_func import reshard` leaves in the package namespace.
from mindspore.parallel.function import reshard_func
from mindspore.parallel.function.reshard_func import reshard

__all__ = []
__all__.extend(reshard_func.__all__)
__all__.sort()
@@ -0,0 +1,259 @@
1
+ # Copyright 2023 Huawei Technologies Co., Ltd
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+ # ============================================================================
15
+ """Defines parameter operators with functional form."""
16
+ import mindspore as ms
17
+ from mindspore import context, ops
18
+ from mindspore import log as logger
19
+ from mindspore.ops import operations as P
20
+ from mindspore.ops._primitive_cache import _get_cache_prim
21
+ from mindspore.common.tensor import Tensor
22
+ from mindspore.communication.management import get_group_size, get_rank
23
+ from mindspore.parallel.shard import Layout, _DistributedTensorInfo
24
+ from mindspore.parallel._auto_parallel_context import _get_all_auto_parallel_context, _recover_auto_parallel_context
25
+ from mindspore.ops.primitive import constexpr
26
+
27
+
28
+ REDIST_CELL_CACHE = {}
29
+ COMM_TENSOR_CELL_CACHE = {}
30
+
31
+
32
@constexpr
def group_size():
    """ Return the device number (the result of get_group_size) for use in the Cell's construct method. """
    device_num = get_group_size()
    return device_num
36
+
37
+
38
+ # pylint: disable=W0212
39
def reshard(tensor, layout):
    r"""
    Convert a tensor from one distributed arrangement to another distributed arrangement.
    The given layout must be of type mindspore.parallel.Layout,
    see :class:`mindspore.parallel.Layout` for reference.

    Note:
        - In the Graph mode, this function can set the sharding propagation strategy of a tensor.
          For tensors whose strategy is not set manually, the strategy is decided by the sharding
          strategy propagation algorithm automatically.
        - In PyNative mode, you can use this method to arrange tensors in a cell (that is, cells
          that use Cell.shard/F.shard in PyNative mode) that is executed in parallel in graph mode.

    Args:
        tensor (Tensor): The tensor to be set the sharding strategy.
        layout (Layout): The layout to shard the tensor precisely, including the device
                         arrangement (device_matrix) and the alias for the device matrix
                         (alias_name).

    Returns:
        Tensor. The mathematically equivalent of the input tensor.

    Raises:
        TypeError: Reshard takes in Tensor type as the first input param, but got: `type(tensor)`.
        TypeError: Reshard only support type mindspore.parallel.Layout but got: `type(layout)`.

    Supported Platforms:
        ``Ascend``

    Examples:
        .. note::
            Before running the following examples, you need to configure the communication environment variables.

            For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
            without any third-party or configuration file dependencies.
            Please see the `msrun start-up
            <https://www.mindspore.cn/tutorials/en/master/parallel/msrun_launcher.html>`_
            for more details.

            This example should be run with 8 devices.

        >>> import numpy as np
        >>> import mindspore as ms
        >>> from mindspore import ops, nn, Tensor, context, Layout
        >>> from mindspore.parallel.function import reshard
        >>> from mindspore.nn.utils import no_init_parameters
        >>> from mindspore.parallel.auto_parallel import AutoParallel
        >>> from mindspore.communication import init
        >>> context.set_context(mode=ms.GRAPH_MODE)
        >>> init()
        >>> class Network(nn.Cell):
        ...     def __init__(self):
        ...         super().__init__()
        ...         self.matmul = ops.MatMul()
        ...         self.relu = ops.ReLU()
        ...     def construct(self, x, layout):
        ...         x = self.relu(x)
        ...         x_reshard = reshard(x, layout)
        ...         y = Tensor(np.ones(shape=(128, 128)), dtype=ms.float32)
        ...         x = self.matmul(x_reshard, y)
        ...         return x
        >>> layout = Layout((4, 2), ("dp", "mp"))
        >>> input_layout = layout("dp", "mp")
        >>> with no_init_parameters():
        ...     net = Network()
        >>> parallel_net = AutoParallel(net, parallel_mode='sharding_propagation')
        >>> tensor = Tensor(np.ones(shape=(128, 128)), dtype=ms.float32)
        >>> out = parallel_net(tensor, input_layout)
    """
    # With a single device the tensor is returned as is, before any argument type check.
    if group_size() == 1:
        return tensor
    if not isinstance(tensor, Tensor):
        raise TypeError(f"Reshard takes in Tensor type as the first input param, but got: {type(tensor)}.")
    if not isinstance(layout, Layout):
        raise TypeError(f"Reshard only support type mindspore.parallel.Layout, but got: {type(layout)}.")

    # Build the per-dimension strategy: a tensor_map entry of -1 yields 1, any other entry
    # indexes the reversed device matrix.
    layout_info = layout.to_dict()
    dim_mapping = layout_info["tensor_map"]
    reversed_device_matrix = layout_info["device_matrix"][::-1]
    in_strategy = tuple(1 if dim == -1 else reversed_device_matrix[dim] for dim in dim_mapping)

    reshard_prim = _get_cache_prim(P.Reshard)(in_layout=(layout,), out_layout=(layout,),
                                              in_strategy=(in_strategy,))
    return reshard_prim(tensor)
130
+
131
+
132
+ def _redistribute(tensor, dst_dtensor_info):
133
+ """
134
+ Redistribute the tensor from the source sharding strategy to the destination sharding strategy.
135
+
136
+ Args:
137
+ tensor (Tensor): The source tensor.
138
+ dst_dtensor_info (_DistributedTensorInfo): The destination sharding strategy.
139
+
140
+ Returns:
141
+ Tensor, value is same as the source tensor, but the sharding strategy is the destination sharding strategy.
142
+
143
+ Supported Platforms:
144
+ ``Ascend``
145
+
146
+ Examples:
147
+ .. note::
148
+ Before running the following examples, you need to configure the communication environment variables.
149
+
150
+ For Ascend/GPU/CPU devices, it is recommended to use the msrun startup method
151
+ without any third-party or configuration file dependencies.
152
+ Please see the `msrun start up
153
+ <https://www.mindspore.cn/tutorials/en/master/parallel/msrun_launcher.html>`_
154
+ for more details.
155
+
156
+ This example should be run with 2 devices.
157
+
158
+ >>> import numpy as np
159
+ >>> from mindspore.communication import init
160
+ >>> from mindspore import Tensor, Layout, _DistributedTensorInfo
161
+ >>>
162
+ >>> init()
163
+ >>> layout = Layout((2, 1), ("dp", "mp"))
164
+ >>> src_layout = layout("dp", "mp")
165
+ >>> distributed_info = _DistributedTensorInfo(src_layout)
166
+ >>> x = Tensor(np.ones([2, 2]).astype(np.float32))
167
+ >>> out = x.redistribute(distributed_info)
168
+ >>> print(out)
169
+ [[1. 1.]]
170
+ """
171
+ from mindspore.parallel._cell_wrapper import RedistributionCell, _insert_virtual_pp_dim
172
+ if not isinstance(dst_dtensor_info, _DistributedTensorInfo):
173
+ raise TypeError(
174
+ "dst_dtensor_info should be _DistributedTensorInfo type, but got {}".format(type(dst_dtensor_info)))
175
+ run_mode = context.get_context("mode")
176
+ context.set_context(mode=context.GRAPH_MODE)
177
+ og_auto_parallel_context, pp_config = _get_all_auto_parallel_context()
178
+ context.reset_auto_parallel_context()
179
+ tensor_data = tensor
180
+ all_reduce_data = False
181
+ # If src_pp_stages is less than or equal to dst_pp_stages, the parameters of each pp stage of src can be
182
+ # directly swapped to the corresponding card of dst
183
+ # rank0 01 11 01
184
+ # rank1 02 12 02
185
+ # pp1 ------> pp2
186
+ # rank2 03 13 11
187
+ # rank3 04 14 12
188
+ # if dtensor info is None, return the all 1 strategy as from dtensor info
189
+ if tensor._dtensor_info is None:
190
+ all_dev_num = get_group_size()
191
+ dev_mat = Layout((all_dev_num,), ("replica",))
192
+ tensor_map = ["None"] * len(tensor.shape)
193
+ layout = dev_mat(*tensor_map)
194
+ tensor._dtensor_info = _DistributedTensorInfo(layout)
195
+ src_layout_info = tensor._dtensor_info.layout.to_dict()
196
+ dst_layout_info = dst_dtensor_info.layout.to_dict()
197
+ if len(tensor._dtensor_info.layout.to_dict()["rank_list"]) < len(dst_dtensor_info.layout.to_dict()["rank_list"]):
198
+ # If src_pp_stages is greater than dst_pp_stages, the weights of the corresponding cards need to
199
+ # be communicated via AllReduce to swap. Need to communicate src rank0's 01 to src rank2,
200
+ # so that rank2 holds param0's data. Similarly, communicate rank1's 02 to rank3
201
+ # rank0 01 01 11
202
+ # rank1 02 02 12
203
+ # pp2 -------> pp1
204
+ # rank2 11 03 13
205
+ # rank3 12 04 14
206
+ from mindspore.parallel._cell_wrapper import CommTensorDataForPP
207
+ if get_rank() in dst_dtensor_info.layout.to_dict()["rank_list"]:
208
+ comm_tensor_cache_key = (
209
+ f"{src_layout_info['device_matrix']}, {src_layout_info['tensor_map']}, {src_layout_info['rank_list']}"
210
+ f" -> "
211
+ f"{dst_layout_info['device_matrix']}, {dst_layout_info['tensor_map']}, {dst_layout_info['rank_list']}")
212
+ global COMM_TENSOR_CELL_CACHE
213
+ if comm_tensor_cache_key not in COMM_TENSOR_CELL_CACHE:
214
+ comm_tensor_data_func = CommTensorDataForPP(tensor._dtensor_info, dst_dtensor_info)
215
+ COMM_TENSOR_CELL_CACHE[comm_tensor_cache_key] = comm_tensor_data_func
216
+ logger.debug(f"comm_tensor_cache_key is {comm_tensor_cache_key}, not match cache")
217
+ else:
218
+ comm_tensor_data_func = COMM_TENSOR_CELL_CACHE[comm_tensor_cache_key]
219
+ logger.debug(f"comm_tensor_cache_key is {comm_tensor_cache_key}, match cache")
220
+ if not comm_tensor_data_func._current_rank_has_data:
221
+ new_tensor_shape = tuple([tensor_data.shape[i] // tensor._dtensor_info.sharding_strategy[i]
222
+ for i in range(len(tensor.shape))])
223
+ tensor_data = comm_tensor_data_func.comm_data(ops.zeros(new_tensor_shape, tensor.dtype))
224
+ else:
225
+ tensor_data = comm_tensor_data_func.comm_data(tensor)
226
+ all_reduce_data = True
227
+ ms.communication.comm_func.barrier()
228
+ if src_layout_info['device_matrix'] == dst_layout_info['device_matrix'] and src_layout_info['tensor_map'] == \
229
+ dst_layout_info['tensor_map']:
230
+ return tensor_data
231
+ dataset_strategy = (_insert_virtual_pp_dim(tensor._dtensor_info.layout),)
232
+ if get_rank() not in tensor._dtensor_info.layout.to_dict()["rank_list"] and not all_reduce_data:
233
+ dataset_strategy = "full_batch"
234
+ context.set_auto_parallel_context(dataset_strategy=dataset_strategy,
235
+ parallel_mode="semi_auto_parallel", device_num=get_group_size())
236
+ global REDIST_CELL_CACHE
237
+ redist_cache_key = (f"{src_layout_info['device_matrix']}, {src_layout_info['tensor_map']} -> "
238
+ f"{dst_layout_info['device_matrix']}, {dst_layout_info['tensor_map']}")
239
+ if redist_cache_key in REDIST_CELL_CACHE.keys():
240
+ logger.debug(f"redist_cache_key is {redist_cache_key}, match cache")
241
+ redist_func = REDIST_CELL_CACHE[redist_cache_key]
242
+ else:
243
+ logger.debug(f"redist_cache_key is {redist_cache_key}, not match cache")
244
+ redist_func = RedistributionCell(tensor._dtensor_info.layout, dst_dtensor_info.layout)
245
+ REDIST_CELL_CACHE[redist_cache_key] = redist_func
246
+ redist_func.set_train(True)
247
+ redist_tensor_data = redist_func(tensor_data)
248
+ context.reset_auto_parallel_context()
249
+ _recover_auto_parallel_context(og_auto_parallel_context, pp_config)
250
+ context.set_context(mode=run_mode)
251
+ redist_tensor_data._dtensor_info = dst_dtensor_info
252
+ return redist_tensor_data
253
+
254
+
255
+ __all__ = [
256
+ 'reshard'
257
+ ]
258
+
259
+ __all__.sort()
@@ -0,0 +1,25 @@
1
+ # Copyright 2025 Huawei Technologies Co., Ltd
2
+ #
3
+ # Licensed under the Apache License, Version 2.0 (the "License");
4
+ # you may not use this file except in compliance with the License.
5
+ # You may obtain a copy of the License at
6
+ #
7
+ # http://www.apache.org/licenses/LICENSE-2.0
8
+ #
9
+ # Unless required by applicable law or agreed to in writing, software
10
+ # distributed under the License is distributed on an "AS IS" BASIS,
11
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
12
+ # See the License for the specific language governing permissions and
13
+ # limitations under the License.
14
+ # ============================================================================
15
+ """
16
+ Interfaces for parallel-related functionality
17
+ """
18
+ from __future__ import absolute_import
19
+
20
# Import both submodules by name so that the `__all__` aggregation below does not rely on the
# implicit bindings that the `from ... import ...` statements leave in the package namespace.
from mindspore.parallel.nn import parallel_grad_reducer
from mindspore.parallel.nn import parallel_cell_wrapper
from mindspore.parallel.nn.parallel_grad_reducer import PipelineGradReducer
from mindspore.parallel.nn.parallel_cell_wrapper import PipelineCell, Pipeline, MicroBatchInterleaved, GradAccumulation

__all__ = []
__all__.extend(parallel_grad_reducer.__all__)
__all__.extend(parallel_cell_wrapper.__all__)