mindspore 2.6.0rc1__cp310-cp310-win_amd64.whl → 2.7.0rc1__cp310-cp310-win_amd64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Potentially problematic release.


This version of mindspore might be problematic. (The original page links to more details here; the link target was not preserved in this text.)

Files changed (407)
  1. mindspore/.commit_id +1 -1
  2. mindspore/Microsoft.VisualStudio.Telemetry.dll +0 -0
  3. mindspore/Newtonsoft.Json.dll +0 -0
  4. mindspore/__init__.py +1 -1
  5. mindspore/_c_dataengine.cp310-win_amd64.pyd +0 -0
  6. mindspore/_c_expression.cp310-win_amd64.pyd +0 -0
  7. mindspore/_c_mindrecord.cp310-win_amd64.pyd +0 -0
  8. mindspore/_checkparam.py +40 -9
  9. mindspore/{_deprecated → _extends/optimize}/__init__.py +9 -3
  10. mindspore/_extends/optimize/cell_utils.py +96 -0
  11. mindspore/_extends/parse/__init__.py +2 -2
  12. mindspore/_extends/parse/compile_config.py +44 -22
  13. mindspore/_extends/parse/deprecated/deprecated_tensor_method.py +1 -1
  14. mindspore/_extends/parse/parser.py +37 -62
  15. mindspore/_extends/parse/resources.py +39 -0
  16. mindspore/_extends/parse/standard_method.py +43 -13
  17. mindspore/_extends/parse/trope.py +8 -1
  18. mindspore/_extends/pijit/__init__.py +1 -2
  19. mindspore/amp.py +4 -4
  20. mindspore/atlprov.dll +0 -0
  21. mindspore/avcodec-59.dll +0 -0
  22. mindspore/avdevice-59.dll +0 -0
  23. mindspore/avfilter-8.dll +0 -0
  24. mindspore/avformat-59.dll +0 -0
  25. mindspore/avutil-57.dll +0 -0
  26. mindspore/boost/adasum.py +1 -1
  27. mindspore/boost/boost_cell_wrapper.py +4 -4
  28. mindspore/c1.dll +0 -0
  29. mindspore/c1xx.dll +0 -0
  30. mindspore/c2.dll +0 -0
  31. mindspore/common/__init__.py +27 -2
  32. mindspore/common/_grad_function.py +2 -1
  33. mindspore/common/_pijit_context.py +28 -7
  34. mindspore/common/_stub_tensor.py +1 -209
  35. mindspore/common/_tensor_cpp_method.py +1 -1
  36. mindspore/common/_tensor_docs.py +77 -16
  37. mindspore/common/api.py +238 -113
  38. mindspore/common/dtype.py +21 -11
  39. mindspore/common/dump.py +10 -15
  40. mindspore/common/generator.py +5 -3
  41. mindspore/common/hook_handle.py +11 -2
  42. mindspore/common/jit_config.py +1 -1
  43. mindspore/common/jit_trace.py +84 -105
  44. mindspore/common/parameter.py +26 -12
  45. mindspore/common/recompute.py +3 -3
  46. mindspore/common/sparse_tensor.py +0 -3
  47. mindspore/common/symbol.py +0 -1
  48. mindspore/common/tensor.py +81 -81
  49. mindspore/communication/_comm_helper.py +46 -4
  50. mindspore/communication/management.py +79 -7
  51. mindspore/context.py +58 -40
  52. mindspore/dataset/core/config.py +3 -3
  53. mindspore/dataset/engine/datasets.py +20 -7
  54. mindspore/dataset/engine/datasets_user_defined.py +33 -3
  55. mindspore/dataset/engine/iterators.py +2 -2
  56. mindspore/dataset/engine/obs/config_loader.py +2 -2
  57. mindspore/dataset/engine/obs/obs_mindrecord_dataset.py +8 -0
  58. mindspore/dataset/transforms/py_transforms.py +7 -3
  59. mindspore/dataset/transforms/transforms.py +7 -3
  60. mindspore/dataset/vision/validators.py +1 -0
  61. mindspore/device_context/ascend/device.py +1 -1
  62. mindspore/device_context/gpu/__init__.py +2 -2
  63. mindspore/device_context/gpu/device.py +1 -1
  64. mindspore/device_context/gpu/op_precision.py +4 -2
  65. mindspore/device_context/gpu/op_tuning.py +6 -3
  66. mindspore/device_manager.py +16 -9
  67. mindspore/dnnl.dll +0 -0
  68. mindspore/dpcmi.dll +0 -0
  69. mindspore/experimental/llm_boost/ascend_native/llama_boost_ascend_native.py +3 -7
  70. mindspore/experimental/llm_boost/atb/boost_base.py +2 -3
  71. mindspore/experimental/optim/adadelta.py +13 -20
  72. mindspore/experimental/optim/adagrad.py +15 -22
  73. mindspore/experimental/optim/adam.py +17 -24
  74. mindspore/experimental/optim/adamax.py +14 -22
  75. mindspore/experimental/optim/adamw.py +28 -34
  76. mindspore/experimental/optim/asgd.py +15 -25
  77. mindspore/experimental/optim/lr_scheduler.py +27 -45
  78. mindspore/experimental/optim/nadam.py +14 -24
  79. mindspore/experimental/optim/optimizer.py +13 -23
  80. mindspore/experimental/optim/radam.py +18 -24
  81. mindspore/experimental/optim/rmsprop.py +14 -25
  82. mindspore/experimental/optim/rprop.py +15 -26
  83. mindspore/experimental/optim/sgd.py +9 -19
  84. mindspore/hal/__init__.py +4 -4
  85. mindspore/hal/contiguous_tensors_handle.py +2 -2
  86. mindspore/hal/memory.py +27 -7
  87. mindspore/include/api/cell.h +37 -1
  88. mindspore/include/api/delegate.h +10 -0
  89. mindspore/include/api/model.h +3 -0
  90. mindspore/include/api/types.h +2 -2
  91. mindspore/include/c_api/model_c.h +0 -58
  92. mindspore/include/c_api/tensor_c.h +0 -26
  93. mindspore/include/dataset/vision_ascend.h +1 -1
  94. mindspore/jpeg62.dll +0 -0
  95. mindspore/mindrecord/tools/cifar10.py +60 -11
  96. mindspore/mindrecord/tools/cifar10_to_mr.py +5 -0
  97. mindspore/mindspore_backend_common.dll +0 -0
  98. mindspore/mindspore_backend_manager.dll +0 -0
  99. mindspore/mindspore_common.dll +0 -0
  100. mindspore/mindspore_core.dll +0 -0
  101. mindspore/mindspore_cpu_res_manager.dll +0 -0
  102. mindspore/mindspore_dump.dll +0 -0
  103. mindspore/mindspore_frontend.dll +0 -0
  104. mindspore/mindspore_glog.dll +0 -0
  105. mindspore/mindspore_memory_pool.dll +0 -0
  106. mindspore/mindspore_ms_backend.dll +0 -0
  107. mindspore/mindspore_ops.dll +0 -0
  108. mindspore/mindspore_ops_host.dll +0 -0
  109. mindspore/mindspore_ops_kernel_common.dll +0 -0
  110. mindspore/mindspore_profiler.dll +0 -0
  111. mindspore/mindspore_pyboost.dll +0 -0
  112. mindspore/mindspore_pynative.dll +0 -0
  113. mindspore/mindspore_res_manager.dll +0 -0
  114. mindspore/mindspore_runtime_pipeline.dll +0 -0
  115. mindspore/mint/__init__.py +6 -46
  116. mindspore/mint/distributed/__init__.py +1 -0
  117. mindspore/mint/distributed/distributed.py +212 -9
  118. mindspore/mint/nn/__init__.py +1 -1
  119. mindspore/mint/nn/functional.py +53 -6
  120. mindspore/mint/nn/layer/_functions.py +164 -294
  121. mindspore/mint/nn/layer/activation.py +8 -6
  122. mindspore/mint/nn/layer/conv.py +137 -101
  123. mindspore/mint/nn/layer/normalization.py +8 -22
  124. mindspore/mint/optim/adam.py +19 -18
  125. mindspore/mint/optim/adamw.py +14 -8
  126. mindspore/mint/optim/sgd.py +5 -5
  127. mindspore/msobj140.dll +0 -0
  128. mindspore/mspdb140.dll +0 -0
  129. mindspore/mspdbcore.dll +0 -0
  130. mindspore/mspdbst.dll +0 -0
  131. mindspore/mspft140.dll +0 -0
  132. mindspore/msvcdis140.dll +0 -0
  133. mindspore/msvcp140_1.dll +0 -0
  134. mindspore/msvcp140_2.dll +0 -0
  135. mindspore/msvcp140_atomic_wait.dll +0 -0
  136. mindspore/msvcp140_codecvt_ids.dll +0 -0
  137. mindspore/nn/cell.py +328 -502
  138. mindspore/nn/grad/cell_grad.py +11 -12
  139. mindspore/nn/layer/activation.py +32 -34
  140. mindspore/nn/layer/basic.py +67 -64
  141. mindspore/nn/layer/channel_shuffle.py +4 -4
  142. mindspore/nn/layer/combined.py +4 -2
  143. mindspore/nn/layer/conv.py +117 -110
  144. mindspore/nn/layer/dense.py +9 -7
  145. mindspore/nn/layer/embedding.py +50 -52
  146. mindspore/nn/layer/image.py +37 -39
  147. mindspore/nn/layer/math.py +111 -112
  148. mindspore/nn/layer/normalization.py +56 -44
  149. mindspore/nn/layer/pooling.py +58 -63
  150. mindspore/nn/layer/rnn_cells.py +33 -33
  151. mindspore/nn/layer/rnns.py +56 -56
  152. mindspore/nn/layer/thor_layer.py +74 -73
  153. mindspore/nn/layer/transformer.py +11 -1
  154. mindspore/nn/learning_rate_schedule.py +20 -20
  155. mindspore/nn/loss/loss.py +79 -81
  156. mindspore/nn/optim/adam.py +3 -3
  157. mindspore/nn/optim/adasum.py +2 -2
  158. mindspore/nn/optim/asgd.py +2 -0
  159. mindspore/nn/optim/optimizer.py +1 -1
  160. mindspore/nn/optim/thor.py +2 -2
  161. mindspore/nn/probability/distribution/exponential.py +2 -1
  162. mindspore/nn/probability/distribution/poisson.py +2 -1
  163. mindspore/nn/sparse/sparse.py +3 -3
  164. mindspore/nn/wrap/cell_wrapper.py +34 -37
  165. mindspore/nn/wrap/grad_reducer.py +37 -37
  166. mindspore/nn/wrap/loss_scale.py +72 -74
  167. mindspore/numpy/array_creations.py +5 -5
  168. mindspore/numpy/fft.py +1 -1
  169. mindspore/numpy/math_ops.py +5 -5
  170. mindspore/opencv_core452.dll +0 -0
  171. mindspore/opencv_imgcodecs452.dll +0 -0
  172. mindspore/opencv_imgproc452.dll +0 -0
  173. mindspore/ops/_grad_experimental/grad_comm_ops.py +51 -13
  174. mindspore/ops/_grad_experimental/grad_debug_ops.py +14 -0
  175. mindspore/ops/_vmap/vmap_array_ops.py +31 -13
  176. mindspore/ops/_vmap/vmap_nn_ops.py +8 -16
  177. mindspore/ops/auto_generate/cpp_create_prim_instance_helper.py +42 -11
  178. mindspore/ops/auto_generate/gen_extend_func.py +23 -141
  179. mindspore/ops/auto_generate/gen_ops_def.py +727 -321
  180. mindspore/ops/auto_generate/gen_ops_prim.py +1721 -984
  181. mindspore/ops/auto_generate/pyboost_inner_prim.py +31 -1
  182. mindspore/ops/composite/__init__.py +10 -0
  183. mindspore/ops/composite/base.py +8 -4
  184. mindspore/ops/composite/multitype_ops/__init__.py +12 -1
  185. mindspore/ops/composite/multitype_ops/_compile_utils.py +133 -109
  186. mindspore/ops/composite/multitype_ops/add_impl.py +70 -2
  187. mindspore/ops/composite/multitype_ops/div_impl.py +49 -0
  188. mindspore/ops/composite/multitype_ops/floordiv_impl.py +29 -0
  189. mindspore/ops/composite/multitype_ops/getitem_impl.py +11 -0
  190. mindspore/ops/composite/multitype_ops/mod_impl.py +5 -3
  191. mindspore/ops/composite/multitype_ops/mul_impl.py +49 -0
  192. mindspore/ops/composite/multitype_ops/setitem_impl.py +57 -0
  193. mindspore/ops/composite/multitype_ops/sub_impl.py +34 -0
  194. mindspore/ops/composite/multitype_ops/zeros_like_impl.py +14 -0
  195. mindspore/ops/function/__init__.py +3 -1
  196. mindspore/ops/function/_add_attr_func.py +11 -6
  197. mindspore/ops/function/array_func.py +9 -96
  198. mindspore/ops/function/debug_func.py +4 -3
  199. mindspore/ops/function/grad/grad_func.py +1 -1
  200. mindspore/ops/function/math_func.py +33 -540
  201. mindspore/ops/function/nn_func.py +28 -74
  202. mindspore/ops/function/other_func.py +4 -1
  203. mindspore/ops/function/random_func.py +44 -5
  204. mindspore/ops/function/vmap_func.py +2 -1
  205. mindspore/ops/functional.py +2 -3
  206. mindspore/ops/functional_overload.py +571 -6
  207. mindspore/ops/op_info_register.py +21 -0
  208. mindspore/ops/operations/__init__.py +16 -11
  209. mindspore/ops/operations/_custom_ops_utils.py +689 -34
  210. mindspore/ops/operations/_inner_ops.py +3 -6
  211. mindspore/ops/operations/_sequence_ops.py +1 -1
  212. mindspore/ops/operations/array_ops.py +2 -2
  213. mindspore/ops/operations/comm_ops.py +185 -26
  214. mindspore/ops/operations/custom_ops.py +294 -174
  215. mindspore/ops/operations/debug_ops.py +59 -4
  216. mindspore/ops/operations/image_ops.py +13 -13
  217. mindspore/ops/operations/manually_defined/ops_def.py +15 -16
  218. mindspore/ops/operations/math_ops.py +3 -4
  219. mindspore/ops/operations/nn_ops.py +7 -39
  220. mindspore/ops/primitive.py +6 -10
  221. mindspore/ops/tensor_method.py +47 -8
  222. mindspore/ops_generate/api/cpp_create_prim_instance_helper_generator.py +1 -1
  223. mindspore/ops_generate/api/functional_map_cpp_generator.py +10 -9
  224. mindspore/ops_generate/api/functions_cc_generator.py +58 -10
  225. mindspore/ops_generate/api/tensor_func_reg_cpp_generator.py +1 -1
  226. mindspore/ops_generate/common/base_generator.py +14 -0
  227. mindspore/ops_generate/common/gen_constants.py +8 -3
  228. mindspore/ops_generate/common/gen_utils.py +0 -19
  229. mindspore/ops_generate/common/op_proto.py +11 -4
  230. mindspore/ops_generate/common/template.py +88 -11
  231. mindspore/ops_generate/gen_ops.py +1 -1
  232. mindspore/ops_generate/op_def/lite_ops_cpp_generator.py +4 -4
  233. mindspore/ops_generate/op_def/ops_def_cc_generator.py +0 -3
  234. mindspore/ops_generate/op_def/ops_name_h_generator.py +0 -3
  235. mindspore/ops_generate/op_def/ops_primitive_h_generator.py +0 -4
  236. mindspore/ops_generate/op_def_py/op_prim_py_generator.py +5 -2
  237. mindspore/ops_generate/pyboost/auto_grad_impl_cc_generator.py +49 -8
  238. mindspore/ops_generate/pyboost/auto_grad_reg_cc_generator.py +2 -2
  239. mindspore/ops_generate/pyboost/gen_pyboost_func.py +31 -0
  240. mindspore/ops_generate/pyboost/op_template_parser.py +98 -72
  241. mindspore/ops_generate/pyboost/pyboost_functions_cpp_generator.py +70 -273
  242. mindspore/ops_generate/pyboost/pyboost_functions_h_generator.py +14 -6
  243. mindspore/ops_generate/pyboost/pyboost_functions_impl_cpp_generator.py +316 -0
  244. mindspore/ops_generate/pyboost/pyboost_functions_py_generator.py +1 -1
  245. mindspore/ops_generate/pyboost/pyboost_grad_function_cpp_generator.py +5 -3
  246. mindspore/ops_generate/pyboost/pyboost_inner_prim_generator.py +1 -1
  247. mindspore/ops_generate/pyboost/pyboost_internal_functions_cpp_generator.py +76 -0
  248. mindspore/ops_generate/pyboost/pyboost_internal_functions_h_generator.py +76 -0
  249. mindspore/ops_generate/pyboost/pyboost_internal_kernel_info_adapter_generator.py +125 -0
  250. mindspore/ops_generate/pyboost/pyboost_native_grad_functions_generator.py +4 -3
  251. mindspore/ops_generate/pyboost/pyboost_op_cpp_code_generator.py +348 -61
  252. mindspore/ops_generate/pyboost/pyboost_overload_functions_cpp_generator.py +1 -1
  253. mindspore/ops_generate/pyboost/pyboost_utils.py +118 -9
  254. mindspore/ops_generate/tensor_py_cc_generator.py +1 -24
  255. mindspore/parallel/_auto_parallel_context.py +11 -8
  256. mindspore/parallel/_cell_wrapper.py +113 -45
  257. mindspore/parallel/_parallel_serialization.py +1 -1
  258. mindspore/parallel/_ps_context.py +4 -6
  259. mindspore/parallel/_tensor.py +167 -12
  260. mindspore/parallel/_transformer/moe.py +1 -1
  261. mindspore/parallel/_transformer/transformer.py +13 -8
  262. mindspore/parallel/auto_parallel.py +14 -7
  263. mindspore/parallel/checkpoint_convert.py +3 -3
  264. mindspore/parallel/checkpoint_transform.py +11 -7
  265. mindspore/parallel/cluster/process_entity/_api.py +84 -48
  266. mindspore/parallel/cluster/process_entity/_utils.py +95 -7
  267. mindspore/parallel/cluster/run.py +43 -4
  268. mindspore/parallel/function/__init__.py +8 -1
  269. mindspore/parallel/function/reshard_func.py +6 -7
  270. mindspore/parallel/nn/__init__.py +15 -2
  271. mindspore/parallel/nn/parallel_cell_wrapper.py +9 -10
  272. mindspore/parallel/nn/parallel_grad_reducer.py +7 -6
  273. mindspore/parallel/shard.py +3 -4
  274. mindspore/parallel/transform_safetensors.py +463 -174
  275. mindspore/pgodb140.dll +0 -0
  276. mindspore/pgort140.dll +0 -0
  277. mindspore/profiler/__init__.py +2 -1
  278. mindspore/profiler/analysis/parser/timeline_assembly_factory/ascend_timeline_assembler.py +7 -7
  279. mindspore/profiler/analysis/parser/timeline_assembly_factory/base_timeline_assembler.py +3 -0
  280. mindspore/profiler/analysis/parser/timeline_assembly_factory/trace_view_container.py +12 -6
  281. mindspore/profiler/analysis/parser/timeline_creator/cpu_op_timeline_creator.py +3 -3
  282. mindspore/profiler/analysis/parser/timeline_creator/fwk_timeline_creator.py +3 -3
  283. mindspore/profiler/analysis/parser/timeline_creator/msprof_timeline_creator.py +4 -4
  284. mindspore/profiler/analysis/parser/timeline_creator/scope_layer_timeline_creator.py +3 -3
  285. mindspore/profiler/analysis/parser/timeline_event/fwk_event.py +4 -1
  286. mindspore/profiler/analysis/parser/timeline_event/timeline_event_pool.py +2 -1
  287. mindspore/profiler/analysis/task_manager.py +1 -1
  288. mindspore/profiler/analysis/viewer/ascend_communication_viewer.py +5 -1
  289. mindspore/profiler/analysis/viewer/ascend_integrate_viewer.py +2 -1
  290. mindspore/profiler/analysis/viewer/ascend_op_memory_viewer.py +42 -22
  291. mindspore/profiler/analysis/viewer/ascend_step_trace_time_viewer.py +3 -2
  292. mindspore/profiler/analysis/viewer/ms_minddata_viewer.py +9 -5
  293. mindspore/profiler/analysis/viewer/ms_operator_details_viewer.py +132 -0
  294. mindspore/profiler/common/constant.py +16 -0
  295. mindspore/profiler/common/profiler_context.py +25 -27
  296. mindspore/profiler/common/profiler_info.py +0 -16
  297. mindspore/profiler/common/profiler_op_analyse.py +235 -0
  298. mindspore/profiler/common/profiler_output_path.py +23 -8
  299. mindspore/profiler/common/profiler_parameters.py +128 -35
  300. mindspore/profiler/dynamic_profile/__init__.py +0 -0
  301. mindspore/profiler/dynamic_profile/dynamic_monitor_proxy.py +39 -0
  302. mindspore/profiler/dynamic_profile/dynamic_profiler_config_context.py +666 -0
  303. mindspore/profiler/dynamic_profile/dynamic_profiler_utils.py +62 -0
  304. mindspore/profiler/dynamic_profiler.py +305 -314
  305. mindspore/profiler/envprofiler.py +12 -7
  306. mindspore/profiler/experimental_config.py +96 -6
  307. mindspore/profiler/mstx.py +33 -12
  308. mindspore/profiler/platform/__init__.py +2 -3
  309. mindspore/profiler/platform/npu_profiler.py +29 -19
  310. mindspore/profiler/profiler.py +35 -19
  311. mindspore/profiler/profiler_action_controller.py +64 -76
  312. mindspore/profiler/schedule.py +10 -4
  313. mindspore/rewrite/common/config.py +1 -0
  314. mindspore/rewrite/common/namer.py +1 -0
  315. mindspore/rewrite/common/namespace.py +1 -0
  316. mindspore/rewrite/node/node.py +31 -11
  317. mindspore/rewrite/parsers/assign_parser.py +1 -1
  318. mindspore/rewrite/symbol_tree/symbol_tree.py +1 -1
  319. mindspore/run_check/_check_version.py +7 -10
  320. mindspore/runtime/__init__.py +5 -5
  321. mindspore/runtime/event.py +10 -4
  322. mindspore/runtime/executor.py +60 -45
  323. mindspore/runtime/memory.py +30 -32
  324. mindspore/runtime/thread_bind_core.py +298 -164
  325. mindspore/safeguard/rewrite_obfuscation.py +12 -13
  326. mindspore/swresample-4.dll +0 -0
  327. mindspore/swscale-6.dll +0 -0
  328. mindspore/tbbmalloc.dll +0 -0
  329. mindspore/tinyxml2.dll +0 -0
  330. mindspore/train/_utils.py +14 -4
  331. mindspore/train/amp.py +43 -20
  332. mindspore/train/callback/__init__.py +5 -5
  333. mindspore/train/callback/_checkpoint.py +3 -6
  334. mindspore/train/callback/_flops_collector.py +1 -1
  335. mindspore/train/callback/_landscape.py +0 -1
  336. mindspore/train/callback/_train_fault_tolerance.py +97 -16
  337. mindspore/train/data_sink.py +11 -2
  338. mindspore/train/dataset_helper.py +9 -0
  339. mindspore/train/model.py +135 -55
  340. mindspore/train/serialization.py +133 -111
  341. mindspore/train/summary/summary_record.py +13 -2
  342. mindspore/turbojpeg.dll +0 -0
  343. mindspore/utils/__init__.py +3 -2
  344. mindspore/utils/dryrun.py +0 -6
  345. mindspore/utils/runtime_execution_order_check.py +163 -77
  346. mindspore/utils/sdc_detect.py +68 -0
  347. mindspore/utils/utils.py +6 -9
  348. mindspore/vcmeta.dll +0 -0
  349. mindspore/vcruntime140.dll +0 -0
  350. mindspore/vcruntime140_1.dll +0 -0
  351. mindspore/version.py +1 -1
  352. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0rc1.dist-info}/METADATA +5 -4
  353. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0rc1.dist-info}/RECORD +356 -394
  354. mindspore/_deprecated/jit.py +0 -198
  355. mindspore/experimental/es/__init__.py +0 -22
  356. mindspore/experimental/es/embedding_service.py +0 -891
  357. mindspore/experimental/es/embedding_service_layer.py +0 -581
  358. mindspore/profiler/parser/__init__.py +0 -14
  359. mindspore/profiler/parser/aicpu_data_parser.py +0 -272
  360. mindspore/profiler/parser/ascend_analysis/__init__.py +0 -14
  361. mindspore/profiler/parser/ascend_analysis/constant.py +0 -71
  362. mindspore/profiler/parser/ascend_analysis/file_manager.py +0 -180
  363. mindspore/profiler/parser/ascend_analysis/function_event.py +0 -185
  364. mindspore/profiler/parser/ascend_analysis/fwk_cann_parser.py +0 -136
  365. mindspore/profiler/parser/ascend_analysis/fwk_file_parser.py +0 -131
  366. mindspore/profiler/parser/ascend_analysis/msprof_timeline_parser.py +0 -104
  367. mindspore/profiler/parser/ascend_analysis/path_manager.py +0 -313
  368. mindspore/profiler/parser/ascend_analysis/profiler_info_parser.py +0 -123
  369. mindspore/profiler/parser/ascend_analysis/tlv_decoder.py +0 -86
  370. mindspore/profiler/parser/ascend_analysis/trace_event_manager.py +0 -75
  371. mindspore/profiler/parser/ascend_cluster_generator.py +0 -116
  372. mindspore/profiler/parser/ascend_communicate_generator.py +0 -314
  373. mindspore/profiler/parser/ascend_flops_generator.py +0 -116
  374. mindspore/profiler/parser/ascend_fpbp_generator.py +0 -82
  375. mindspore/profiler/parser/ascend_hccl_generator.py +0 -271
  376. mindspore/profiler/parser/ascend_integrate_generator.py +0 -42
  377. mindspore/profiler/parser/ascend_memory_generator.py +0 -185
  378. mindspore/profiler/parser/ascend_msprof_exporter.py +0 -282
  379. mindspore/profiler/parser/ascend_msprof_generator.py +0 -187
  380. mindspore/profiler/parser/ascend_op_generator.py +0 -334
  381. mindspore/profiler/parser/ascend_steptrace_generator.py +0 -94
  382. mindspore/profiler/parser/ascend_timeline_generator.py +0 -545
  383. mindspore/profiler/parser/base_timeline_generator.py +0 -483
  384. mindspore/profiler/parser/container.py +0 -229
  385. mindspore/profiler/parser/cpu_gpu_timeline_generator.py +0 -697
  386. mindspore/profiler/parser/flops_parser.py +0 -531
  387. mindspore/profiler/parser/framework_enum.py +0 -111
  388. mindspore/profiler/parser/framework_parser.py +0 -464
  389. mindspore/profiler/parser/framework_struct.py +0 -61
  390. mindspore/profiler/parser/gpu_analysis/__init__.py +0 -14
  391. mindspore/profiler/parser/gpu_analysis/function_event.py +0 -44
  392. mindspore/profiler/parser/gpu_analysis/fwk_file_parser.py +0 -89
  393. mindspore/profiler/parser/gpu_analysis/profiler_info_parser.py +0 -72
  394. mindspore/profiler/parser/hccl_parser.py +0 -573
  395. mindspore/profiler/parser/hwts_log_parser.py +0 -122
  396. mindspore/profiler/parser/integrator.py +0 -526
  397. mindspore/profiler/parser/memory_usage_parser.py +0 -277
  398. mindspore/profiler/parser/minddata_analyzer.py +0 -800
  399. mindspore/profiler/parser/minddata_parser.py +0 -186
  400. mindspore/profiler/parser/minddata_pipeline_parser.py +0 -299
  401. mindspore/profiler/parser/op_intermediate_parser.py +0 -149
  402. mindspore/profiler/parser/optime_parser.py +0 -250
  403. mindspore/profiler/parser/profiler_info.py +0 -213
  404. mindspore/profiler/parser/step_trace_parser.py +0 -666
  405. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0rc1.dist-info}/WHEEL +0 -0
  406. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0rc1.dist-info}/entry_points.txt +0 -0
  407. {mindspore-2.6.0rc1.dist-info → mindspore-2.7.0rc1.dist-info}/top_level.txt +0 -0
mindspore/train/model.py CHANGED
@@ -57,8 +57,10 @@ from mindspore.dataset.engine.datasets import _set_training_dataset, _reset_trai
57
57
  from mindspore.train import amp
58
58
  from mindspore._c_expression import _framework_profiler_step_start, _framework_profiler_step_end
59
59
  from mindspore._c_expression import _get_optimzer_timestamps
60
+ from mindspore._c_expression import clean_tdt_channel, _clean_rootinfo
60
61
 
61
62
  from mindspore.parallel._utils import _init_auto_parallel_context, _clear_auto_parallel_context
63
+ from .serialization import load_param_into_net
62
64
 
63
65
  def _transfer_tensor_to_tuple(inputs):
64
66
  """
@@ -130,7 +132,8 @@ def _handle_exception_info(obj, uce_env, tft, e):
130
132
  if not uce_env:
131
133
  logger.error("uce wrapper caught RuntimeError but uce not enable, enter MindIO TTP process.",
132
134
  exc_info=True)
133
- tft.tft_report_error(tft.ReportState.RS_UNKNOWN.value)
135
+ if tft:
136
+ tft.tft_report_error(tft.ReportState.RS_UNKNOWN.value)
134
137
  raise e
135
138
  e_str = str(e)
136
139
  logger.warning("uce wrapper caught RuntimeError e_str:{}".format(e_str))
@@ -151,6 +154,13 @@ def _handle_exception_info(obj, uce_env, tft, e):
151
154
  tft.tft_report_error(tft.ReportState.RS_UNKNOWN.value)
152
155
  raise e
153
156
  tft.tft_report_error(tft.ReportState.RS_UCE.value)
157
+ elif "HCCEError" in e_str:
158
+ logger.warning("uce wrapper caught HCCEError")
159
+ if obj.stop_been_called:
160
+ logger.warning("Received HCCEError after force stop been called, so report force stopped error to MindIO.")
161
+ tft.tft_report_error(tft.ReportState.RS_NORMAL.value)
162
+ else:
163
+ tft.tft_report_error(tft.ReportState.RS_HCCL_FAILED.value)
154
164
  elif "ForceStopError" in e_str:
155
165
  logger.warning("uce wrapper caught RuntimeError ForceStopError")
156
166
  force_stop_err = tft.ReportState.RS_NORMAL.value
@@ -165,6 +175,69 @@ def _handle_exception_info(obj, uce_env, tft, e):
165
175
  raise e
166
176
 
167
177
 
178
+ def _handle_training_result_error(model, tft_obj):
179
+ """
180
+ Handle training result error for resuming training.
181
+ """
182
+ ckpt_load_fn = tft_obj.ckpt_load_func
183
+ train_network = tft_obj.cb_params.train_network
184
+ logger.warning("Process training result error start.")
185
+ # 1. Clear tdt channel
186
+ logger.warning("Clean tdt channel.")
187
+ clean_tdt_channel()
188
+
189
+ # 2. Load checkpoint
190
+ logger.warning("Load checkpoint.")
191
+ new_param_dict, remove_redundancy = ckpt_load_fn()
192
+ param_not_load, ckpt_not_load = load_param_into_net(train_network, new_param_dict, True, remove_redundancy)
193
+ logger.warning(f"param_not_load: {param_not_load}")
194
+ logger.warning(f"ckpt_not_load: {ckpt_not_load}")
195
+ resume_epoch = new_param_dict.get('epoch_num')
196
+ resume_step = new_param_dict.get('step_num')
197
+ model._initial_step = int(resume_step.asnumpy())
198
+ logger.warning("Process training result error end.")
199
+ return (resume_epoch, resume_step)
200
+
201
+
202
+ def _calc_cb_initial_step(org_epoch, org_step, *args, **kwargs):
203
+ """calculate initial step for callback"""
204
+ train_dataset = args[1]
205
+ dataset_sink_mode = args[3] if len(args) > 3 else kwargs.get('dataset_sink_mode', True)
206
+ sink_size = args[4] if len(args) > 4 else kwargs.get('sink_size', -1)
207
+
208
+ cb_initial_step = 0
209
+ if dataset_sink_mode:
210
+ train_dataset.set_init_step(org_epoch)
211
+ dataset_size = train_dataset.get_dataset_size()
212
+ if sink_size != -1:
213
+ cb_initial_step = org_epoch * sink_size + org_step
214
+ else:
215
+ cb_initial_step = org_epoch * dataset_size + org_step
216
+ else:
217
+ train_dataset.set_init_step(org_step)
218
+ cb_initial_step = org_step
219
+ if hasattr(train_dataset, '_dataset_helper'):
220
+ dataset_helper = train_dataset._dataset_helper
221
+ _reset_training_dataset(cb_initial_step, dataset_helper.iter.dataset.get_dataset_size())
222
+ return cb_initial_step
223
+
224
+
225
+ def _update_ckpt_callback_info(resume_train_step, **kwargs):
226
+ """
227
+ Update checkpoint callback internal state
228
+ """
229
+ ckpt_obj = None
230
+ if kwargs.get('callbacks') and isinstance(kwargs.get('callbacks'), ModelCheckpoint):
231
+ ckpt_obj = kwargs.get('callbacks')
232
+ if kwargs.get('callbacks') and isinstance(kwargs.get('callbacks'), list):
233
+ for item in kwargs.get('callbacks'):
234
+ if isinstance(item, ModelCheckpoint):
235
+ ckpt_obj = item
236
+ if ckpt_obj is not None:
237
+ ckpt_obj._last_triggered_step = 0
238
+ ckpt_obj._append_step_num = resume_train_step
239
+
240
+
168
241
  def _handle_tft(func):
169
242
  """
170
243
  Decorator function, which starts uce handle process when an exception occurs during training.
@@ -180,42 +253,35 @@ def _handle_tft(func):
180
253
  if isinstance(item, TrainFaultTolerance):
181
254
  obj = item
182
255
  if obj:
183
- tft = obj.tft
184
256
  tft_env = os.getenv("MS_ENABLE_TFT", "")
185
- uce_env = "UCE:1" in tft_env or "ARF:1" in tft_env
257
+ uce_env = "UCE:1" in tft_env or "ARF:1" in tft_env or "HCCE:1" in tft_env
258
+ tre_env = "TRE:1" in tft_env
186
259
  while True:
187
260
  try:
188
261
  return func(self, *args, **kwargs)
189
262
  except RuntimeError as e:
190
- _handle_exception_info(obj, uce_env, tft, e)
191
- ret = tft.tft_wait_next_action()
192
- if ret == tft.Action.EXIT.value:
193
- raise e
194
- repair_step = tft.tft_get_repair_step()
195
- logger.warning(
196
- "uce wrapper caught repair finish REPAIR STEP: {} batch_num:{}".format(repair_step,
197
- self.batch_num))
263
+ if tre_env and 'TREError' in str(e):
264
+ _, resume_step = _handle_training_result_error(self, obj)
265
+ repair_step = int(resume_step.asnumpy())
266
+ _update_ckpt_callback_info(repair_step, **kwargs)
267
+ logger.warning(f'Resume training after TREError from step {repair_step}.')
268
+ else:
269
+ _handle_exception_info(obj, uce_env, obj.tft, e)
270
+ ret = obj.tft.tft_wait_next_action()
271
+ if ret == obj.tft.Action.EXIT.value:
272
+ raise e
273
+ obj.stop_been_called = False
274
+ repair_step = obj.tft.tft_get_repair_step()
275
+ logger.warning(
276
+ "uce wrapper caught repair finish REPAIR STEP: {} batch_num:{}".format(repair_step,
277
+ self.batch_num))
198
278
  initial_epoch = int(repair_step / self.batch_num)
199
279
  initial_step = repair_step % self.batch_num
200
280
  kwargs["initial_epoch"] = initial_epoch
201
-
202
- train_dataset = args[1]
203
- dataset_sink_mode = args[3] if len(args) > 3 else kwargs.get('dataset_sink_mode', True)
204
- sink_size = args[4] if len(args) > 4 else kwargs.get('sink_size', -1)
205
-
206
- cb_initial_step = 0
207
- if dataset_sink_mode:
208
- train_dataset.set_init_step(initial_epoch)
209
- dataset_size = train_dataset.get_dataset_size()
210
- if sink_size != -1:
211
- cb_initial_step = initial_epoch * sink_size + initial_step
212
- else:
213
- cb_initial_step = initial_epoch * dataset_size + initial_step
214
- else:
215
- train_dataset.set_init_step(initial_step)
216
- cb_initial_step = initial_step
217
-
218
- kwargs["initial_step"] = cb_initial_step
281
+ cb_initial_step = _calc_cb_initial_step(initial_epoch, initial_step, *args, **kwargs)
282
+ if not self.enable_tre:
283
+ kwargs["initial_step"] = cb_initial_step
284
+ self._initial_step = 0
219
285
  # reset all accu grads to zero
220
286
  obj._reset_acc_grads()
221
287
  logger.warning(
@@ -223,8 +289,9 @@ def _handle_tft(func):
223
289
  cb_initial_step))
224
290
  continue
225
291
  except BaseException as e:
226
- logger.error("uce wrapper caught BaseException error, enter MindIO TTP process.", exc_info=True)
227
- tft.tft_report_error(tft.ReportState.RS_UNKNOWN.value)
292
+ if obj.tft:
293
+ logger.error("uce wrapper caught BaseException error, enter MindIO TTP process.", exc_info=True)
294
+ obj.tft.tft_report_error(obj.tft.ReportState.RS_UNKNOWN.value)
228
295
  raise e
229
296
  else:
230
297
  return func(self, *args, **kwargs)
@@ -384,6 +451,11 @@ def _set_with_processed_inputs(network, inputs):
384
451
  "Reset inputs from a process inputs, should be a list/tuple or a dict, but got %s!" % str(inputs))
385
452
 
386
453
 
454
+ def _check_tft_reset_dataset():
455
+ env_tft = os.getenv("MS_ENABLE_TFT", "")
456
+ return any([v in env_tft for v in ["TRE:1", "UCE:1", "HCCE:1", "ARF:1"]])
457
+
458
+
387
459
  class Model:
388
460
  """
389
461
  High-Level API for training or inference.
@@ -501,6 +573,10 @@ class Model:
501
573
  self._lite_infer = True # if backend lite infer fails, set False
502
574
  self._mindspore_lite_model_group_id = id(self) & 0xFFFF
503
575
  self.batch_num = -1
576
+ self.enable_tre = "TRE:1" in os.getenv("MS_ENABLE_TFT", "")
577
+ self.enable_hcce = "HCCE:1" in os.getenv("MS_ENABLE_TFT", "")
578
+ self._initial_step = None
579
+ self._need_reset_data = _check_tft_reset_dataset()
504
580
  _clear_auto_parallel_context(self._network)
505
581
 
506
582
  def _check_for_graph_cell(self, kwargs):
@@ -700,7 +776,7 @@ class Model:
700
776
  logger.info("Begin to connect network with dataset.")
701
777
  network = connect_network_with_dataset(network, dataset_helper)
702
778
 
703
- if _get_recovery_context("enable_recovery") and is_train:
779
+ if (_get_recovery_context("enable_recovery") or self._need_reset_data) and is_train:
704
780
  _set_training_dataset(dataset_helper)
705
781
 
706
782
  network.set_train(is_train)
@@ -957,6 +1033,7 @@ class Model:
957
1033
  cb_params.latest_ckpt_file = None
958
1034
  cb_params.loss_scale_mananger = self._loss_scale_manager
959
1035
  cb_params.is_arf = _get_recovery_context("is_arf")
1036
+ cb_params.initial_step = self._initial_step
960
1037
 
961
1038
  # build callback list
962
1039
  with _CallbackManager(callbacks) as list_callback:
@@ -995,7 +1072,7 @@ class Model:
995
1072
  initial_epoch (int): Epoch at which to start train, it used for resuming a previous training run.
996
1073
  Default: 0.
997
1074
  """
998
- is_graph = (context.get_context("mode") == context.GRAPH_MODE)
1075
+ is_graph = context.get_context("mode") == context.GRAPH_MODE
999
1076
  dataset_size = train_dataset.get_dataset_size()
1000
1077
  if dataset_size % sink_size != 0:
1001
1078
  logger.info("In dataset_sink mode (dataset_size % sink_size) should equal to 0, "
@@ -1064,6 +1141,7 @@ class Model:
1064
1141
  if cb_params.is_arf:
1065
1142
  cb_params.is_arf = False
1066
1143
  _set_recovery_context(is_arf=False)
1144
+ _clean_rootinfo()
1067
1145
 
1068
1146
  # Embedding cache server only run one step.
1069
1147
  if is_embedding_cache_server:
@@ -1278,6 +1356,7 @@ class Model:
1278
1356
  if cb_params.is_arf:
1279
1357
  cb_params.is_arf = False
1280
1358
  _set_recovery_context(is_arf=False)
1359
+ _clean_rootinfo()
1281
1360
  # Embedding cache server only run one step.
1282
1361
  if is_embedding_cache_server:
1283
1362
  break
@@ -2241,6 +2320,7 @@ class Model:
2241
2320
 
2242
2321
  Examples:
2243
2322
  >>> import numpy as np
2323
+ >>> import mindspore as ms
2244
2324
  >>> import mindspore.nn as nn
2245
2325
  >>> from mindspore import Tensor
2246
2326
  >>> from mindspore.train import Model
@@ -2250,28 +2330,28 @@ class Model:
2250
2330
  >>> from mindspore.parallel.auto_parallel import AutoParallel
2251
2331
  >>>
2252
2332
  >>> class Net(nn.Cell):
2253
- >>> def __init__(self):
2254
- >>> super(Net, self).__init__()
2255
- >>> self.fc1 = nn.Dense(128, 768, activation='relu')
2256
- >>> self.fc2 = nn.Dense(128, 768, activation='relu')
2257
- >>> self.fc3 = nn.Dense(128, 768, activation='relu')
2258
- >>> self.fc4 = nn.Dense(768, 768, activation='relu')
2259
- >>> self.relu4 = nn.ReLU()
2260
- >>> self.relu5 = nn.ReLU()
2261
- >>> self.transpose = P.Transpose()
2262
- >>> self.matmul1 = P.MatMul()
2263
- >>> self.matmul2 = P.MatMul()
2264
- >>>
2265
- >>> def construct(self, x):
2266
- >>> q = self.fc1(x)
2267
- >>> k = self.fc2(x)
2268
- >>> v = self.fc3(x)
2269
- >>> k = self.transpose(k, (1, 0))
2270
- >>> c = self.relu4(self.matmul1(q, k))
2271
- >>> s = self.relu5(self.matmul2(c, v))
2272
- >>> s = self.fc4(s)
2273
- >>> return s
2274
- >>>
2333
+ ... def __init__(self):
2334
+ ... super(Net, self).__init__()
2335
+ ... self.fc1 = nn.Dense(128, 768, activation='relu')
2336
+ ... self.fc2 = nn.Dense(128, 768, activation='relu')
2337
+ ... self.fc3 = nn.Dense(128, 768, activation='relu')
2338
+ ... self.fc4 = nn.Dense(768, 768, activation='relu')
2339
+ ... self.relu4 = nn.ReLU()
2340
+ ... self.relu5 = nn.ReLU()
2341
+ ... self.transpose = P.Transpose()
2342
+ ... self.matmul1 = P.MatMul()
2343
+ ... self.matmul2 = P.MatMul()
2344
+ ...
2345
+ ... def construct(self, x):
2346
+ ... q = self.fc1(x)
2347
+ ... k = self.fc2(x)
2348
+ ... v = self.fc3(x)
2349
+ ... k = self.transpose(k, (1, 0))
2350
+ ... c = self.relu4(self.matmul1(q, k))
2351
+ ... s = self.relu5(self.matmul2(c, v))
2352
+ ... s = self.fc4(s)
2353
+ ... return s
2354
+ ...
2275
2355
  >>> ms.set_context(mode=ms.GRAPH_MODE)
2276
2356
  >>> init()
2277
2357
  >>> inputs = Tensor(np.ones([32, 128]).astype(np.float32))