mindstudio-probe 1.0.1__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (323) hide show
  1. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/LICENSE +201 -201
  2. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/METADATA +36 -30
  3. mindstudio_probe-1.0.4.dist-info/RECORD +276 -0
  4. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/WHEEL +1 -1
  5. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/entry_points.txt +1 -0
  6. msprobe/README.md +101 -182
  7. msprobe/__init__.py +1 -0
  8. msprobe/{config/config.json → config.json} +49 -27
  9. msprobe/core/__init__.py +0 -0
  10. msprobe/{pytorch → core}/advisor/advisor.py +124 -124
  11. msprobe/{pytorch → core}/advisor/advisor_const.py +59 -59
  12. msprobe/{pytorch → core}/advisor/advisor_result.py +58 -58
  13. msprobe/core/common/const.py +341 -241
  14. msprobe/core/common/exceptions.py +100 -88
  15. msprobe/core/common/{file_check.py → file_utils.py} +478 -265
  16. msprobe/core/common/log.py +76 -55
  17. msprobe/core/common/utils.py +385 -516
  18. msprobe/core/common_config.py +85 -58
  19. msprobe/core/compare/acc_compare.py +300 -0
  20. msprobe/core/compare/check.py +95 -0
  21. msprobe/core/compare/compare_cli.py +49 -0
  22. msprobe/core/compare/highlight.py +223 -0
  23. msprobe/core/compare/multiprocessing_compute.py +149 -0
  24. msprobe/{pytorch → core}/compare/npy_compare.py +295 -244
  25. msprobe/core/compare/utils.py +430 -0
  26. msprobe/core/data_dump/data_collector.py +154 -140
  27. msprobe/core/data_dump/data_processor/base.py +314 -245
  28. msprobe/core/data_dump/data_processor/factory.py +59 -61
  29. msprobe/core/data_dump/data_processor/mindspore_processor.py +186 -0
  30. msprobe/core/data_dump/data_processor/pytorch_processor.py +366 -346
  31. msprobe/core/data_dump/json_writer.py +96 -116
  32. msprobe/core/data_dump/scope.py +178 -178
  33. msprobe/core/grad_probe/__init__.py +0 -0
  34. msprobe/core/grad_probe/constant.py +71 -0
  35. msprobe/core/grad_probe/grad_compare.py +171 -0
  36. msprobe/core/grad_probe/utils.py +64 -0
  37. msprobe/docs/01.installation.md +89 -0
  38. msprobe/docs/02.config_introduction.md +165 -0
  39. msprobe/docs/03.config_examples.md +247 -0
  40. msprobe/docs/04.acl_config_examples.md +76 -0
  41. msprobe/docs/05.data_dump_PyTorch.md +198 -0
  42. msprobe/docs/06.data_dump_MindSpore.md +243 -0
  43. msprobe/docs/07.accuracy_checker_PyTorch.md +274 -0
  44. msprobe/docs/08.accuracy_checker_online_PyTorch.md +198 -0
  45. msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
  46. msprobe/docs/10.accuracy_compare_PyTorch.md +245 -0
  47. msprobe/docs/11.accuracy_compare_MindSpore.md +202 -0
  48. msprobe/docs/12.overflow_check_PyTorch.md +79 -0
  49. msprobe/docs/13.overflow_check_MindSpore.md +31 -0
  50. msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
  51. msprobe/docs/15.free_benchmarking_PyTorch.md +164 -0
  52. msprobe/docs/17.grad_probe.md +207 -0
  53. msprobe/docs/FAQ_PyTorch.md +177 -0
  54. msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
  55. msprobe/docs/img/free_benchmark_framework.png +0 -0
  56. msprobe/docs/img/grad_probe_image-1.png +0 -0
  57. msprobe/docs/img/grad_probe_image-2.png +0 -0
  58. msprobe/docs/img/grad_probe_image-3.png +0 -0
  59. msprobe/docs/img/grad_probe_image-4.png +0 -0
  60. msprobe/docs/img/grad_probe_image.png +0 -0
  61. msprobe/mindspore/__init__.py +1 -1
  62. msprobe/mindspore/api_accuracy_checker/__init__.py +0 -0
  63. msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +255 -0
  64. msprobe/mindspore/api_accuracy_checker/api_info.py +69 -0
  65. msprobe/mindspore/api_accuracy_checker/api_runner.py +156 -0
  66. msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +197 -0
  67. msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
  68. msprobe/mindspore/api_accuracy_checker/compute_element.py +239 -0
  69. msprobe/mindspore/api_accuracy_checker/main.py +9 -0
  70. msprobe/mindspore/api_accuracy_checker/type_mapping.py +114 -0
  71. msprobe/mindspore/api_accuracy_checker/utils.py +80 -0
  72. msprobe/mindspore/cell_processor.py +34 -0
  73. msprobe/mindspore/common/const.py +106 -0
  74. msprobe/mindspore/common/log.py +38 -0
  75. msprobe/mindspore/common/utils.py +81 -0
  76. msprobe/mindspore/compare/distributed_compare.py +75 -0
  77. msprobe/mindspore/compare/ms_compare.py +219 -0
  78. msprobe/mindspore/compare/ms_graph_compare.py +348 -0
  79. msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -0
  80. msprobe/mindspore/debugger/debugger_config.py +66 -51
  81. msprobe/mindspore/debugger/precision_debugger.py +126 -32
  82. msprobe/mindspore/dump/dump_tool_factory.py +35 -38
  83. msprobe/mindspore/dump/hook_cell/api_registry.py +118 -0
  84. msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -0
  85. msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +922 -0
  86. msprobe/mindspore/dump/hook_cell/wrap_api.py +113 -0
  87. msprobe/mindspore/dump/jit_dump.py +72 -0
  88. msprobe/mindspore/dump/kernel_graph_dump.py +59 -60
  89. msprobe/mindspore/dump/kernel_kbyk_dump.py +64 -0
  90. msprobe/mindspore/free_benchmark/__init__.py +0 -0
  91. msprobe/mindspore/free_benchmark/api_pynative_self_check.py +116 -0
  92. msprobe/mindspore/free_benchmark/common/__init__.py +0 -0
  93. msprobe/mindspore/free_benchmark/common/config.py +12 -0
  94. msprobe/mindspore/free_benchmark/common/handler_params.py +17 -0
  95. msprobe/mindspore/free_benchmark/common/utils.py +71 -0
  96. msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -0
  97. msprobe/mindspore/free_benchmark/decorator/__init__.py +0 -0
  98. msprobe/mindspore/free_benchmark/decorator/dec_forward.py +43 -0
  99. msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +107 -0
  100. msprobe/mindspore/free_benchmark/handler/__init__.py +0 -0
  101. msprobe/mindspore/free_benchmark/handler/base_handler.py +90 -0
  102. msprobe/mindspore/free_benchmark/handler/check_handler.py +41 -0
  103. msprobe/mindspore/free_benchmark/handler/fix_handler.py +36 -0
  104. msprobe/mindspore/free_benchmark/handler/handler_factory.py +21 -0
  105. msprobe/mindspore/free_benchmark/perturbation/add_noise.py +67 -0
  106. msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +21 -0
  107. msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +63 -0
  108. msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +51 -0
  109. msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +35 -0
  110. msprobe/mindspore/free_benchmark/perturbation/no_change.py +12 -0
  111. msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +29 -0
  112. msprobe/mindspore/free_benchmark/self_check_tool_factory.py +33 -0
  113. msprobe/mindspore/grad_probe/__init__.py +0 -0
  114. msprobe/mindspore/grad_probe/global_context.py +90 -0
  115. msprobe/mindspore/grad_probe/grad_analyzer.py +231 -0
  116. msprobe/mindspore/grad_probe/grad_monitor.py +27 -0
  117. msprobe/mindspore/grad_probe/grad_stat_csv.py +132 -0
  118. msprobe/mindspore/grad_probe/hook.py +94 -0
  119. msprobe/mindspore/grad_probe/utils.py +30 -0
  120. msprobe/mindspore/ms_config.py +128 -78
  121. msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +44 -45
  122. msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +34 -32
  123. msprobe/mindspore/runtime.py +4 -0
  124. msprobe/mindspore/service.py +378 -0
  125. msprobe/mindspore/task_handler_factory.py +24 -21
  126. msprobe/msprobe.py +105 -67
  127. msprobe/pytorch/__init__.py +4 -4
  128. msprobe/pytorch/api_accuracy_checker/common/config.py +53 -50
  129. msprobe/pytorch/api_accuracy_checker/common/utils.py +214 -224
  130. msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +213 -216
  131. msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +606 -545
  132. msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
  133. msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
  134. msprobe/pytorch/api_accuracy_checker/compare/compare.py +386 -345
  135. msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +73 -73
  136. msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +245 -248
  137. msprobe/pytorch/api_accuracy_checker/config.yaml +10 -4
  138. msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +335 -328
  139. msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +200 -203
  140. msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +133 -127
  141. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +592 -493
  142. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +70 -7
  143. msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
  144. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/__init__.py +0 -0
  145. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +197 -0
  146. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +325 -0
  147. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +204 -0
  148. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +219 -0
  149. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +10 -0
  150. msprobe/pytorch/bench_functions/__init__.py +15 -0
  151. msprobe/pytorch/bench_functions/apply_adam_w.py +28 -0
  152. msprobe/pytorch/bench_functions/confusion_transpose.py +19 -0
  153. msprobe/pytorch/bench_functions/fast_gelu.py +55 -0
  154. msprobe/pytorch/bench_functions/layer_norm_eval.py +6 -0
  155. msprobe/pytorch/bench_functions/linear.py +12 -0
  156. msprobe/pytorch/bench_functions/matmul_backward.py +48 -0
  157. msprobe/pytorch/bench_functions/npu_fusion_attention.py +509 -0
  158. msprobe/pytorch/bench_functions/rms_norm.py +15 -0
  159. msprobe/pytorch/bench_functions/rotary_mul.py +52 -0
  160. msprobe/pytorch/bench_functions/scaled_mask_softmax.py +26 -0
  161. msprobe/pytorch/bench_functions/swiglu.py +55 -0
  162. msprobe/pytorch/common/__init__.py +2 -2
  163. msprobe/pytorch/common/compare_script.template +14 -14
  164. msprobe/pytorch/common/log.py +20 -31
  165. msprobe/pytorch/common/parse_json.py +39 -37
  166. msprobe/pytorch/common/utils.py +305 -224
  167. msprobe/pytorch/compare/distributed_compare.py +66 -111
  168. msprobe/pytorch/compare/mapping.yaml +607 -607
  169. msprobe/pytorch/compare/match.py +34 -36
  170. msprobe/pytorch/compare/pt_compare.py +50 -0
  171. msprobe/pytorch/debugger/debugger_config.py +95 -86
  172. msprobe/pytorch/debugger/precision_debugger.py +125 -95
  173. msprobe/pytorch/free_benchmark/__init__.py +8 -8
  174. msprobe/pytorch/free_benchmark/common/constant.py +70 -67
  175. msprobe/pytorch/free_benchmark/common/counter.py +71 -71
  176. msprobe/pytorch/free_benchmark/common/enums.py +37 -37
  177. msprobe/pytorch/free_benchmark/common/params.py +129 -129
  178. msprobe/pytorch/free_benchmark/common/utils.py +102 -98
  179. msprobe/pytorch/free_benchmark/compare/grad_saver.py +179 -183
  180. msprobe/pytorch/free_benchmark/compare/single_benchmark.py +104 -104
  181. msprobe/pytorch/free_benchmark/main.py +105 -102
  182. msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +13 -13
  183. msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +41 -41
  184. msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +90 -90
  185. msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +104 -104
  186. msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +63 -63
  187. msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +68 -68
  188. msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +28 -28
  189. msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +45 -45
  190. msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +19 -19
  191. msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +217 -203
  192. msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +39 -39
  193. msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +23 -23
  194. msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +30 -31
  195. msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +170 -170
  196. msprobe/pytorch/function_factory.py +76 -0
  197. msprobe/pytorch/functional/dump_module.py +39 -39
  198. msprobe/pytorch/grad_probe/__init__.py +0 -0
  199. msprobe/pytorch/grad_probe/grad_monitor.py +91 -0
  200. msprobe/pytorch/grad_probe/grad_stat_csv.py +129 -0
  201. msprobe/pytorch/hook_module/api_registry.py +161 -161
  202. msprobe/pytorch/hook_module/hook_module.py +120 -109
  203. msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1876
  204. msprobe/pytorch/hook_module/utils.py +30 -29
  205. msprobe/pytorch/hook_module/wrap_aten.py +110 -100
  206. msprobe/pytorch/hook_module/wrap_distributed.py +78 -75
  207. msprobe/pytorch/hook_module/wrap_functional.py +105 -108
  208. msprobe/pytorch/hook_module/wrap_npu_custom.py +93 -73
  209. msprobe/pytorch/hook_module/wrap_tensor.py +71 -72
  210. msprobe/pytorch/hook_module/wrap_torch.py +86 -88
  211. msprobe/pytorch/hook_module/wrap_vf.py +62 -64
  212. msprobe/pytorch/module_processer.py +138 -98
  213. msprobe/pytorch/online_dispatch/__init__.py +20 -20
  214. msprobe/pytorch/online_dispatch/compare.py +236 -236
  215. msprobe/pytorch/online_dispatch/dispatch.py +271 -273
  216. msprobe/pytorch/online_dispatch/dump_compare.py +155 -186
  217. msprobe/pytorch/online_dispatch/single_compare.py +391 -391
  218. msprobe/pytorch/online_dispatch/torch_ops_config.yaml +49 -49
  219. msprobe/pytorch/online_dispatch/utils.py +130 -187
  220. msprobe/pytorch/parse.py +4 -4
  221. msprobe/pytorch/parse_tool/cli.py +32 -32
  222. msprobe/pytorch/parse_tool/lib/compare.py +260 -259
  223. msprobe/pytorch/parse_tool/lib/config.py +52 -51
  224. msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
  225. msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
  226. msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
  227. msprobe/pytorch/parse_tool/lib/parse_tool.py +158 -158
  228. msprobe/pytorch/parse_tool/lib/utils.py +316 -367
  229. msprobe/pytorch/parse_tool/lib/visualization.py +85 -90
  230. msprobe/pytorch/pt_config.py +188 -93
  231. msprobe/pytorch/service.py +246 -167
  232. mindstudio_probe-1.0.1.dist-info/RECORD +0 -228
  233. msprobe/config/README.md +0 -397
  234. msprobe/mindspore/doc/dump.md +0 -65
  235. msprobe/mindspore/dump/api_kbk_dump.py +0 -55
  236. msprobe/pytorch/compare/acc_compare.py +0 -1024
  237. msprobe/pytorch/compare/highlight.py +0 -100
  238. msprobe/pytorch/doc/FAQ.md +0 -193
  239. msprobe/pytorch/doc/api_accuracy_checker.md +0 -269
  240. msprobe/pytorch/doc/atat/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -182
  241. msprobe/pytorch/doc/dump.md +0 -207
  242. msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -176
  243. msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
  244. msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
  245. msprobe/pytorch/doc/run_overflow_check.md +0 -25
  246. msprobe/pytorch/doc//321/205/320/254/320/270/321/207/342/225/221/342/224/220/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/206/320/277/320/244/321/205/320/277/342/225/243.md +0 -90
  247. msprobe/test/core_ut/common/test_utils.py +0 -345
  248. msprobe/test/core_ut/data_dump/test_data_collector.py +0 -47
  249. msprobe/test/core_ut/data_dump/test_json_writer.py +0 -183
  250. msprobe/test/core_ut/data_dump/test_scope.py +0 -151
  251. msprobe/test/core_ut/test_common_config.py +0 -152
  252. msprobe/test/core_ut/test_file_check.py +0 -218
  253. msprobe/test/core_ut/test_log.py +0 -109
  254. msprobe/test/mindspore_ut/test_api_kbk_dump.py +0 -51
  255. msprobe/test/mindspore_ut/test_debugger_config.py +0 -42
  256. msprobe/test/mindspore_ut/test_dump_tool_factory.py +0 -51
  257. msprobe/test/mindspore_ut/test_kernel_graph_dump.py +0 -66
  258. msprobe/test/mindspore_ut/test_kernel_graph_overflow_check.py +0 -63
  259. msprobe/test/mindspore_ut/test_ms_config.py +0 -69
  260. msprobe/test/mindspore_ut/test_overflow_check_tool_factory.py +0 -51
  261. msprobe/test/mindspore_ut/test_precision_debugger.py +0 -56
  262. msprobe/test/mindspore_ut/test_task_handler_factory.py +0 -58
  263. msprobe/test/pytorch_ut/advisor/test_advisor.py +0 -83
  264. msprobe/test/pytorch_ut/api_accuracy_checker/common/test_common_utils.py +0 -108
  265. msprobe/test/pytorch_ut/api_accuracy_checker/common/test_config.py +0 -39
  266. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_algorithm.py +0 -112
  267. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_api_precision_compare.py +0 -77
  268. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare.py +0 -125
  269. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_column.py +0 -10
  270. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_utils.py +0 -43
  271. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/dump.json +0 -179
  272. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/forward.json +0 -63
  273. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_data_generate.py +0 -99
  274. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_multi_run_ut.py +0 -115
  275. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_run_ut.py +0 -72
  276. msprobe/test/pytorch_ut/compare/test_acc_compare.py +0 -17
  277. msprobe/test/pytorch_ut/free_benchmark/perturbed_layers/test_perturbed_layser.py +0 -105
  278. msprobe/test/pytorch_ut/free_benchmark/result_handlers/test_result_handler.py +0 -121
  279. msprobe/test/pytorch_ut/free_benchmark/test_main.py +0 -101
  280. msprobe/test/pytorch_ut/functional/test_dump_module.py +0 -15
  281. msprobe/test/pytorch_ut/hook_module/test_api_registry.py +0 -130
  282. msprobe/test/pytorch_ut/hook_module/test_hook_module.py +0 -42
  283. msprobe/test/pytorch_ut/hook_module/test_wrap_aten.py +0 -65
  284. msprobe/test/pytorch_ut/hook_module/test_wrap_distributed.py +0 -35
  285. msprobe/test/pytorch_ut/hook_module/test_wrap_functional.py +0 -20
  286. msprobe/test/pytorch_ut/hook_module/test_wrap_tensor.py +0 -35
  287. msprobe/test/pytorch_ut/hook_module/test_wrap_torch.py +0 -43
  288. msprobe/test/pytorch_ut/hook_module/test_wrap_vf.py +0 -11
  289. msprobe/test/pytorch_ut/test_pt_config.py +0 -69
  290. msprobe/test/pytorch_ut/test_service.py +0 -59
  291. msprobe/test/resources/advisor.txt +0 -3
  292. msprobe/test/resources/compare_result_20230703104808.csv +0 -9
  293. msprobe/test/resources/compare_result_without_accuracy.csv +0 -9
  294. msprobe/test/resources/config.yaml +0 -3
  295. msprobe/test/resources/npu_test.pkl +0 -8
  296. msprobe/test/run_test.sh +0 -30
  297. msprobe/test/run_ut.py +0 -58
  298. msprobe/test/test_module_processer.py +0 -64
  299. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/top_level.txt +0 -0
  300. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
  301. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
  302. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
  303. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
  304. /msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
  305. /msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
  306. /msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
  307. /msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
  308. /msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
  309. /msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
  310. /msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
  311. /msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
  312. /msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
  313. /msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
  314. /msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
  315. /msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
  316. /msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
  317. /msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
  318. /msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
  319. /msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
  320. /msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
  321. /msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
  322. /msprobe/{config → docs}/img/free_benchmark.png +0 -0
  323. /msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0
@@ -1,203 +1,200 @@
1
- import subprocess
2
- import json
3
- import os
4
- import sys
5
- import argparse
6
- import time
7
- import signal
8
- import threading
9
- from collections import namedtuple
10
- from itertools import cycle
11
- from tqdm import tqdm
12
- from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut import _run_ut_parser, get_validated_result_csv_path, \
13
- get_validated_details_csv_path, preprocess_forward_content
14
- from msprobe.pytorch.api_accuracy_checker.compare.compare import Comparator
15
- from msprobe.pytorch.common import parse_json_info_forward_backward
16
- from msprobe.core.common.file_check import FileChecker, check_file_suffix, check_link, FileOpen, \
17
- check_path_before_create, create_directory
18
- from msprobe.pytorch.common.log import logger
19
- from msprobe.core.common.const import FileCheckConst
20
-
21
-
22
- def split_json_file(input_file, num_splits, filter_api):
23
- forward_data, backward_data, real_data_path = parse_json_info_forward_backward(input_file)
24
- if filter_api:
25
- forward_data = preprocess_forward_content(forward_data)
26
- for data_name in list(forward_data.keys()):
27
- forward_data[f"{data_name}.forward"] = forward_data.pop(data_name)
28
- for data_name in list(backward_data.keys()):
29
- backward_data[f"{data_name}.backward"] = backward_data.pop(data_name)
30
-
31
- with FileOpen(input_file, 'r') as file:
32
- input_data = json.load(file)
33
- input_data.pop("data")
34
-
35
- items = list(forward_data.items())
36
- total_items = len(items)
37
- chunk_size = total_items // num_splits
38
- split_files = []
39
-
40
- for i in range(num_splits):
41
- start = i * chunk_size
42
- end = (i + 1) * chunk_size if i < num_splits - 1 else total_items
43
-
44
- split_forward_data = dict(items[start:end])
45
- temp_data = {
46
- **input_data,
47
- "data":{
48
- **split_forward_data,
49
- **backward_data
50
- }
51
- }
52
- split_filename = f"temp_part{i}.json"
53
- with FileOpen(split_filename, 'w') as split_file:
54
- json.dump(temp_data, split_file)
55
- split_files.append(split_filename)
56
-
57
- return split_files, total_items
58
-
59
-
60
- def signal_handler(signum, frame):
61
- logger.warning(f'Signal handler called with signal {signum}')
62
- raise KeyboardInterrupt()
63
-
64
-
65
- signal.signal(signal.SIGINT, signal_handler)
66
- signal.signal(signal.SIGTERM, signal_handler)
67
-
68
-
69
- ParallelUTConfig = namedtuple('ParallelUTConfig', ['api_files', 'out_path', 'num_splits',
70
- 'save_error_data_flag', 'jit_compile_flag', 'device_id',
71
- 'result_csv_path', 'total_items', 'real_data_path'])
72
-
73
-
74
- def run_parallel_ut(config):
75
- processes = []
76
- device_id_cycle = cycle(config.device_id)
77
- if config.save_error_data_flag:
78
- logger.info("UT task error datas will be saved")
79
- logger.info(f"Starting parallel UT with {config.num_splits} processes")
80
- progress_bar = tqdm(total=config.total_items, desc="Total items", unit="items")
81
-
82
- def create_cmd(api_info, dev_id):
83
- dirname, filename = os.path.split(os.path.abspath(__file__))
84
- run_ut_path = os.path.join(dirname, "run_ut.py")
85
- cmd = [
86
- sys.executable, run_ut_path,
87
- '-api_info', api_info,
88
- *(['-o', config.out_path] if config.out_path else []),
89
- '-d', str(dev_id),
90
- *(['-j'] if config.jit_compile_flag else []),
91
- *(['-save_error_data'] if config.save_error_data_flag else []),
92
- '-csv_path', config.result_csv_path,
93
- *(['-real_data_path', config.real_data_path] if config.real_data_path else [])
94
- ]
95
- return cmd
96
-
97
- def read_process_output(process):
98
- try:
99
- while True:
100
- if process.poll() is not None:
101
- break
102
- output = process.stdout.readline()
103
- if output == '':
104
- break
105
- if '[ERROR]' in output:
106
- print(output, end='')
107
- sys.stdout.flush()
108
- except ValueError as e:
109
- logger.warning(f"An error occurred while reading subprocess output: {e}")
110
-
111
- def update_progress_bar(progress_bar, result_csv_path):
112
- while any(process.poll() is None for process in processes):
113
- try:
114
- with open(result_csv_path, 'r') as result_file:
115
- completed_items = len(result_file.readlines()) - 1
116
- progress_bar.update(completed_items - progress_bar.n)
117
- except FileNotFoundError:
118
- logger.warning(f"Result CSV file not found: {result_csv_path}.")
119
- except Exception as e:
120
- logger.error(f"An unexpected error occurred while reading result CSV: {e}")
121
- time.sleep(1)
122
-
123
- for api_info in config.api_files:
124
- cmd = create_cmd(api_info, next(device_id_cycle))
125
- process = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.DEVNULL, text=True, bufsize=1)
126
- processes.append(process)
127
- threading.Thread(target=read_process_output, args=(process,), daemon=True).start()
128
-
129
- progress_bar_thread = threading.Thread(target=update_progress_bar, args=(progress_bar, config.result_csv_path))
130
- progress_bar_thread.start()
131
-
132
- def clean_up():
133
- progress_bar.close()
134
- for process in processes:
135
- try:
136
- process.terminate()
137
- process.wait(timeout=1)
138
- except subprocess.TimeoutExpired:
139
- process.kill()
140
- for file in config.api_files:
141
- check_link(file)
142
- try:
143
- os.remove(file)
144
- except FileNotFoundError:
145
- logger.warning(f"File not found and could not be deleted: {file}")
146
-
147
- try:
148
- for process in processes:
149
- process.communicate(timeout=None)
150
- except KeyboardInterrupt:
151
- logger.warning("Interrupted by user, terminating processes and cleaning up...")
152
- except Exception as e:
153
- logger.error(f"An unexpected error occurred: {e}")
154
- finally:
155
- if progress_bar.n < config.total_items:
156
- logger.warning("The UT task has not been completed. The parameter '-csv_path' along with the path to the result CSV file will be utilized to resume the UT task.")
157
- clean_up()
158
- progress_bar_thread.join()
159
- try:
160
- comparator = Comparator(config.result_csv_path, config.result_csv_path, False)
161
- comparator.print_pretest_result()
162
- except FileNotFoundError as e:
163
- logger.error(f"Error: {e}")
164
- except Exception as e:
165
- logger.error(f"An unexpected error occurred: {e}")
166
-
167
-
168
- def prepare_config(args):
169
- check_link(args.api_info_file)
170
- api_info = os.path.realpath(args.api_info_file)
171
- check_file_suffix(api_info, FileCheckConst.JSON_SUFFIX)
172
- out_path = os.path.realpath(args.out_path) if args.out_path else "./"
173
- check_path_before_create(out_path)
174
- create_directory(out_path)
175
- out_path_checker = FileChecker(out_path, FileCheckConst.DIR, ability=FileCheckConst.WRITE_ABLE)
176
- out_path = out_path_checker.common_check()
177
- split_files, total_items = split_json_file(api_info, args.num_splits, args.filter_api)
178
-
179
- result_csv_path = args.result_csv_path or os.path.join(out_path, f"accuracy_checking_result_{time.strftime('%Y%m%d%H%M%S')}.csv")
180
- if not args.result_csv_path:
181
- details_csv_path = os.path.join(out_path, f"accuracy_checking_details_{time.strftime('%Y%m%d%H%M%S')}.csv")
182
- comparator = Comparator(result_csv_path, details_csv_path, False)
183
- else:
184
- result_csv_path = get_validated_result_csv_path(args.result_csv_path, 'result')
185
- details_csv_path = get_validated_details_csv_path(result_csv_path)
186
- logger.info(f"UT task result will be saved in {result_csv_path}")
187
- logger.info(f"UT task details will be saved in {details_csv_path}")
188
- return ParallelUTConfig(split_files, out_path, args.num_splits, args.save_error_data,
189
- args.jit_compile, args.device_id, result_csv_path,
190
- total_items, args.real_data_path)
191
-
192
-
193
- def main():
194
- parser = argparse.ArgumentParser(description='Run UT in parallel')
195
- _run_ut_parser(parser)
196
- parser.add_argument('-n', '--num_splits', type=int, choices=range(1, 65), default=8, help='Number of splits for parallel processing. Range: 1-64')
197
- args = parser.parse_args()
198
- config = prepare_config(args)
199
- run_parallel_ut(config)
200
-
201
-
202
- if __name__ == '__main__':
203
- main()
1
+ import subprocess
2
+ import json
3
+ import os
4
+ import sys
5
+ import argparse
6
+ import time
7
+ import signal
8
+ import threading
9
+ from collections import namedtuple
10
+ from itertools import cycle
11
+ from tqdm import tqdm
12
+ from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut import _run_ut_parser, preprocess_forward_content
13
+ from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut_utils import get_validated_result_csv_path, \
14
+ get_validated_details_csv_path
15
+ from msprobe.pytorch.api_accuracy_checker.compare.compare import Comparator
16
+ from msprobe.pytorch.common import parse_json_info_forward_backward
17
+ from msprobe.pytorch.common.log import logger
18
+ from msprobe.core.common.file_utils import FileChecker, check_file_suffix, check_link, FileOpen, \
19
+ check_path_before_create, create_directory
20
+ from msprobe.core.common.file_utils import remove_path
21
+ from msprobe.core.common.const import FileCheckConst
22
+
23
+
24
+ def split_json_file(input_file, num_splits, filter_api):
25
+ forward_data, backward_data, real_data_path = parse_json_info_forward_backward(input_file)
26
+ if filter_api:
27
+ forward_data = preprocess_forward_content(forward_data)
28
+ for data_name in list(forward_data.keys()):
29
+ forward_data[f"{data_name}.forward"] = forward_data.pop(data_name)
30
+ for data_name in list(backward_data.keys()):
31
+ backward_data[f"{data_name}.backward"] = backward_data.pop(data_name)
32
+
33
+ with FileOpen(input_file, 'r') as file:
34
+ input_data = json.load(file)
35
+ input_data.pop("data")
36
+
37
+ items = list(forward_data.items())
38
+ total_items = len(items)
39
+ chunk_size = total_items // num_splits
40
+ split_files = []
41
+
42
+ for i in range(num_splits):
43
+ start = i * chunk_size
44
+ end = (i + 1) * chunk_size if i < num_splits - 1 else total_items
45
+
46
+ split_forward_data = dict(items[start:end])
47
+ temp_data = {
48
+ **input_data,
49
+ "data":{
50
+ **split_forward_data,
51
+ **backward_data
52
+ }
53
+ }
54
+ split_filename = f"temp_part{i}.json"
55
+ with FileOpen(split_filename, 'w') as split_file:
56
+ json.dump(temp_data, split_file)
57
+ split_files.append(split_filename)
58
+
59
+ return split_files, total_items
60
+
61
+
62
def signal_handler(signum, frame):
    """Log the received signal number and convert it into a KeyboardInterrupt."""
    message = f'Signal handler called with signal {signum}'
    logger.warning(message)
    raise KeyboardInterrupt()


# Installed at import time: both SIGINT and SIGTERM are routed to signal_handler.
for _handled_signal in (signal.SIGINT, signal.SIGTERM):
    signal.signal(_handled_signal, signal_handler)
del _handled_signal
69
+
70
+
71
# Immutable bundle of settings handed from prepare_config() to run_parallel_ut().
ParallelUTConfig = namedtuple(
    'ParallelUTConfig',
    (
        'api_files',             # split JSON files, one per subprocess
        'out_path',              # output directory forwarded via '-o'
        'num_splits',            # number of parallel subprocesses
        'save_error_data_flag',  # forwards '-save_error_data' when truthy
        'jit_compile_flag',      # forwards '-j' when truthy
        'device_id',             # iterable of device ids, cycled over the subprocesses
        'result_csv_path',       # result CSV forwarded via '-csv_path'
        'total_items',           # number of forward entries across all splits
        'config_path',           # optional config file forwarded via '-config'
    ),
)
74
+
75
+
76
def run_parallel_ut(config):
    """Run ``run_ut.py`` once per split file, in parallel subprocesses.

    One subprocess is started for every entry of ``config.api_files``; device
    ids are taken round-robin from ``config.device_id``. Subprocess stderr is
    discarded and only stdout lines containing ``[ERROR]`` are echoed. A
    background thread re-reads ``config.result_csv_path`` once per second and
    advances a tqdm progress bar to the number of data rows found there.

    When the subprocesses finish (or the wait is interrupted), any remaining
    subprocesses are terminated, the split files are removed and the pretest
    result is printed through ``Comparator``.

    Args:
        config: A ``ParallelUTConfig`` describing the run.
    """
    processes = []
    device_id_cycle = cycle(config.device_id)
    if config.save_error_data_flag:
        logger.info("UT task error datas will be saved")
    logger.info(f"Starting parallel UT with {config.num_splits} processes")
    progress_bar = tqdm(total=config.total_items, desc="Total items", unit="items")

    def create_cmd(api_info, dev_id):
        """Build the argv list that launches run_ut.py for one split file."""
        run_ut_path = os.path.join(os.path.dirname(os.path.abspath(__file__)), "run_ut.py")
        cmd = [
            sys.executable, run_ut_path,
            '-api_info', api_info,
            *(['-o', config.out_path] if config.out_path else []),
            '-d', str(dev_id),
            *(['-j'] if config.jit_compile_flag else []),
            *(['-save_error_data'] if config.save_error_data_flag else []),
            '-csv_path', config.result_csv_path,
            *(['-config', config.config_path] if config.config_path else [])
        ]
        return cmd

    def read_process_output(process):
        """Drain one subprocess's stdout, echoing only the '[ERROR]' lines."""
        try:
            # Read until EOF rather than stopping as soon as the process has
            # exited, so that lines still buffered in the pipe (typically the
            # final error message) are not dropped.
            for output in process.stdout:
                if '[ERROR]' in output:
                    print(output, end='')
                    sys.stdout.flush()
        except ValueError as e:
            logger.warning(f"An error occurred while reading subprocess output: {e}")
        finally:
            # This thread is the only reader of the pipe, so it also closes it.
            process.stdout.close()

    def refresh_progress(progress_bar, result_csv_path):
        """Advance the bar to the number of data rows currently in the CSV."""
        with FileOpen(result_csv_path, 'r') as result_file:
            # The first line is the header; an empty file counts as zero rows.
            completed_items = max(len(result_file.readlines()) - 1, 0)
        progress_bar.update(completed_items - progress_bar.n)

    def update_progress_bar(progress_bar, result_csv_path):
        """Poll the result CSV once per second while any subprocess is alive."""
        while any(process.poll() is None for process in processes):
            refresh_progress(progress_bar, result_csv_path)
            time.sleep(1)
        # Rows written between the last poll and the subprocess exit would
        # otherwise never be counted.
        refresh_progress(progress_bar, result_csv_path)

    for api_info in config.api_files:
        cmd = create_cmd(api_info, next(device_id_cycle))
        process = subprocess.Popen(cmd, stdout=subprocess.PIPE, stderr=subprocess.DEVNULL, text=True, bufsize=1,
                                   shell=False)
        processes.append(process)
        threading.Thread(target=read_process_output, args=(process,), daemon=True).start()

    progress_bar_thread = threading.Thread(target=update_progress_bar, args=(progress_bar, config.result_csv_path))
    progress_bar_thread.start()

    def stop_processes():
        """Terminate every subprocess, killing those that do not exit within 1s."""
        for process in processes:
            try:
                process.terminate()
                process.wait(timeout=1)
            except subprocess.TimeoutExpired:
                process.kill()

    def remove_split_files():
        """Delete the temporary split files that were fed to the subprocesses."""
        for file in config.api_files:
            check_link(file)
            try:
                remove_path(file)
            except FileNotFoundError:
                logger.warning(f"File not found and could not be deleted: {file}")

    try:
        for process in processes:
            # wait() instead of communicate(): communicate() would read and
            # close the same stdout pipe that read_process_output is consuming,
            # losing '[ERROR]' lines. The reader threads keep the pipes drained,
            # so waiting cannot block on a full pipe buffer.
            process.wait()
    except KeyboardInterrupt:
        logger.warning("Interrupted by user, terminating processes and cleaning up...")
    except Exception as e:
        logger.error(f"An unexpected error occurred: {e}")
    finally:
        stop_processes()
        # Join before checking completion: the progress thread performs its
        # final CSV read only after every subprocess has exited, and the bar
        # must still be open for that update to be recorded.
        progress_bar_thread.join()
        if progress_bar.n < config.total_items:
            logger.warning("The UT task has not been completed. The parameter '-csv_path' along with the path to the result CSV file will be utilized to resume the UT task.")
        progress_bar.close()
        remove_split_files()
    try:
        comparator = Comparator(config.result_csv_path, config.result_csv_path, False)
        comparator.print_pretest_result()
    except FileNotFoundError as e:
        logger.error(f"Error: {e}")
    except Exception as e:
        logger.error(f"An unexpected error occurred: {e}")
163
+
164
+
165
def prepare_config(args):
    """Validate the command-line arguments and build the ``ParallelUTConfig``.

    The API info file and output directory are checked first, then the result
    and details CSV paths are resolved, and only then is the API info file
    split into per-process temporary files.

    Args:
        args: Parsed command-line namespace. The attributes read here are
            ``api_info_file``, ``out_path``, ``num_splits``, ``filter_api``,
            ``config_path``, ``result_csv_path``, ``save_error_data``,
            ``jit_compile`` and ``device_id``.

    Returns:
        The populated ``ParallelUTConfig``.
    """
    check_link(args.api_info_file)
    api_info = os.path.realpath(args.api_info_file)
    check_file_suffix(api_info, FileCheckConst.JSON_SUFFIX)
    out_path = os.path.realpath(args.out_path) if args.out_path else "./"
    check_path_before_create(out_path)
    create_directory(out_path)
    out_path_checker = FileChecker(out_path, FileCheckConst.DIR, ability=FileCheckConst.WRITE_ABLE)
    out_path = out_path_checker.common_check()
    config_path = os.path.realpath(args.config_path) if args.config_path else None

    # Resolve the CSV paths before splitting: if a user-supplied '-csv_path'
    # fails validation, no temp_part*.json files have been written yet.
    if args.result_csv_path:
        result_csv_path = get_validated_result_csv_path(args.result_csv_path, 'result')
        details_csv_path = get_validated_details_csv_path(result_csv_path)
    else:
        # One timestamp for both names so the two files always pair up, even
        # when the clock ticks over to the next second in between.
        timestamp = time.strftime('%Y%m%d%H%M%S')
        result_csv_path = os.path.join(out_path, f"accuracy_checking_result_{timestamp}.csv")
        details_csv_path = os.path.join(out_path, f"accuracy_checking_details_{timestamp}.csv")

    split_files, total_items = split_json_file(api_info, args.num_splits, args.filter_api)

    if not args.result_csv_path:
        # The instance itself is not used here; it is constructed only for
        # whatever the constructor does with the two paths.
        # NOTE(review): presumably this creates the fresh CSV files - confirm.
        Comparator(result_csv_path, details_csv_path, False)

    logger.info(f"UT task result will be saved in {result_csv_path}")
    logger.info(f"UT task details will be saved in {details_csv_path}")
    return ParallelUTConfig(split_files, out_path, args.num_splits, args.save_error_data,
                            args.jit_compile, args.device_id, result_csv_path,
                            total_items, config_path)
188
+
189
+
190
def main():
    """Command-line entry point: parse the arguments, build the config and run the parallel UT."""
    arg_parser = argparse.ArgumentParser(description='Run UT in parallel')
    # Register the options shared with the single-process run_ut command line.
    _run_ut_parser(arg_parser)
    arg_parser.add_argument(
        '-n', '--num_splits',
        type=int,
        choices=range(1, 65),
        default=8,
        help='Number of splits for parallel processing. Range: 1-64',
    )
    parsed_args = arg_parser.parse_args()
    run_parallel_ut(prepare_config(parsed_args))


if __name__ == '__main__':
    main()