mindstudio-probe 1.0.1__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (323) hide show
  1. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/LICENSE +201 -201
  2. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/METADATA +36 -30
  3. mindstudio_probe-1.0.4.dist-info/RECORD +276 -0
  4. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/WHEEL +1 -1
  5. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/entry_points.txt +1 -0
  6. msprobe/README.md +101 -182
  7. msprobe/__init__.py +1 -0
  8. msprobe/{config/config.json → config.json} +49 -27
  9. msprobe/core/__init__.py +0 -0
  10. msprobe/{pytorch → core}/advisor/advisor.py +124 -124
  11. msprobe/{pytorch → core}/advisor/advisor_const.py +59 -59
  12. msprobe/{pytorch → core}/advisor/advisor_result.py +58 -58
  13. msprobe/core/common/const.py +341 -241
  14. msprobe/core/common/exceptions.py +100 -88
  15. msprobe/core/common/{file_check.py → file_utils.py} +478 -265
  16. msprobe/core/common/log.py +76 -55
  17. msprobe/core/common/utils.py +385 -516
  18. msprobe/core/common_config.py +85 -58
  19. msprobe/core/compare/acc_compare.py +300 -0
  20. msprobe/core/compare/check.py +95 -0
  21. msprobe/core/compare/compare_cli.py +49 -0
  22. msprobe/core/compare/highlight.py +223 -0
  23. msprobe/core/compare/multiprocessing_compute.py +149 -0
  24. msprobe/{pytorch → core}/compare/npy_compare.py +295 -244
  25. msprobe/core/compare/utils.py +430 -0
  26. msprobe/core/data_dump/data_collector.py +154 -140
  27. msprobe/core/data_dump/data_processor/base.py +314 -245
  28. msprobe/core/data_dump/data_processor/factory.py +59 -61
  29. msprobe/core/data_dump/data_processor/mindspore_processor.py +186 -0
  30. msprobe/core/data_dump/data_processor/pytorch_processor.py +366 -346
  31. msprobe/core/data_dump/json_writer.py +96 -116
  32. msprobe/core/data_dump/scope.py +178 -178
  33. msprobe/core/grad_probe/__init__.py +0 -0
  34. msprobe/core/grad_probe/constant.py +71 -0
  35. msprobe/core/grad_probe/grad_compare.py +171 -0
  36. msprobe/core/grad_probe/utils.py +64 -0
  37. msprobe/docs/01.installation.md +89 -0
  38. msprobe/docs/02.config_introduction.md +165 -0
  39. msprobe/docs/03.config_examples.md +247 -0
  40. msprobe/docs/04.acl_config_examples.md +76 -0
  41. msprobe/docs/05.data_dump_PyTorch.md +198 -0
  42. msprobe/docs/06.data_dump_MindSpore.md +243 -0
  43. msprobe/docs/07.accuracy_checker_PyTorch.md +274 -0
  44. msprobe/docs/08.accuracy_checker_online_PyTorch.md +198 -0
  45. msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
  46. msprobe/docs/10.accuracy_compare_PyTorch.md +245 -0
  47. msprobe/docs/11.accuracy_compare_MindSpore.md +202 -0
  48. msprobe/docs/12.overflow_check_PyTorch.md +79 -0
  49. msprobe/docs/13.overflow_check_MindSpore.md +31 -0
  50. msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
  51. msprobe/docs/15.free_benchmarking_PyTorch.md +164 -0
  52. msprobe/docs/17.grad_probe.md +207 -0
  53. msprobe/docs/FAQ_PyTorch.md +177 -0
  54. msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
  55. msprobe/docs/img/free_benchmark_framework.png +0 -0
  56. msprobe/docs/img/grad_probe_image-1.png +0 -0
  57. msprobe/docs/img/grad_probe_image-2.png +0 -0
  58. msprobe/docs/img/grad_probe_image-3.png +0 -0
  59. msprobe/docs/img/grad_probe_image-4.png +0 -0
  60. msprobe/docs/img/grad_probe_image.png +0 -0
  61. msprobe/mindspore/__init__.py +1 -1
  62. msprobe/mindspore/api_accuracy_checker/__init__.py +0 -0
  63. msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +255 -0
  64. msprobe/mindspore/api_accuracy_checker/api_info.py +69 -0
  65. msprobe/mindspore/api_accuracy_checker/api_runner.py +156 -0
  66. msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +197 -0
  67. msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
  68. msprobe/mindspore/api_accuracy_checker/compute_element.py +239 -0
  69. msprobe/mindspore/api_accuracy_checker/main.py +9 -0
  70. msprobe/mindspore/api_accuracy_checker/type_mapping.py +114 -0
  71. msprobe/mindspore/api_accuracy_checker/utils.py +80 -0
  72. msprobe/mindspore/cell_processor.py +34 -0
  73. msprobe/mindspore/common/const.py +106 -0
  74. msprobe/mindspore/common/log.py +38 -0
  75. msprobe/mindspore/common/utils.py +81 -0
  76. msprobe/mindspore/compare/distributed_compare.py +75 -0
  77. msprobe/mindspore/compare/ms_compare.py +219 -0
  78. msprobe/mindspore/compare/ms_graph_compare.py +348 -0
  79. msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -0
  80. msprobe/mindspore/debugger/debugger_config.py +66 -51
  81. msprobe/mindspore/debugger/precision_debugger.py +126 -32
  82. msprobe/mindspore/dump/dump_tool_factory.py +35 -38
  83. msprobe/mindspore/dump/hook_cell/api_registry.py +118 -0
  84. msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -0
  85. msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +922 -0
  86. msprobe/mindspore/dump/hook_cell/wrap_api.py +113 -0
  87. msprobe/mindspore/dump/jit_dump.py +72 -0
  88. msprobe/mindspore/dump/kernel_graph_dump.py +59 -60
  89. msprobe/mindspore/dump/kernel_kbyk_dump.py +64 -0
  90. msprobe/mindspore/free_benchmark/__init__.py +0 -0
  91. msprobe/mindspore/free_benchmark/api_pynative_self_check.py +116 -0
  92. msprobe/mindspore/free_benchmark/common/__init__.py +0 -0
  93. msprobe/mindspore/free_benchmark/common/config.py +12 -0
  94. msprobe/mindspore/free_benchmark/common/handler_params.py +17 -0
  95. msprobe/mindspore/free_benchmark/common/utils.py +71 -0
  96. msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -0
  97. msprobe/mindspore/free_benchmark/decorator/__init__.py +0 -0
  98. msprobe/mindspore/free_benchmark/decorator/dec_forward.py +43 -0
  99. msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +107 -0
  100. msprobe/mindspore/free_benchmark/handler/__init__.py +0 -0
  101. msprobe/mindspore/free_benchmark/handler/base_handler.py +90 -0
  102. msprobe/mindspore/free_benchmark/handler/check_handler.py +41 -0
  103. msprobe/mindspore/free_benchmark/handler/fix_handler.py +36 -0
  104. msprobe/mindspore/free_benchmark/handler/handler_factory.py +21 -0
  105. msprobe/mindspore/free_benchmark/perturbation/add_noise.py +67 -0
  106. msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +21 -0
  107. msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +63 -0
  108. msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +51 -0
  109. msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +35 -0
  110. msprobe/mindspore/free_benchmark/perturbation/no_change.py +12 -0
  111. msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +29 -0
  112. msprobe/mindspore/free_benchmark/self_check_tool_factory.py +33 -0
  113. msprobe/mindspore/grad_probe/__init__.py +0 -0
  114. msprobe/mindspore/grad_probe/global_context.py +90 -0
  115. msprobe/mindspore/grad_probe/grad_analyzer.py +231 -0
  116. msprobe/mindspore/grad_probe/grad_monitor.py +27 -0
  117. msprobe/mindspore/grad_probe/grad_stat_csv.py +132 -0
  118. msprobe/mindspore/grad_probe/hook.py +94 -0
  119. msprobe/mindspore/grad_probe/utils.py +30 -0
  120. msprobe/mindspore/ms_config.py +128 -78
  121. msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +44 -45
  122. msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +34 -32
  123. msprobe/mindspore/runtime.py +4 -0
  124. msprobe/mindspore/service.py +378 -0
  125. msprobe/mindspore/task_handler_factory.py +24 -21
  126. msprobe/msprobe.py +105 -67
  127. msprobe/pytorch/__init__.py +4 -4
  128. msprobe/pytorch/api_accuracy_checker/common/config.py +53 -50
  129. msprobe/pytorch/api_accuracy_checker/common/utils.py +214 -224
  130. msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +213 -216
  131. msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +606 -545
  132. msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
  133. msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
  134. msprobe/pytorch/api_accuracy_checker/compare/compare.py +386 -345
  135. msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +73 -73
  136. msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +245 -248
  137. msprobe/pytorch/api_accuracy_checker/config.yaml +10 -4
  138. msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +335 -328
  139. msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +200 -203
  140. msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +133 -127
  141. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +592 -493
  142. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +70 -7
  143. msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
  144. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/__init__.py +0 -0
  145. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +197 -0
  146. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +325 -0
  147. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +204 -0
  148. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +219 -0
  149. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +10 -0
  150. msprobe/pytorch/bench_functions/__init__.py +15 -0
  151. msprobe/pytorch/bench_functions/apply_adam_w.py +28 -0
  152. msprobe/pytorch/bench_functions/confusion_transpose.py +19 -0
  153. msprobe/pytorch/bench_functions/fast_gelu.py +55 -0
  154. msprobe/pytorch/bench_functions/layer_norm_eval.py +6 -0
  155. msprobe/pytorch/bench_functions/linear.py +12 -0
  156. msprobe/pytorch/bench_functions/matmul_backward.py +48 -0
  157. msprobe/pytorch/bench_functions/npu_fusion_attention.py +509 -0
  158. msprobe/pytorch/bench_functions/rms_norm.py +15 -0
  159. msprobe/pytorch/bench_functions/rotary_mul.py +52 -0
  160. msprobe/pytorch/bench_functions/scaled_mask_softmax.py +26 -0
  161. msprobe/pytorch/bench_functions/swiglu.py +55 -0
  162. msprobe/pytorch/common/__init__.py +2 -2
  163. msprobe/pytorch/common/compare_script.template +14 -14
  164. msprobe/pytorch/common/log.py +20 -31
  165. msprobe/pytorch/common/parse_json.py +39 -37
  166. msprobe/pytorch/common/utils.py +305 -224
  167. msprobe/pytorch/compare/distributed_compare.py +66 -111
  168. msprobe/pytorch/compare/mapping.yaml +607 -607
  169. msprobe/pytorch/compare/match.py +34 -36
  170. msprobe/pytorch/compare/pt_compare.py +50 -0
  171. msprobe/pytorch/debugger/debugger_config.py +95 -86
  172. msprobe/pytorch/debugger/precision_debugger.py +125 -95
  173. msprobe/pytorch/free_benchmark/__init__.py +8 -8
  174. msprobe/pytorch/free_benchmark/common/constant.py +70 -67
  175. msprobe/pytorch/free_benchmark/common/counter.py +71 -71
  176. msprobe/pytorch/free_benchmark/common/enums.py +37 -37
  177. msprobe/pytorch/free_benchmark/common/params.py +129 -129
  178. msprobe/pytorch/free_benchmark/common/utils.py +102 -98
  179. msprobe/pytorch/free_benchmark/compare/grad_saver.py +179 -183
  180. msprobe/pytorch/free_benchmark/compare/single_benchmark.py +104 -104
  181. msprobe/pytorch/free_benchmark/main.py +105 -102
  182. msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +13 -13
  183. msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +41 -41
  184. msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +90 -90
  185. msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +104 -104
  186. msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +63 -63
  187. msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +68 -68
  188. msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +28 -28
  189. msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +45 -45
  190. msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +19 -19
  191. msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +217 -203
  192. msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +39 -39
  193. msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +23 -23
  194. msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +30 -31
  195. msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +170 -170
  196. msprobe/pytorch/function_factory.py +76 -0
  197. msprobe/pytorch/functional/dump_module.py +39 -39
  198. msprobe/pytorch/grad_probe/__init__.py +0 -0
  199. msprobe/pytorch/grad_probe/grad_monitor.py +91 -0
  200. msprobe/pytorch/grad_probe/grad_stat_csv.py +129 -0
  201. msprobe/pytorch/hook_module/api_registry.py +161 -161
  202. msprobe/pytorch/hook_module/hook_module.py +120 -109
  203. msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1876
  204. msprobe/pytorch/hook_module/utils.py +30 -29
  205. msprobe/pytorch/hook_module/wrap_aten.py +110 -100
  206. msprobe/pytorch/hook_module/wrap_distributed.py +78 -75
  207. msprobe/pytorch/hook_module/wrap_functional.py +105 -108
  208. msprobe/pytorch/hook_module/wrap_npu_custom.py +93 -73
  209. msprobe/pytorch/hook_module/wrap_tensor.py +71 -72
  210. msprobe/pytorch/hook_module/wrap_torch.py +86 -88
  211. msprobe/pytorch/hook_module/wrap_vf.py +62 -64
  212. msprobe/pytorch/module_processer.py +138 -98
  213. msprobe/pytorch/online_dispatch/__init__.py +20 -20
  214. msprobe/pytorch/online_dispatch/compare.py +236 -236
  215. msprobe/pytorch/online_dispatch/dispatch.py +271 -273
  216. msprobe/pytorch/online_dispatch/dump_compare.py +155 -186
  217. msprobe/pytorch/online_dispatch/single_compare.py +391 -391
  218. msprobe/pytorch/online_dispatch/torch_ops_config.yaml +49 -49
  219. msprobe/pytorch/online_dispatch/utils.py +130 -187
  220. msprobe/pytorch/parse.py +4 -4
  221. msprobe/pytorch/parse_tool/cli.py +32 -32
  222. msprobe/pytorch/parse_tool/lib/compare.py +260 -259
  223. msprobe/pytorch/parse_tool/lib/config.py +52 -51
  224. msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
  225. msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
  226. msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
  227. msprobe/pytorch/parse_tool/lib/parse_tool.py +158 -158
  228. msprobe/pytorch/parse_tool/lib/utils.py +316 -367
  229. msprobe/pytorch/parse_tool/lib/visualization.py +85 -90
  230. msprobe/pytorch/pt_config.py +188 -93
  231. msprobe/pytorch/service.py +246 -167
  232. mindstudio_probe-1.0.1.dist-info/RECORD +0 -228
  233. msprobe/config/README.md +0 -397
  234. msprobe/mindspore/doc/dump.md +0 -65
  235. msprobe/mindspore/dump/api_kbk_dump.py +0 -55
  236. msprobe/pytorch/compare/acc_compare.py +0 -1024
  237. msprobe/pytorch/compare/highlight.py +0 -100
  238. msprobe/pytorch/doc/FAQ.md +0 -193
  239. msprobe/pytorch/doc/api_accuracy_checker.md +0 -269
  240. msprobe/pytorch/doc/atat/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -182
  241. msprobe/pytorch/doc/dump.md +0 -207
  242. msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -176
  243. msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
  244. msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
  245. msprobe/pytorch/doc/run_overflow_check.md +0 -25
  246. msprobe/pytorch/doc//321/205/320/254/320/270/321/207/342/225/221/342/224/220/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/206/320/277/320/244/321/205/320/277/342/225/243.md +0 -90
  247. msprobe/test/core_ut/common/test_utils.py +0 -345
  248. msprobe/test/core_ut/data_dump/test_data_collector.py +0 -47
  249. msprobe/test/core_ut/data_dump/test_json_writer.py +0 -183
  250. msprobe/test/core_ut/data_dump/test_scope.py +0 -151
  251. msprobe/test/core_ut/test_common_config.py +0 -152
  252. msprobe/test/core_ut/test_file_check.py +0 -218
  253. msprobe/test/core_ut/test_log.py +0 -109
  254. msprobe/test/mindspore_ut/test_api_kbk_dump.py +0 -51
  255. msprobe/test/mindspore_ut/test_debugger_config.py +0 -42
  256. msprobe/test/mindspore_ut/test_dump_tool_factory.py +0 -51
  257. msprobe/test/mindspore_ut/test_kernel_graph_dump.py +0 -66
  258. msprobe/test/mindspore_ut/test_kernel_graph_overflow_check.py +0 -63
  259. msprobe/test/mindspore_ut/test_ms_config.py +0 -69
  260. msprobe/test/mindspore_ut/test_overflow_check_tool_factory.py +0 -51
  261. msprobe/test/mindspore_ut/test_precision_debugger.py +0 -56
  262. msprobe/test/mindspore_ut/test_task_handler_factory.py +0 -58
  263. msprobe/test/pytorch_ut/advisor/test_advisor.py +0 -83
  264. msprobe/test/pytorch_ut/api_accuracy_checker/common/test_common_utils.py +0 -108
  265. msprobe/test/pytorch_ut/api_accuracy_checker/common/test_config.py +0 -39
  266. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_algorithm.py +0 -112
  267. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_api_precision_compare.py +0 -77
  268. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare.py +0 -125
  269. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_column.py +0 -10
  270. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_utils.py +0 -43
  271. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/dump.json +0 -179
  272. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/forward.json +0 -63
  273. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_data_generate.py +0 -99
  274. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_multi_run_ut.py +0 -115
  275. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_run_ut.py +0 -72
  276. msprobe/test/pytorch_ut/compare/test_acc_compare.py +0 -17
  277. msprobe/test/pytorch_ut/free_benchmark/perturbed_layers/test_perturbed_layser.py +0 -105
  278. msprobe/test/pytorch_ut/free_benchmark/result_handlers/test_result_handler.py +0 -121
  279. msprobe/test/pytorch_ut/free_benchmark/test_main.py +0 -101
  280. msprobe/test/pytorch_ut/functional/test_dump_module.py +0 -15
  281. msprobe/test/pytorch_ut/hook_module/test_api_registry.py +0 -130
  282. msprobe/test/pytorch_ut/hook_module/test_hook_module.py +0 -42
  283. msprobe/test/pytorch_ut/hook_module/test_wrap_aten.py +0 -65
  284. msprobe/test/pytorch_ut/hook_module/test_wrap_distributed.py +0 -35
  285. msprobe/test/pytorch_ut/hook_module/test_wrap_functional.py +0 -20
  286. msprobe/test/pytorch_ut/hook_module/test_wrap_tensor.py +0 -35
  287. msprobe/test/pytorch_ut/hook_module/test_wrap_torch.py +0 -43
  288. msprobe/test/pytorch_ut/hook_module/test_wrap_vf.py +0 -11
  289. msprobe/test/pytorch_ut/test_pt_config.py +0 -69
  290. msprobe/test/pytorch_ut/test_service.py +0 -59
  291. msprobe/test/resources/advisor.txt +0 -3
  292. msprobe/test/resources/compare_result_20230703104808.csv +0 -9
  293. msprobe/test/resources/compare_result_without_accuracy.csv +0 -9
  294. msprobe/test/resources/config.yaml +0 -3
  295. msprobe/test/resources/npu_test.pkl +0 -8
  296. msprobe/test/run_test.sh +0 -30
  297. msprobe/test/run_ut.py +0 -58
  298. msprobe/test/test_module_processer.py +0 -64
  299. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/top_level.txt +0 -0
  300. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
  301. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
  302. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
  303. /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
  304. /msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
  305. /msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
  306. /msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
  307. /msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
  308. /msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
  309. /msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
  310. /msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
  311. /msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
  312. /msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
  313. /msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
  314. /msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
  315. /msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
  316. /msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
  317. /msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
  318. /msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
  319. /msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
  320. /msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
  321. /msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
  322. /msprobe/{config → docs}/img/free_benchmark.png +0 -0
  323. /msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0
@@ -1,50 +1,53 @@
1
- import os
2
- import yaml
3
- from msprobe.pytorch.api_accuracy_checker.common.utils import check_file_or_directory_path
4
- from msprobe.pytorch.hook_module.utils import WrapFunctionalOps, WrapTensorOps, WrapTorchOps
5
- from msprobe.core.common.file_check import FileOpen
6
-
7
- WrapApi = set(WrapFunctionalOps) | set(WrapTensorOps) | set(WrapTorchOps)
8
-
9
-
10
- class Config:
11
- def __init__(self, yaml_file):
12
- check_file_or_directory_path(yaml_file, False)
13
- with FileOpen(yaml_file, 'r') as file:
14
- config = yaml.safe_load(file)
15
- self.config = {key: self.validate(key, value) for key, value in config.items()}
16
-
17
- def __getattr__(self, item):
18
- return self.config[item]
19
-
20
- def __str__(self):
21
- return '\n'.join(f"{key}={value}" for key, value in self.config.items())
22
-
23
- @staticmethod
24
- def validate(key, value):
25
- validators = {
26
- 'white_list': list,
27
- 'error_data_path': str,
28
- 'precision': int
29
- }
30
- if key not in validators:
31
- raise ValueError(f"{key} must be one of {validators.keys()}")
32
- if not isinstance(value, validators.get(key)):
33
- raise ValueError(f"{key} must be {validators[key].__name__} type")
34
- if key == 'precision' and value < 0:
35
- raise ValueError("precision must be greater than 0")
36
- if key == 'white_list':
37
- if not isinstance(value, list):
38
- raise ValueError("white_list must be a list type")
39
- if not all(isinstance(i, str) for i in value):
40
- raise ValueError("All elements in white_list must be of str type")
41
- invalid_api = [i for i in value if i not in WrapApi]
42
- if invalid_api:
43
- raise ValueError(
44
- f"{', '.join(invalid_api)} is not in support_wrap_ops.yaml, please check the white_list")
45
- return value
46
-
47
-
48
- cur_path = os.path.dirname(os.path.dirname(os.path.realpath(__file__)))
49
- yaml_path = os.path.join(cur_path, "config.yaml")
50
- msCheckerConfig = Config(yaml_path)
1
+ import os
2
+ from msprobe.core.common.file_utils import load_yaml, check_file_or_directory_path
3
+ from msprobe.pytorch.pt_config import RunUTConfig
4
+
5
+
6
+ class Config:
7
+ def __init__(self, yaml_file):
8
+ check_file_or_directory_path(yaml_file, False)
9
+ config = load_yaml(yaml_file)
10
+ self.config = {key: self.validate(key, value) for key, value in config.items()}
11
+
12
+ def __getattr__(self, item):
13
+ return self.config[item]
14
+
15
+ def __str__(self):
16
+ return '\n'.join(f"{key}={value}" for key, value in self.config.items())
17
+
18
+ @staticmethod
19
+ def validate(key, value):
20
+ validators = {
21
+ 'white_list': list,
22
+ 'black_list': list,
23
+ 'error_data_path': str,
24
+ 'precision': int,
25
+ 'is_online': bool,
26
+ 'nfs_path': str,
27
+ 'host': str,
28
+ 'port': int,
29
+ 'rank_list': list,
30
+ 'tls_path': str
31
+ }
32
+ if key not in validators:
33
+ raise ValueError(f"{key} must be one of {validators.keys()}")
34
+ if not isinstance(value, validators.get(key)):
35
+ raise ValueError(f"{key} must be {validators[key].__name__} type")
36
+ if key == 'precision' and value < 0:
37
+ raise ValueError("precision must be greater than 0")
38
+ if key == 'white_list':
39
+ RunUTConfig.check_filter_list_config(key, value)
40
+ if key == 'black_list':
41
+ RunUTConfig.check_filter_list_config(key, value)
42
+ if key == 'error_data_path':
43
+ RunUTConfig.check_error_data_path_config(value)
44
+ if key == 'nfs_path':
45
+ RunUTConfig.check_nfs_path_config(value)
46
+ if key == 'tls_path':
47
+ RunUTConfig.check_tls_path_config(value)
48
+ return value
49
+
50
+
51
+ cur_path = os.path.dirname(os.path.dirname(os.path.realpath(__file__)))
52
+ yaml_path = os.path.join(cur_path, "config.yaml")
53
+ msCheckerConfig = Config(yaml_path)
@@ -1,224 +1,214 @@
1
- #!/usr/bin/env python3
2
- # -*- coding: utf-8 -*-
3
- """
4
- # Copyright (C) 2023-2023. Huawei Technologies Co., Ltd. All rights reserved.
5
- # Licensed under the Apache License, Version 2.0 (the "License");
6
- # you may not use this file except in compliance with the License.
7
- # You may obtain a copy of the License at
8
- #
9
- # http://www.apache.org/licenses/LICENSE-2.0
10
- #
11
- # Unless required by applicable law or agreed to in writing, software
12
- # distributed under the License is distributed on an "AS IS" BASIS,
13
- # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
- # See the License for the specific language governing permissions and
15
- # limitations under the License.
16
- """
17
- import json
18
- import os
19
- import re
20
- import csv
21
-
22
- import torch
23
-
24
- try:
25
- import torch_npu
26
- except ImportError:
27
- IS_GPU = True
28
- else:
29
- IS_GPU = False
30
-
31
- from msprobe.pytorch.common.log import logger
32
- from msprobe.core.common.file_check import FileChecker, FileOpen, change_mode, create_directory
33
- from msprobe.core.common.const import Const, FileCheckConst
34
- from msprobe.core.common.utils import CompareException
35
-
36
-
37
- class DumpException(CompareException):
38
- pass
39
-
40
-
41
- def write_csv(data, filepath):
42
- with FileOpen(filepath, 'a', encoding='utf-8-sig') as f:
43
- writer = csv.writer(f)
44
- writer.writerows(data)
45
-
46
-
47
- def check_object_type(check_object, allow_type):
48
- """
49
- Function Description:
50
- Check if the object belongs to a certain data type
51
- Parameter:
52
- check_object: the object to be checked
53
- allow_type: legal data type
54
- Exception Description:
55
- when invalid data throw exception
56
- """
57
- if not isinstance(check_object, allow_type):
58
- logger.error(f"{check_object} not of {allow_type} type")
59
- raise CompareException(CompareException.INVALID_DATA_ERROR)
60
-
61
-
62
- def check_file_or_directory_path(path, isdir=False):
63
- """
64
- Function Description:
65
- check whether the path is valid
66
- Parameter:
67
- path: the path to check
68
- isdir: the path is dir or file
69
- Exception Description:
70
- when invalid data throw exception
71
- """
72
- if isdir:
73
- if not os.path.exists(path):
74
- logger.error('The path {} is not exist.'.format(path))
75
- raise CompareException(CompareException.INVALID_PATH_ERROR)
76
-
77
- if not os.path.isdir(path):
78
- logger.error('The path {} is not a directory.'.format(path))
79
- raise CompareException(CompareException.INVALID_PATH_ERROR)
80
-
81
- if not os.access(path, os.W_OK):
82
- logger.error(
83
- 'The path {} does not have permission to write. Please check the path permission'.format(path))
84
- raise CompareException(CompareException.INVALID_PATH_ERROR)
85
- else:
86
- if not os.path.isfile(path):
87
- logger.error('{} is an invalid file or non-exist.'.format(path))
88
- raise CompareException(CompareException.INVALID_PATH_ERROR)
89
-
90
- if not os.access(path, os.R_OK):
91
- logger.error(
92
- 'The path {} does not have permission to read. Please check the path permission'.format(path))
93
- raise CompareException(CompareException.INVALID_PATH_ERROR)
94
-
95
-
96
- def get_json_contents(file_path):
97
- ops = get_file_content_bytes(file_path)
98
- try:
99
- json_obj = json.loads(ops)
100
- except ValueError as error:
101
- logger.error('Failed to load "%s". %s' % (file_path, str(error)))
102
- raise CompareException(CompareException.INVALID_FILE_ERROR) from error
103
- if not isinstance(json_obj, dict):
104
- logger.error('Json file %s, content is not a dictionary!' % file_path)
105
- raise CompareException(CompareException.INVALID_FILE_ERROR)
106
- return json_obj
107
-
108
-
109
- def get_file_content_bytes(file):
110
- with FileOpen(file, 'rb') as file_handle:
111
- return file_handle.read()
112
-
113
-
114
- class SoftlinkCheckException(Exception):
115
- pass
116
-
117
-
118
- def check_need_convert(api_name):
119
- convert_type = None
120
- for key, value in Const.CONVERT_API.items():
121
- if api_name not in value:
122
- continue
123
- else:
124
- convert_type = key
125
- return convert_type
126
-
127
-
128
- def api_info_preprocess(api_name, api_info_dict):
129
- """
130
- Function Description:
131
- Preprocesses the API information.
132
- Parameter:
133
- api_name: Name of the API.
134
- api_info_dict: argument of the API.
135
- Return api_info_dict:
136
- convert_type: Type of conversion.
137
- api_info_dict: Processed argument of the API.
138
- """
139
- convert_type = check_need_convert(api_name)
140
- if api_name == 'cross_entropy':
141
- api_info_dict = cross_entropy_process(api_info_dict)
142
- return convert_type, api_info_dict
143
-
144
-
145
- def cross_entropy_process(api_info_dict):
146
- """
147
- Function Description:
148
- Preprocesses the cross_entropy API information.
149
- Parameter:
150
- api_info_dict: argument of the API.
151
- Return api_info_dict:
152
- api_info_dict: Processed argument of the API.
153
- """
154
- if 'args' in api_info_dict and len(api_info_dict['args']) > 1 and 'Min' in api_info_dict['args'][1]:
155
- if api_info_dict['args'][1]['Min'] <= 0:
156
- # The second argument in cross_entropy should be -100 or not less than 0
157
- api_info_dict['args'][1]['Min'] = 0
158
- return api_info_dict
159
-
160
-
161
- def initialize_save_path(save_path, dir_name):
162
- data_path = os.path.join(save_path, dir_name)
163
- if os.path.exists(data_path):
164
- logger.warning(f"{data_path} already exists, it will be overwritten")
165
- else:
166
- os.mkdir(data_path, mode=FileCheckConst.DATA_DIR_AUTHORITY)
167
- data_path_checker = FileChecker(data_path, FileCheckConst.DIR)
168
- data_path_checker.common_check()
169
-
170
-
171
- def write_pt(file_path, tensor):
172
- if os.path.exists(file_path):
173
- raise ValueError(f"File {file_path} already exists")
174
- torch.save(tensor, file_path)
175
- full_path = os.path.realpath(file_path)
176
- change_mode(full_path, FileCheckConst.DATA_FILE_AUTHORITY)
177
- return full_path
178
-
179
-
180
- def get_real_data_path(file_path):
181
- targets = ['forward_real_data', 'backward_real_data', 'ut_error_data\d+']
182
- pattern = re.compile(r'({})'.format('|'.join(targets)))
183
- match = pattern.search(file_path)
184
- if match:
185
- target_index = match.start()
186
- target_path = file_path[target_index:]
187
- return target_path
188
- else:
189
- raise DumpException(DumpException.INVALID_PATH_ERROR)
190
-
191
-
192
- def get_full_data_path(data_path, real_data_path):
193
- if not data_path:
194
- return data_path
195
- full_data_path = os.path.join(real_data_path, data_path)
196
- return os.path.realpath(full_data_path)
197
-
198
-
199
class UtDataProcessor:
    """
    Walks a possibly nested API argument structure and writes every tensor found in
    it to <save_path>/<api_name><SEP><index>.pt. Every leaf, tensor or not, uses up
    one index.
    """

    def __init__(self, save_path):
        self.index = 0
        self.save_path = save_path

    def save_tensors_in_element(self, api_name, element):
        """Restart the leaf counter and save all tensors contained in element."""
        self.index = 0
        self._save_recursive(api_name, element)

    def _save_recursive(self, api_name, element):
        """Descend into lists, tuples and dict values; save tensors; count each leaf."""
        if isinstance(element, (list, tuple)):
            for child in element:
                self._save_recursive(api_name, child)
            return
        if isinstance(element, dict):
            for child in element.values():
                self._save_recursive(api_name, child)
            return
        if isinstance(element, torch.Tensor):
            api_args = api_name + Const.SEP + str(self.index)
            create_directory(self.save_path)
            file_path = os.path.join(self.save_path, f'{api_args}.pt')
            write_pt(file_path, element.contiguous().cpu().detach())
        # Tensors, None, scalars and any other object each consume one index.
        self.index += 1
1
+ #!/usr/bin/env python3
2
+ # -*- coding: utf-8 -*-
3
+ """
4
+ # Copyright (C) 2023-2023. Huawei Technologies Co., Ltd. All rights reserved.
5
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
+ # you may not use this file except in compliance with the License.
7
+ # You may obtain a copy of the License at
8
+ #
9
+ # http://www.apache.org/licenses/LICENSE-2.0
10
+ #
11
+ # Unless required by applicable law or agreed to in writing, software
12
+ # distributed under the License is distributed on an "AS IS" BASIS,
13
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
+ # See the License for the specific language governing permissions and
15
+ # limitations under the License.
16
+ """
17
+ import os
18
+ import re
19
+ from collections import namedtuple
20
+
21
+ import torch
22
+
23
+ try:
24
+ import torch_npu
25
+ except ImportError:
26
+ IS_GPU = True
27
+ else:
28
+ IS_GPU = False
29
+
30
+ from msprobe.pytorch.common.log import logger
31
+ from msprobe.pytorch.common.utils import save_pt
32
+ from msprobe.core.common.file_utils import create_directory
33
+ from msprobe.core.common.const import Const
34
+ from msprobe.core.common.utils import CompareException
35
+
36
# Record describing one captured API call; every field has a default, so ApiData()
# is valid on its own.
ApiData = namedtuple(
    'ApiData',
    ('name', 'args', 'kwargs', 'result', 'step', 'rank'),
    defaults=('unknown', None, None, None, 0, 0),
)
38
+
39
+
40
class DumpException(CompareException):
    """Exception type used by the dump helpers; adds nothing to CompareException."""
42
+
43
+
44
def check_object_type(check_object, allow_type):
    """
    Function Description:
        Verify that an object is an instance of the permitted type(s).
    Parameter:
        check_object: the object to be checked
        allow_type: legal data type (anything accepted by isinstance)
    Exception Description:
        logs an error and raises CompareException(INVALID_DATA_ERROR) on a mismatch
    """
    if isinstance(check_object, allow_type):
        return
    logger.error(f"{check_object} not of {allow_type} type")
    raise CompareException(CompareException.INVALID_DATA_ERROR)
57
+
58
+
59
class SoftlinkCheckException(Exception):
    """Marker exception; presumably raised when a soft-link check fails (raiser not visible here)."""
61
+
62
+
63
def check_need_convert(api_name):
    """
    Function Description:
        Look up which conversion type, if any, is registered for an API.
    Parameter:
        api_name: Name of the API.
    Return:
        The key of Const.CONVERT_API whose value contains api_name, or None when
        there is none. If several keys match, the last one in iteration order wins.
    """
    matching_keys = [key for key, value in Const.CONVERT_API.items() if api_name in value]
    return matching_keys[-1] if matching_keys else None
71
+
72
+
73
def api_info_preprocess(api_name, api_info_dict):
    """
    Function Description:
        Preprocesses the API information.
    Parameter:
        api_name: Name of the API.
        api_info_dict: argument of the API.
    Return:
        convert_type: Type of conversion reported by check_need_convert.
        api_info_dict: Processed argument of the API (only 'cross_entropy' is adjusted).
    """
    convert_type = check_need_convert(api_name)
    if api_name != 'cross_entropy':
        return convert_type, api_info_dict
    return convert_type, cross_entropy_process(api_info_dict)
88
+
89
+
90
def cross_entropy_process(api_info_dict):
    """
    Function Description:
        Preprocesses the cross_entropy API information: a non-positive 'Min'
        statistic on the second entry of 'input_args' is reset to 0.
    Parameter:
        api_info_dict: argument of the API. It is modified in place.
    Return:
        api_info_dict: Processed argument of the API (the same object that was passed in).
    """
    if 'input_args' not in api_info_dict:
        return api_info_dict
    input_args = api_info_dict['input_args']
    if len(input_args) < 2:
        return api_info_dict

    target_info = input_args[1]
    # Entries that are not dicts (None, scalars, nested lists) carry no 'Min'
    # statistic; skipping them avoids a TypeError from the membership test.
    if not isinstance(target_info, dict):
        return api_info_dict

    min_value = target_info.get('Min')
    # A 'Min' of None cannot be ordered against 0, so leave it alone.
    if min_value is not None and min_value <= 0:
        # The second argument in cross_entropy should be -100 or not less than 0
        target_info['Min'] = 0
    return api_info_dict
104
+
105
+
106
def initialize_save_path(save_path, dir_name):
    """
    Function Description:
        Create the directory <save_path>/<dir_name> through create_directory.
    Parameter:
        save_path: parent directory.
        dir_name: name of the sub-directory.
    Return:
        The joined directory path.
    """
    target_dir = os.path.join(save_path, dir_name)
    create_directory(target_dir)
    return target_dir
110
+
111
+
112
def get_real_data_path(file_path):
    """
    Function Description:
        Strip everything in front of the first real-data directory marker
        (forward_real_data, backward_real_data or ut_error_data<digits>).
    Parameter:
        file_path: path string that is expected to contain one of the markers.
    Return:
        The part of file_path that starts at the leftmost marker.
    Exception Description:
        DumpException(DumpException.INVALID_PATH_ERROR) when no marker is present.
    """
    # r'...' keeps the backslash of \d literal; in a non-raw string it is an invalid
    # escape sequence that newer Python versions warn about at compile time.
    targets = ['forward_real_data', 'backward_real_data', r'ut_error_data\d+']
    pattern = re.compile(r'({})'.format('|'.join(targets)))
    match = pattern.search(file_path)
    if match:
        return file_path[match.start():]
    raise DumpException(DumpException.INVALID_PATH_ERROR)
122
+
123
+
124
def get_full_data_path(data_path, real_data_path):
    """
    Function Description:
        Build the real path of a data file located under real_data_path.
    Parameter:
        data_path: relative data path; returned as is when it is empty or None.
        real_data_path: base directory that data_path is joined to.
    Return:
        os.path.realpath of the joined path, or the falsy data_path unchanged.
    """
    if not data_path:
        return data_path
    joined = os.path.join(real_data_path, data_path)
    resolved = os.path.realpath(joined)
    return resolved
129
+
130
+
131
class UtDataProcessor:
    """
    Saves every tensor contained in a possibly nested API argument structure as
    <save_path>/<api_name><SEP><index>.pt. The index advances once per leaf value,
    whether or not that leaf is a tensor.
    """

    def __init__(self, save_path):
        self.index = 0
        self.save_path = save_path

    def save_tensors_in_element(self, api_name, element):
        """Reset the leaf index and save all tensors found inside element."""
        self.index = 0
        self._save_recursive(api_name, element)

    def _save_tensor(self, api_name, element):
        """Move one tensor to the CPU and write it to its indexed .pt file."""
        api_args = api_name + Const.SEP + str(self.index)
        create_directory(self.save_path)
        file_path = os.path.join(self.save_path, f'{api_args}.pt')
        try:
            tensor = element.contiguous().detach().cpu()
        except Exception as err:
            # Any failure while copying to the CPU is reported as an invalid-data dump error.
            logger.error(f"Failed to transfer tensor to cpu for {api_args}")
            raise DumpException(DumpException.INVALID_DATA_ERROR) from err
        save_pt(tensor, file_path)

    def _save_recursive(self, api_name, element):
        """Descend into lists, tuples and dict values; every other value is a leaf."""
        if isinstance(element, (list, tuple)):
            for child in element:
                self._save_recursive(api_name, child)
            return
        if isinstance(element, dict):
            for child in element.values():
                self._save_recursive(api_name, child)
            return
        if isinstance(element, torch.Tensor):
            self._save_tensor(api_name, element)
        # Each leaf (tensor, None, scalar, str, slice or unknown object) uses one index.
        self.index += 1
162
+
163
+
164
def extract_basic_api_segments(api_full_name):
    """
    Function Description:
        Split a full API name into its type and its name.
    Parameter:
        api_full_name: Full name of the API. Example: torch.matmul.0, torch.linalg.inv.0
    Return:
        api_type: Type of api. Example: torch, tensor, etc.
        api_name: Name of api. Example: matmul, linalg.inv, etc.
        Both are None when the name has neither three nor four segments.
    """
    segments = api_full_name.split(Const.SEP)
    segment_count = len(segments)
    if segment_count == Const.THREE_SEGMENT:
        api_type, api_name, _ = segments
        return api_type, api_name
    if segment_count == Const.FOUR_SEGMENT:
        api_type, prefix, short_name, _ = segments
        # The name of a four-segment API keeps its sub-module prefix (e.g. linalg.inv).
        return api_type, Const.SEP.join([prefix, short_name])
    return None, None
185
+
186
+
187
def extract_detailed_api_segments(full_api_name_with_direction_status):
    """
    Function Description:
        Split a fully qualified dump entry name into the API name, the full API name
        and the direction.
    Parameter:
        full_api_name_with_direction_status: Full name of the API. Example: torch.matmul.0.forward.output.0
    Return:
        api_name: Name of api. Example: matmul, mul, etc.
        full_api_name: Full name of api. Example: torch.matmul.0
        direction_status: Direction status of api. Example: forward, backward, etc.
        All three are None when the name has neither six nor seven segments.
    """
    segments = full_api_name_with_direction_status.split(Const.SEP)
    segment_count = len(segments)
    if segment_count == Const.SIX_SEGMENT:
        api_type, api_name, api_order, direction_status, _, _ = segments
        full_api_name = Const.SEP.join([api_type, api_name, api_order])
        return api_name, full_api_name, direction_status
    if segment_count == Const.SEVEN_SEGMENT:
        api_type, prefix, short_name, api_order, direction_status, _, _ = segments
        full_api_name = Const.SEP.join([api_type, prefix, short_name, api_order])
        # The API name of a seven-segment entry keeps its sub-module prefix.
        return Const.SEP.join([prefix, short_name]), full_api_name, direction_status
    return None, None, None
214
+