mindstudio-probe 1.0.4__tar.gz → 1.1.1__tar.gz

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (408)
  1. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/PKG-INFO +14 -3
  2. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/PKG-INFO +14 -3
  3. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/SOURCES.txt +74 -9
  4. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/entry_points.txt +0 -1
  5. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/requires.txt +2 -0
  6. mindstudio_probe-1.1.1/msprobe/README.md +167 -0
  7. mindstudio_probe-1.1.1/msprobe/__init__.py +16 -0
  8. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/config.json +1 -5
  9. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/advisor/advisor.py +16 -11
  10. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/advisor/advisor_const.py +6 -7
  11. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/advisor/advisor_result.py +12 -12
  12. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/common/const.py +164 -3
  13. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/common/exceptions.py +26 -4
  14. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/common/file_utils.py +196 -27
  15. mindstudio_probe-1.1.1/msprobe/core/common/inplace_op_checker.py +53 -0
  16. mindstudio_probe-1.1.1/msprobe/core/common/inplace_ops.yaml +251 -0
  17. mindstudio_probe-1.1.1/msprobe/core/common/log.py +104 -0
  18. mindstudio_probe-1.1.1/msprobe/core/common/utils.py +484 -0
  19. mindstudio_probe-1.1.1/msprobe/core/common_config.py +107 -0
  20. mindstudio_probe-1.1.1/msprobe/core/compare/acc_compare.py +538 -0
  21. mindstudio_probe-1.1.1/msprobe/core/compare/check.py +177 -0
  22. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/compare/compare_cli.py +42 -5
  23. mindstudio_probe-1.1.1/msprobe/core/compare/highlight.py +328 -0
  24. mindstudio_probe-1.1.1/msprobe/core/compare/layer_mapping/__init__.py +19 -0
  25. mindstudio_probe-1.1.1/msprobe/core/compare/layer_mapping/data_scope_parser.py +235 -0
  26. mindstudio_probe-1.1.1/msprobe/core/compare/layer_mapping/layer_mapping.py +242 -0
  27. mindstudio_probe-1.1.1/msprobe/core/compare/layer_mapping/postprocess_pass.py +94 -0
  28. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/compare/multiprocessing_compute.py +33 -8
  29. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/compare/npy_compare.py +73 -29
  30. mindstudio_probe-1.1.1/msprobe/core/compare/utils.py +489 -0
  31. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/data_dump/data_collector.py +44 -43
  32. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/data_dump/data_processor/base.py +88 -35
  33. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/data_dump/data_processor/factory.py +20 -3
  34. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/data_dump/data_processor/mindspore_processor.py +14 -8
  35. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/data_dump/data_processor/pytorch_processor.py +180 -66
  36. mindstudio_probe-1.1.1/msprobe/core/data_dump/json_writer.py +117 -0
  37. mindstudio_probe-1.1.1/msprobe/core/data_dump/scope.py +273 -0
  38. mindstudio_probe-1.1.1/msprobe/core/grad_probe/constant.py +89 -0
  39. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/grad_probe/grad_compare.py +20 -4
  40. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/grad_probe/utils.py +44 -3
  41. mindstudio_probe-1.1.1/msprobe/core/overflow_check/abnormal_scene.py +185 -0
  42. mindstudio_probe-1.1.1/msprobe/core/overflow_check/api_info.py +55 -0
  43. mindstudio_probe-1.1.1/msprobe/core/overflow_check/checker.py +138 -0
  44. mindstudio_probe-1.1.1/msprobe/core/overflow_check/filter.py +157 -0
  45. mindstudio_probe-1.1.1/msprobe/core/overflow_check/ignore_rules.yaml +55 -0
  46. mindstudio_probe-1.1.1/msprobe/core/overflow_check/level.py +22 -0
  47. mindstudio_probe-1.1.1/msprobe/core/overflow_check/utils.py +28 -0
  48. mindstudio_probe-1.1.1/msprobe/docs/01.installation.md +109 -0
  49. mindstudio_probe-1.1.1/msprobe/docs/02.config_introduction.md +164 -0
  50. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/03.config_examples.md +3 -20
  51. mindstudio_probe-1.1.1/msprobe/docs/04.kernel_dump_PyTorch.md +73 -0
  52. mindstudio_probe-1.1.1/msprobe/docs/05.data_dump_PyTorch.md +328 -0
  53. mindstudio_probe-1.1.1/msprobe/docs/06.data_dump_MindSpore.md +352 -0
  54. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/07.accuracy_checker_PyTorch.md +69 -46
  55. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/08.accuracy_checker_online_PyTorch.md +52 -17
  56. mindstudio_probe-1.1.1/msprobe/docs/09.accuracy_checker_MindSpore.md +104 -0
  57. mindstudio_probe-1.1.1/msprobe/docs/10.accuracy_compare_PyTorch.md +333 -0
  58. mindstudio_probe-1.1.1/msprobe/docs/11.accuracy_compare_MindSpore.md +424 -0
  59. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/12.overflow_check_PyTorch.md +1 -1
  60. mindstudio_probe-1.1.1/msprobe/docs/13.overflow_check_MindSpore.md +31 -0
  61. mindstudio_probe-1.1.1/msprobe/docs/15.free_benchmarking_PyTorch.md +169 -0
  62. mindstudio_probe-1.1.1/msprobe/docs/16.free_benchmarking_MindSpore.md +159 -0
  63. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/17.grad_probe.md +19 -22
  64. mindstudio_probe-1.1.1/msprobe/docs/18.online_dispatch.md +89 -0
  65. mindstudio_probe-1.1.1/msprobe/docs/19.monitor.md +468 -0
  66. mindstudio_probe-1.1.1/msprobe/docs/20.monitor_performance_baseline.md +52 -0
  67. mindstudio_probe-1.1.1/msprobe/docs/21.visualization_PyTorch.md +386 -0
  68. mindstudio_probe-1.1.1/msprobe/docs/22.visualization_MindSpore.md +384 -0
  69. mindstudio_probe-1.1.1/msprobe/docs/23.tool_function_introduction.md +28 -0
  70. mindstudio-probe-1.0.4/msprobe/docs/FAQ_PyTorch.md → mindstudio_probe-1.1.1/msprobe/docs/FAQ.md +25 -10
  71. mindstudio_probe-1.1.1/msprobe/docs/data_dump_Mindspore/dynamic_graph_quick_start_example.md +211 -0
  72. mindstudio_probe-1.1.1/msprobe/docs/img/compare_result.png +0 -0
  73. mindstudio_probe-1.1.1/msprobe/docs/img/monitor/cpu_info.png +0 -0
  74. mindstudio_probe-1.1.1/msprobe/docs/img/ms_dump.png +0 -0
  75. mindstudio_probe-1.1.1/msprobe/docs/img/ms_layer.png +0 -0
  76. mindstudio_probe-1.1.1/msprobe/docs/img/pt_dump.png +0 -0
  77. mindstudio_probe-1.1.1/msprobe/mindspore/__init__.py +17 -0
  78. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +247 -0
  79. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/api_info.py +27 -5
  80. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/api_runner.py +43 -18
  81. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +21 -7
  82. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +77 -0
  83. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/cmd_parser.py +68 -0
  84. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/compute_element.py +59 -24
  85. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/data_manager.py +264 -0
  86. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/main.py +33 -0
  87. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +206 -0
  88. mindstudio_probe-1.1.1/msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +58 -0
  89. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/type_mapping.py +22 -5
  90. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/utils.py +34 -17
  91. mindstudio_probe-1.1.1/msprobe/mindspore/cell_processor.py +79 -0
  92. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/common/const.py +35 -13
  93. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/common/log.py +5 -9
  94. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/common/utils.py +60 -5
  95. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/compare/distributed_compare.py +15 -28
  96. mindstudio_probe-1.1.1/msprobe/mindspore/compare/ms_compare.py +380 -0
  97. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/compare/ms_graph_compare.py +99 -49
  98. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/debugger/debugger_config.py +20 -14
  99. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/debugger/precision_debugger.py +43 -13
  100. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/dump_tool_factory.py +18 -1
  101. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/hook_cell/api_registry.py +23 -3
  102. mindstudio_probe-1.1.1/msprobe/mindspore/dump/hook_cell/primitive_hooks.py +203 -0
  103. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +107 -10
  104. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/hook_cell/wrap_api.py +21 -13
  105. mindstudio_probe-1.1.1/msprobe/mindspore/dump/jit_dump.py +108 -0
  106. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/kernel_graph_dump.py +19 -5
  107. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/kernel_kbyk_dump.py +19 -6
  108. mindstudio_probe-1.1.1/msprobe/mindspore/dym_loader/hook_dynamic_loader.cc +140 -0
  109. mindstudio_probe-1.1.1/msprobe/mindspore/dym_loader/hook_dynamic_loader.h +53 -0
  110. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/api_pynative_self_check.py +237 -0
  111. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/common/config.py +27 -0
  112. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/common/handler_params.py +31 -0
  113. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/common/utils.py +37 -8
  114. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -204
  115. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/handler/base_handler.py +20 -5
  116. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/handler/check_handler.py +21 -7
  117. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/handler/fix_handler.py +18 -3
  118. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/handler/handler_factory.py +36 -0
  119. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/perturbation/add_noise.py +23 -8
  120. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +45 -0
  121. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +25 -10
  122. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +77 -0
  123. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +29 -8
  124. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/perturbation/no_change.py +27 -0
  125. mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +44 -0
  126. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/self_check_tool_factory.py +17 -2
  127. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/grad_probe/global_context.py +44 -14
  128. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/grad_probe/grad_analyzer.py +27 -13
  129. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/grad_probe/grad_monitor.py +16 -1
  130. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/grad_probe/grad_stat_csv.py +33 -5
  131. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/grad_probe/hook.py +24 -10
  132. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/grad_probe/utils.py +18 -5
  133. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/ms_config.py +22 -15
  134. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +20 -6
  135. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +15 -0
  136. mindstudio_probe-1.1.1/msprobe/mindspore/runtime.py +19 -0
  137. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/service.py +75 -150
  138. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/task_handler_factory.py +15 -0
  139. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/msprobe.py +24 -7
  140. mindstudio_probe-1.1.1/msprobe/pytorch/__init__.py +24 -0
  141. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/common/config.py +132 -0
  142. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/common/utils.py +53 -21
  143. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +19 -2
  144. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +50 -25
  145. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/compare.py +51 -21
  146. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +23 -6
  147. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +28 -8
  148. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/config.yaml +1 -1
  149. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +9 -0
  150. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +454 -0
  151. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +365 -0
  152. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +73 -33
  153. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +44 -18
  154. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +32 -11
  155. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +122 -172
  156. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +224 -0
  157. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +30 -24
  158. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +68 -31
  159. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +27 -4
  160. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +115 -0
  161. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +26 -9
  162. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/torch_ops_config.yaml +63 -0
  163. mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +44 -0
  164. mindstudio_probe-1.1.1/msprobe/pytorch/bench_functions/__init__.py +30 -0
  165. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/apply_adam_w.py +15 -0
  166. mindstudio_probe-1.1.1/msprobe/pytorch/bench_functions/confusion_transpose.py +38 -0
  167. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/fast_gelu.py +15 -0
  168. mindstudio_probe-1.1.1/msprobe/pytorch/bench_functions/layer_norm_eval.py +21 -0
  169. mindstudio_probe-1.1.1/msprobe/pytorch/bench_functions/linear.py +27 -0
  170. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/matmul_backward.py +33 -6
  171. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/npu_fusion_attention.py +280 -157
  172. mindstudio_probe-1.1.1/msprobe/pytorch/bench_functions/rms_norm.py +30 -0
  173. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/rotary_mul.py +32 -9
  174. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/scaled_mask_softmax.py +15 -0
  175. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/bench_functions/swiglu.py +29 -6
  176. mindstudio_probe-1.1.1/msprobe/pytorch/common/__init__.py +17 -0
  177. mindstudio_probe-1.1.1/msprobe/pytorch/common/log.py +33 -0
  178. mindstudio_probe-1.1.1/msprobe/pytorch/common/parse_json.py +54 -0
  179. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/common/utils.py +96 -40
  180. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/compare/distributed_compare.py +13 -14
  181. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/compare/match.py +15 -0
  182. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/compare/pt_compare.py +44 -10
  183. mindstudio_probe-1.1.1/msprobe/pytorch/debugger/debugger_config.py +112 -0
  184. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/debugger/precision_debugger.py +72 -24
  185. mindstudio_probe-1.1.1/msprobe/pytorch/dump/kernel_dump/kernel_config.py +33 -0
  186. mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/__init__.py +23 -0
  187. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/common/constant.py +15 -0
  188. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/common/counter.py +15 -0
  189. mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/common/enums.py +80 -0
  190. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/common/params.py +23 -1
  191. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/common/utils.py +43 -5
  192. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/compare/grad_saver.py +47 -9
  193. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/compare/single_benchmark.py +17 -0
  194. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/main.py +19 -4
  195. mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +28 -0
  196. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +19 -4
  197. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +18 -1
  198. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +21 -4
  199. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +28 -2
  200. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +19 -0
  201. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +15 -0
  202. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +15 -0
  203. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +15 -0
  204. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +65 -16
  205. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +15 -0
  206. mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +40 -0
  207. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +15 -0
  208. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +19 -4
  209. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/function_factory.py +17 -2
  210. mindstudio_probe-1.1.1/msprobe/pytorch/functional/module_dump.py +84 -0
  211. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/grad_probe/grad_monitor.py +23 -6
  212. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/grad_probe/grad_stat_csv.py +40 -10
  213. mindstudio_probe-1.1.1/msprobe/pytorch/hook_module/__init__.py +16 -0
  214. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/api_registry.py +13 -8
  215. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/hook_module.py +17 -19
  216. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/support_wrap_ops.yaml +1 -0
  217. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/utils.py +4 -6
  218. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_aten.py +12 -11
  219. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_distributed.py +6 -7
  220. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_functional.py +21 -20
  221. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_npu_custom.py +9 -17
  222. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_tensor.py +4 -6
  223. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_torch.py +4 -6
  224. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/hook_module/wrap_vf.py +4 -6
  225. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/module_processer.py +18 -6
  226. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/anomaly_analyse.py +201 -0
  227. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/anomaly_detect.py +340 -0
  228. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/distributed/distributed_ops.yaml +19 -0
  229. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/distributed/stack_blacklist.yaml +5 -0
  230. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/distributed/wrap_distributed.py +272 -0
  231. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/features.py +108 -0
  232. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/module_hook.py +870 -0
  233. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/module_metric.py +193 -0
  234. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/module_spec_verifier.py +93 -0
  235. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/optimizer_collect.py +295 -0
  236. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/unittest/test_monitor.py +145 -0
  237. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/utils.py +250 -0
  238. mindstudio_probe-1.1.1/msprobe/pytorch/monitor/visualizer.py +59 -0
  239. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/__init__.py +2 -3
  240. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/compare.py +38 -48
  241. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/dispatch.py +50 -25
  242. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/dump_compare.py +21 -9
  243. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/single_compare.py +60 -39
  244. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/torch_ops_config.yaml +9 -1
  245. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/online_dispatch/utils.py +48 -23
  246. mindstudio_probe-1.1.1/msprobe/pytorch/parse.py +19 -0
  247. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/cli.py +5 -6
  248. mindstudio_probe-1.1.1/msprobe/pytorch/parse_tool/lib/__init__.py +0 -0
  249. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/compare.py +19 -26
  250. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/config.py +1 -1
  251. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/parse_tool.py +4 -2
  252. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/utils.py +40 -55
  253. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/visualization.py +3 -1
  254. mindstudio_probe-1.1.1/msprobe/pytorch/pt_config.py +340 -0
  255. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/service.py +110 -35
  256. mindstudio_probe-1.1.1/msprobe/visualization/__init__.py +14 -0
  257. mindstudio_probe-1.1.1/msprobe/visualization/builder/__init__.py +14 -0
  258. mindstudio_probe-1.1.1/msprobe/visualization/builder/graph_builder.py +165 -0
  259. mindstudio_probe-1.1.1/msprobe/visualization/builder/msprobe_adapter.py +205 -0
  260. mindstudio_probe-1.1.1/msprobe/visualization/compare/__init__.py +14 -0
  261. mindstudio_probe-1.1.1/msprobe/visualization/compare/graph_comparator.py +130 -0
  262. mindstudio_probe-1.1.1/msprobe/visualization/compare/mode_adapter.py +211 -0
  263. mindstudio_probe-1.1.1/msprobe/visualization/graph/__init__.py +14 -0
  264. mindstudio_probe-1.1.1/msprobe/visualization/graph/base_node.py +124 -0
  265. mindstudio_probe-1.1.1/msprobe/visualization/graph/graph.py +200 -0
  266. mindstudio_probe-1.1.1/msprobe/visualization/graph/node_colors.py +95 -0
  267. mindstudio_probe-1.1.1/msprobe/visualization/graph/node_op.py +39 -0
  268. mindstudio_probe-1.1.1/msprobe/visualization/graph_service.py +214 -0
  269. mindstudio_probe-1.1.1/msprobe/visualization/utils.py +232 -0
  270. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/setup.py +10 -7
  271. mindstudio-probe-1.0.4/msprobe/README.md +0 -101
  272. mindstudio-probe-1.0.4/msprobe/__init__.py +0 -1
  273. mindstudio-probe-1.0.4/msprobe/core/common/log.py +0 -76
  274. mindstudio-probe-1.0.4/msprobe/core/common/utils.py +0 -385
  275. mindstudio-probe-1.0.4/msprobe/core/common_config.py +0 -85
  276. mindstudio-probe-1.0.4/msprobe/core/compare/acc_compare.py +0 -300
  277. mindstudio-probe-1.0.4/msprobe/core/compare/check.py +0 -95
  278. mindstudio-probe-1.0.4/msprobe/core/compare/highlight.py +0 -223
  279. mindstudio-probe-1.0.4/msprobe/core/compare/utils.py +0 -430
  280. mindstudio-probe-1.0.4/msprobe/core/data_dump/json_writer.py +0 -96
  281. mindstudio-probe-1.0.4/msprobe/core/data_dump/scope.py +0 -178
  282. mindstudio-probe-1.0.4/msprobe/core/grad_probe/constant.py +0 -71
  283. mindstudio-probe-1.0.4/msprobe/docs/01.installation.md +0 -89
  284. mindstudio-probe-1.0.4/msprobe/docs/02.config_introduction.md +0 -165
  285. mindstudio-probe-1.0.4/msprobe/docs/04.acl_config_examples.md +0 -76
  286. mindstudio-probe-1.0.4/msprobe/docs/05.data_dump_PyTorch.md +0 -198
  287. mindstudio-probe-1.0.4/msprobe/docs/06.data_dump_MindSpore.md +0 -243
  288. mindstudio-probe-1.0.4/msprobe/docs/09.accuracy_checker_MindSpore.md +0 -68
  289. mindstudio-probe-1.0.4/msprobe/docs/10.accuracy_compare_PyTorch.md +0 -245
  290. mindstudio-probe-1.0.4/msprobe/docs/11.accuracy_compare_MindSpore.md +0 -202
  291. mindstudio-probe-1.0.4/msprobe/docs/13.overflow_check_MindSpore.md +0 -31
  292. mindstudio-probe-1.0.4/msprobe/docs/15.free_benchmarking_PyTorch.md +0 -164
  293. mindstudio-probe-1.0.4/msprobe/mindspore/__init__.py +0 -1
  294. mindstudio-probe-1.0.4/msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +0 -255
  295. mindstudio-probe-1.0.4/msprobe/mindspore/api_accuracy_checker/cmd_parser.py +0 -6
  296. mindstudio-probe-1.0.4/msprobe/mindspore/api_accuracy_checker/main.py +0 -9
  297. mindstudio-probe-1.0.4/msprobe/mindspore/cell_processor.py +0 -34
  298. mindstudio-probe-1.0.4/msprobe/mindspore/compare/ms_compare.py +0 -219
  299. mindstudio-probe-1.0.4/msprobe/mindspore/dump/jit_dump.py +0 -72
  300. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/api_pynative_self_check.py +0 -116
  301. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/common/config.py +0 -12
  302. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/common/handler_params.py +0 -17
  303. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/decorator/dec_forward.py +0 -43
  304. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +0 -107
  305. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/handler/handler_factory.py +0 -21
  306. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +0 -21
  307. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +0 -51
  308. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/perturbation/no_change.py +0 -12
  309. mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +0 -29
  310. mindstudio-probe-1.0.4/msprobe/mindspore/runtime.py +0 -4
  311. mindstudio-probe-1.0.4/msprobe/pytorch/__init__.py +0 -4
  312. mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/common/config.py +0 -53
  313. mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +0 -70
  314. mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +0 -10
  315. mindstudio-probe-1.0.4/msprobe/pytorch/bench_functions/__init__.py +0 -15
  316. mindstudio-probe-1.0.4/msprobe/pytorch/bench_functions/confusion_transpose.py +0 -19
  317. mindstudio-probe-1.0.4/msprobe/pytorch/bench_functions/layer_norm_eval.py +0 -6
  318. mindstudio-probe-1.0.4/msprobe/pytorch/bench_functions/linear.py +0 -12
  319. mindstudio-probe-1.0.4/msprobe/pytorch/bench_functions/rms_norm.py +0 -15
  320. mindstudio-probe-1.0.4/msprobe/pytorch/common/__init__.py +0 -2
  321. mindstudio-probe-1.0.4/msprobe/pytorch/common/log.py +0 -21
  322. mindstudio-probe-1.0.4/msprobe/pytorch/common/parse_json.py +0 -39
  323. mindstudio-probe-1.0.4/msprobe/pytorch/debugger/debugger_config.py +0 -95
  324. mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/__init__.py +0 -8
  325. mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/common/enums.py +0 -37
  326. mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +0 -13
  327. mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +0 -24
  328. mindstudio-probe-1.0.4/msprobe/pytorch/functional/dump_module.py +0 -39
  329. mindstudio-probe-1.0.4/msprobe/pytorch/hook_module/__init__.py +0 -1
  330. mindstudio-probe-1.0.4/msprobe/pytorch/parse.py +0 -4
  331. mindstudio-probe-1.0.4/msprobe/pytorch/pt_config.py +0 -188
  332. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/LICENSE +0 -0
  333. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/MANIFEST.in +0 -0
  334. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/dependency_links.txt +0 -0
  335. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/not-zip-safe +0 -0
  336. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/mindstudio_probe.egg-info/top_level.txt +0 -0
  337. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/__init__.py +0 -0
  338. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/core/grad_probe/__init__.py +0 -0
  339. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/14.data_parse_PyTorch.md +0 -0
  340. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +0 -0
  341. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/BLOOM-7B_1.png +0 -0
  342. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/BLOOM-7B_2.png +0 -0
  343. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/BLOOM-7B_3.png +0 -0
  344. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/BLOOM-7B_4.png +0 -0
  345. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_1.png +0 -0
  346. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_2.png +0 -0
  347. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_3.png +0 -0
  348. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_4.png +0 -0
  349. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_5.png +0 -0
  350. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_6.png +0 -0
  351. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_7.png +0 -0
  352. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/GPT-3_8.png +0 -0
  353. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/YOLOV5S_1.png +0 -0
  354. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/YOLOV5S_2.png +0 -0
  355. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/accuracy_checking_details.png +0 -0
  356. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/accuracy_checking_result.png +0 -0
  357. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/api_precision_compare_details.png +0 -0
  358. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/api_precision_compare_result.png +0 -0
  359. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/auto_analyze_log.png +0 -0
  360. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/compare_result_pkl.png +0 -0
  361. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/compare_result_pkl_md5.png.png +0 -0
  362. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/cpu_info.png +0 -0
  363. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/free_benchmark.png +0 -0
  364. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/free_benchmark_framework.png +0 -0
  365. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/grad_probe_image-1.png +0 -0
  366. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/grad_probe_image-2.png +0 -0
  367. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/grad_probe_image-3.png +0 -0
  368. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/grad_probe_image-4.png +0 -0
  369. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/grad_probe_image.png +0 -0
  370. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/docs/img/module_compare.png +0 -0
  371. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/api_accuracy_checker/__init__.py +0 -0
  372. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/compare/ms_to_pt_api.yaml +0 -0
  373. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/debugger/__init__.py +0 -0
  374. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/__init__.py +0 -0
  375. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/dump/hook_cell/hook_cell.py +0 -0
  376. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/__init__.py +0 -0
  377. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/mindspore/free_benchmark/common/__init__.py +0 -0
  378. {mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/decorator → mindstudio_probe-1.1.1/msprobe/mindspore/free_benchmark/handler}/__init__.py +0 -0
  379. {mindstudio-probe-1.0.4/msprobe/mindspore/free_benchmark/handler → mindstudio_probe-1.1.1/msprobe/mindspore/grad_probe}/__init__.py +0 -0
  380. {mindstudio-probe-1.0.4/msprobe/mindspore/grad_probe → mindstudio_probe-1.1.1/msprobe/mindspore/overflow_check}/__init__.py +0 -0
  381. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/.keep +0 -0
  382. {mindstudio-probe-1.0.4/msprobe/mindspore/overflow_check → mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker}/__init__.py +0 -0
  383. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/common/.keep +0 -0
  384. {mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker → mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/common}/__init__.py +0 -0
  385. {mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/common → mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/compare}/__init__.py +0 -0
  386. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +0 -0
  387. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +0 -0
  388. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/run_ut/.keep +0 -0
  389. {mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/compare → mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/run_ut}/__init__.py +0 -0
  390. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +0 -0
  391. {mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/run_ut → mindstudio_probe-1.1.1/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer}/__init__.py +0 -0
  392. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/common/compare_script.template +0 -0
  393. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/compare/mapping.yaml +0 -0
  394. {mindstudio-probe-1.0.4/msprobe/pytorch/api_accuracy_checker/tensor_transport_layer → mindstudio_probe-1.1.1/msprobe/pytorch/debugger}/__init__.py +0 -0
  395. {mindstudio-probe-1.0.4/msprobe/pytorch/debugger → mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/common}/__init__.py +0 -0
  396. {mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/common → mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/perturbed_layers}/__init__.py +0 -0
  397. {mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/perturbed_layers → mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/perturbed_layers/npu}/__init__.py +0 -0
  398. {mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/perturbed_layers/npu → mindstudio_probe-1.1.1/msprobe/pytorch/free_benchmark/result_handlers}/__init__.py +0 -0
  399. {mindstudio-probe-1.0.4/msprobe/pytorch/free_benchmark/result_handlers → mindstudio_probe-1.1.1/msprobe/pytorch/functional}/__init__.py +0 -0
  400. {mindstudio-probe-1.0.4/msprobe/pytorch/functional → mindstudio_probe-1.1.1/msprobe/pytorch/grad_probe}/__init__.py +0 -0
  401. {mindstudio-probe-1.0.4/msprobe/pytorch/grad_probe → mindstudio_probe-1.1.1/msprobe/pytorch/monitor}/__init__.py +0 -0
  402. {mindstudio-probe-1.0.4/msprobe/pytorch/parse_tool → mindstudio_probe-1.1.1/msprobe/pytorch/monitor/distributed}/__init__.py +0 -0
  403. {mindstudio-probe-1.0.4/msprobe/pytorch/parse_tool/lib → mindstudio_probe-1.1.1/msprobe/pytorch/monitor/unittest}/__init__.py +0 -0
  404. /mindstudio-probe-1.0.4/msprobe/pytorch/functional/data_processor.py → /mindstudio_probe-1.1.1/msprobe/pytorch/parse_tool/__init__.py +0 -0
  405. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/file_desc.py +0 -0
  406. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/interactive_cli.py +0 -0
  407. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/msprobe/pytorch/parse_tool/lib/parse_exception.py +0 -0
  408. {mindstudio-probe-1.0.4 → mindstudio_probe-1.1.1}/setup.cfg +0 -0
@@ -1,13 +1,12 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mindstudio-probe
3
- Version: 1.0.4
3
+ Version: 1.1.1
4
4
  Summary: Pytorch Ascend Probe Utils
5
5
  Home-page: https://gitee.com/ascend/mstt/tree/master/debug/accuracy_tools/msprobe
6
6
  Author: Ascend Team
7
7
  Author-email: pmail_mindstudio@huawei.com
8
8
  License: Apache License 2.0
9
9
  Keywords: pytorch msprobe ascend
10
- Platform: UNKNOWN
11
10
  Classifier: Intended Audience :: Developers
12
11
  Classifier: Intended Audience :: Education
13
12
  Classifier: Intended Audience :: Science/Research
@@ -20,6 +19,18 @@ Classifier: Topic :: Software Development :: Libraries
20
19
  Classifier: Topic :: Software Development :: Libraries :: Python Modules
21
20
  Requires-Python: >=3.6.2
22
21
  License-File: LICENSE
22
+ Requires-Dist: wheel
23
+ Requires-Dist: einops
24
+ Requires-Dist: numpy<2.0
25
+ Requires-Dist: pandas<2.1,>=1.3.5
26
+ Requires-Dist: pyyaml
27
+ Requires-Dist: rich
28
+ Requires-Dist: tqdm
29
+ Requires-Dist: openpyxl
30
+ Requires-Dist: pyopenssl
31
+ Requires-Dist: twisted
32
+ Requires-Dist: matplotlib
33
+ Requires-Dist: tensorboard
34
+ Requires-Dist: tabulate
23
35
 
24
36
  MindStudio-Probe is a set of tools for diagnosing and improving model accuracy on Ascend NPU, including API acc checker, ptdbg, grad tool etc.
25
-
@@ -1,13 +1,12 @@
1
1
  Metadata-Version: 2.1
2
2
  Name: mindstudio-probe
3
- Version: 1.0.4
3
+ Version: 1.1.1
4
4
  Summary: Pytorch Ascend Probe Utils
5
5
  Home-page: https://gitee.com/ascend/mstt/tree/master/debug/accuracy_tools/msprobe
6
6
  Author: Ascend Team
7
7
  Author-email: pmail_mindstudio@huawei.com
8
8
  License: Apache License 2.0
9
9
  Keywords: pytorch msprobe ascend
10
- Platform: UNKNOWN
11
10
  Classifier: Intended Audience :: Developers
12
11
  Classifier: Intended Audience :: Education
13
12
  Classifier: Intended Audience :: Science/Research
@@ -20,6 +19,18 @@ Classifier: Topic :: Software Development :: Libraries
20
19
  Classifier: Topic :: Software Development :: Libraries :: Python Modules
21
20
  Requires-Python: >=3.6.2
22
21
  License-File: LICENSE
22
+ Requires-Dist: wheel
23
+ Requires-Dist: einops
24
+ Requires-Dist: numpy<2.0
25
+ Requires-Dist: pandas<2.1,>=1.3.5
26
+ Requires-Dist: pyyaml
27
+ Requires-Dist: rich
28
+ Requires-Dist: tqdm
29
+ Requires-Dist: openpyxl
30
+ Requires-Dist: pyopenssl
31
+ Requires-Dist: twisted
32
+ Requires-Dist: matplotlib
33
+ Requires-Dist: tensorboard
34
+ Requires-Dist: tabulate
23
35
 
24
36
  MindStudio-Probe is a set of tools for diagnosing and improving model accuracy on Ascend NPU, including API acc checker, ptdbg, grad tool etc.
25
-
@@ -20,6 +20,8 @@ msprobe/core/advisor/advisor_result.py
20
20
  msprobe/core/common/const.py
21
21
  msprobe/core/common/exceptions.py
22
22
  msprobe/core/common/file_utils.py
23
+ msprobe/core/common/inplace_op_checker.py
24
+ msprobe/core/common/inplace_ops.yaml
23
25
  msprobe/core/common/log.py
24
26
  msprobe/core/common/utils.py
25
27
  msprobe/core/compare/acc_compare.py
@@ -29,6 +31,10 @@ msprobe/core/compare/highlight.py
29
31
  msprobe/core/compare/multiprocessing_compute.py
30
32
  msprobe/core/compare/npy_compare.py
31
33
  msprobe/core/compare/utils.py
34
+ msprobe/core/compare/layer_mapping/__init__.py
35
+ msprobe/core/compare/layer_mapping/data_scope_parser.py
36
+ msprobe/core/compare/layer_mapping/layer_mapping.py
37
+ msprobe/core/compare/layer_mapping/postprocess_pass.py
32
38
  msprobe/core/data_dump/data_collector.py
33
39
  msprobe/core/data_dump/json_writer.py
34
40
  msprobe/core/data_dump/scope.py
@@ -40,10 +46,17 @@ msprobe/core/grad_probe/__init__.py
40
46
  msprobe/core/grad_probe/constant.py
41
47
  msprobe/core/grad_probe/grad_compare.py
42
48
  msprobe/core/grad_probe/utils.py
49
+ msprobe/core/overflow_check/abnormal_scene.py
50
+ msprobe/core/overflow_check/api_info.py
51
+ msprobe/core/overflow_check/checker.py
52
+ msprobe/core/overflow_check/filter.py
53
+ msprobe/core/overflow_check/ignore_rules.yaml
54
+ msprobe/core/overflow_check/level.py
55
+ msprobe/core/overflow_check/utils.py
43
56
  msprobe/docs/01.installation.md
44
57
  msprobe/docs/02.config_introduction.md
45
58
  msprobe/docs/03.config_examples.md
46
- msprobe/docs/04.acl_config_examples.md
59
+ msprobe/docs/04.kernel_dump_PyTorch.md
47
60
  msprobe/docs/05.data_dump_PyTorch.md
48
61
  msprobe/docs/06.data_dump_MindSpore.md
49
62
  msprobe/docs/07.accuracy_checker_PyTorch.md
@@ -55,9 +68,17 @@ msprobe/docs/12.overflow_check_PyTorch.md
55
68
  msprobe/docs/13.overflow_check_MindSpore.md
56
69
  msprobe/docs/14.data_parse_PyTorch.md
57
70
  msprobe/docs/15.free_benchmarking_PyTorch.md
71
+ msprobe/docs/16.free_benchmarking_MindSpore.md
58
72
  msprobe/docs/17.grad_probe.md
59
- msprobe/docs/FAQ_PyTorch.md
73
+ msprobe/docs/18.online_dispatch.md
74
+ msprobe/docs/19.monitor.md
75
+ msprobe/docs/20.monitor_performance_baseline.md
76
+ msprobe/docs/21.visualization_PyTorch.md
77
+ msprobe/docs/22.visualization_MindSpore.md
78
+ msprobe/docs/23.tool_function_introduction.md
79
+ msprobe/docs/FAQ.md
60
80
  msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md
81
+ msprobe/docs/data_dump_Mindspore/dynamic_graph_quick_start_example.md
61
82
  msprobe/docs/img/BLOOM-7B_1.png
62
83
  msprobe/docs/img/BLOOM-7B_2.png
63
84
  msprobe/docs/img/BLOOM-7B_3.png
@@ -77,6 +98,7 @@ msprobe/docs/img/accuracy_checking_result.png
77
98
  msprobe/docs/img/api_precision_compare_details.png
78
99
  msprobe/docs/img/api_precision_compare_result.png
79
100
  msprobe/docs/img/auto_analyze_log.png
101
+ msprobe/docs/img/compare_result.png
80
102
  msprobe/docs/img/compare_result_pkl.png
81
103
  msprobe/docs/img/compare_result_pkl_md5.png.png
82
104
  msprobe/docs/img/cpu_info.png
@@ -88,6 +110,10 @@ msprobe/docs/img/grad_probe_image-3.png
88
110
  msprobe/docs/img/grad_probe_image-4.png
89
111
  msprobe/docs/img/grad_probe_image.png
90
112
  msprobe/docs/img/module_compare.png
113
+ msprobe/docs/img/ms_dump.png
114
+ msprobe/docs/img/ms_layer.png
115
+ msprobe/docs/img/pt_dump.png
116
+ msprobe/docs/img/monitor/cpu_info.png
91
117
  msprobe/mindspore/__init__.py
92
118
  msprobe/mindspore/cell_processor.py
93
119
  msprobe/mindspore/ms_config.py
@@ -99,9 +125,13 @@ msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py
99
125
  msprobe/mindspore/api_accuracy_checker/api_info.py
100
126
  msprobe/mindspore/api_accuracy_checker/api_runner.py
101
127
  msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py
128
+ msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml
102
129
  msprobe/mindspore/api_accuracy_checker/cmd_parser.py
103
130
  msprobe/mindspore/api_accuracy_checker/compute_element.py
131
+ msprobe/mindspore/api_accuracy_checker/data_manager.py
104
132
  msprobe/mindspore/api_accuracy_checker/main.py
133
+ msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py
134
+ msprobe/mindspore/api_accuracy_checker/multi_data_manager.py
105
135
  msprobe/mindspore/api_accuracy_checker/type_mapping.py
106
136
  msprobe/mindspore/api_accuracy_checker/utils.py
107
137
  msprobe/mindspore/common/const.py
@@ -121,8 +151,11 @@ msprobe/mindspore/dump/kernel_graph_dump.py
121
151
  msprobe/mindspore/dump/kernel_kbyk_dump.py
122
152
  msprobe/mindspore/dump/hook_cell/api_registry.py
123
153
  msprobe/mindspore/dump/hook_cell/hook_cell.py
154
+ msprobe/mindspore/dump/hook_cell/primitive_hooks.py
124
155
  msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml
125
156
  msprobe/mindspore/dump/hook_cell/wrap_api.py
157
+ msprobe/mindspore/dym_loader/hook_dynamic_loader.cc
158
+ msprobe/mindspore/dym_loader/hook_dynamic_loader.h
126
159
  msprobe/mindspore/free_benchmark/__init__.py
127
160
  msprobe/mindspore/free_benchmark/api_pynative_self_check.py
128
161
  msprobe/mindspore/free_benchmark/self_check_tool_factory.py
@@ -131,9 +164,6 @@ msprobe/mindspore/free_benchmark/common/config.py
131
164
  msprobe/mindspore/free_benchmark/common/handler_params.py
132
165
  msprobe/mindspore/free_benchmark/common/utils.py
133
166
  msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml
134
- msprobe/mindspore/free_benchmark/decorator/__init__.py
135
- msprobe/mindspore/free_benchmark/decorator/dec_forward.py
136
- msprobe/mindspore/free_benchmark/decorator/decorator_factory.py
137
167
  msprobe/mindspore/free_benchmark/handler/__init__.py
138
168
  msprobe/mindspore/free_benchmark/handler/base_handler.py
139
169
  msprobe/mindspore/free_benchmark/handler/check_handler.py
@@ -177,6 +207,9 @@ msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml
177
207
  msprobe/pytorch/api_accuracy_checker/compare/compare.py
178
208
  msprobe/pytorch/api_accuracy_checker/compare/compare_column.py
179
209
  msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py
210
+ msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json
211
+ msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py
212
+ msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template
180
213
  msprobe/pytorch/api_accuracy_checker/run_ut/.keep
181
214
  msprobe/pytorch/api_accuracy_checker/run_ut/__init__.py
182
215
  msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py
@@ -189,8 +222,10 @@ msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/__init__.py
189
222
  msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py
190
223
  msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py
191
224
  msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py
225
+ msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py
192
226
  msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py
193
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py
227
+ msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/torch_ops_config.yaml
228
+ msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py
194
229
  msprobe/pytorch/bench_functions/__init__.py
195
230
  msprobe/pytorch/bench_functions/apply_adam_w.py
196
231
  msprobe/pytorch/bench_functions/confusion_transpose.py
@@ -215,6 +250,7 @@ msprobe/pytorch/compare/pt_compare.py
215
250
  msprobe/pytorch/debugger/__init__.py
216
251
  msprobe/pytorch/debugger/debugger_config.py
217
252
  msprobe/pytorch/debugger/precision_debugger.py
253
+ msprobe/pytorch/dump/kernel_dump/kernel_config.py
218
254
  msprobe/pytorch/free_benchmark/__init__.py
219
255
  msprobe/pytorch/free_benchmark/main.py
220
256
  msprobe/pytorch/free_benchmark/common/__init__.py
@@ -243,8 +279,7 @@ msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py
243
279
  msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py
244
280
  msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py
245
281
  msprobe/pytorch/functional/__init__.py
246
- msprobe/pytorch/functional/data_processor.py
247
- msprobe/pytorch/functional/dump_module.py
282
+ msprobe/pytorch/functional/module_dump.py
248
283
  msprobe/pytorch/grad_probe/__init__.py
249
284
  msprobe/pytorch/grad_probe/grad_monitor.py
250
285
  msprobe/pytorch/grad_probe/grad_stat_csv.py
@@ -260,6 +295,22 @@ msprobe/pytorch/hook_module/wrap_npu_custom.py
260
295
  msprobe/pytorch/hook_module/wrap_tensor.py
261
296
  msprobe/pytorch/hook_module/wrap_torch.py
262
297
  msprobe/pytorch/hook_module/wrap_vf.py
298
+ msprobe/pytorch/monitor/__init__.py
299
+ msprobe/pytorch/monitor/anomaly_analyse.py
300
+ msprobe/pytorch/monitor/anomaly_detect.py
301
+ msprobe/pytorch/monitor/features.py
302
+ msprobe/pytorch/monitor/module_hook.py
303
+ msprobe/pytorch/monitor/module_metric.py
304
+ msprobe/pytorch/monitor/module_spec_verifier.py
305
+ msprobe/pytorch/monitor/optimizer_collect.py
306
+ msprobe/pytorch/monitor/utils.py
307
+ msprobe/pytorch/monitor/visualizer.py
308
+ msprobe/pytorch/monitor/distributed/__init__.py
309
+ msprobe/pytorch/monitor/distributed/distributed_ops.yaml
310
+ msprobe/pytorch/monitor/distributed/stack_blacklist.yaml
311
+ msprobe/pytorch/monitor/distributed/wrap_distributed.py
312
+ msprobe/pytorch/monitor/unittest/__init__.py
313
+ msprobe/pytorch/monitor/unittest/test_monitor.py
263
314
  msprobe/pytorch/online_dispatch/__init__.py
264
315
  msprobe/pytorch/online_dispatch/compare.py
265
316
  msprobe/pytorch/online_dispatch/dispatch.py
@@ -277,4 +328,18 @@ msprobe/pytorch/parse_tool/lib/interactive_cli.py
277
328
  msprobe/pytorch/parse_tool/lib/parse_exception.py
278
329
  msprobe/pytorch/parse_tool/lib/parse_tool.py
279
330
  msprobe/pytorch/parse_tool/lib/utils.py
280
- msprobe/pytorch/parse_tool/lib/visualization.py
331
+ msprobe/pytorch/parse_tool/lib/visualization.py
332
+ msprobe/visualization/__init__.py
333
+ msprobe/visualization/graph_service.py
334
+ msprobe/visualization/utils.py
335
+ msprobe/visualization/builder/__init__.py
336
+ msprobe/visualization/builder/graph_builder.py
337
+ msprobe/visualization/builder/msprobe_adapter.py
338
+ msprobe/visualization/compare/__init__.py
339
+ msprobe/visualization/compare/graph_comparator.py
340
+ msprobe/visualization/compare/mode_adapter.py
341
+ msprobe/visualization/graph/__init__.py
342
+ msprobe/visualization/graph/base_node.py
343
+ msprobe/visualization/graph/graph.py
344
+ msprobe/visualization/graph/node_colors.py
345
+ msprobe/visualization/graph/node_op.py
@@ -1,3 +1,2 @@
1
1
  [console_scripts]
2
2
  msprobe = msprobe.msprobe:main
3
-
@@ -9,3 +9,5 @@ openpyxl
9
9
  pyopenssl
10
10
  twisted
11
11
  matplotlib
12
+ tensorboard
13
+ tabulate
@@ -0,0 +1,167 @@
1
+ # 📖 msprobe 使用手册
2
+
3
+ ![version](https://img.shields.io/badge/version-1.1.1-blueviolet)
4
+ ![python](https://img.shields.io/badge/python-3.8|3.9|3.10-blue)
5
+ ![platform](https://img.shields.io/badge/platform-Linux-yellow)
6
+
7
+ **msprobe** 是 MindStudio Training Tools 工具链下精度调试部分的工具包。主要包括精度预检、溢出检测和精度比对等功能,目前适配 [PyTorch](https://pytorch.org/) 和 [MindSpore](https://www.mindspore.cn/) 框架。这些子工具侧重不同的训练场景,可以定位模型训练中的精度问题。
8
+
9
+ 为方便使用,本工具提供了统一、简易的程序接口:**PrecisionDebugger**。以 PyTorch 框架为例,通过以下示例模板和 **config.json** 可以轻松使用各种功能。
10
+
11
+ ```python
12
+ from msprobe.pytorch import PrecisionDebugger
13
+
14
+ debugger = PrecisionDebugger(config_path='./config.json')
15
+ ...
16
+ debugger.start() # 一般在训练循环开头启动工具
17
+ ... # 循环体
18
+ debugger.stop() # 一般在训练循环末尾结束工具
19
+ debugger.step() # 在训练循环的最后需要重置工具,非循环场景不需要
20
+ ```
21
+
22
+ 此外,根据以下规则,可以通过环境变量设置日志级别。
23
+ - MSPROBE_LOG_LEVEL=4,不打印任何日志;
24
+ - MSPROBE_LOG_LEVEL=3,仅打印 ERROR;
25
+ - MSPROBE_LOG_LEVEL=2,仅打印 WARNING、ERROR;
26
+ - MSPROBE_LOG_LEVEL=1,仅打印 INFO、WARNING、ERROR(默认配置);
27
+ - MSPROBE_LOG_LEVEL=0,打印 DEBUG、INFO、WARNING、ERROR。
28
+
29
+ 例如在 shell 脚本:
30
+
31
+ ```shell
32
+ export MSPROBE_LOG_LEVEL={x}
33
+ ```
34
+ **config.json** 的配置要求和各功能具体的使用指导详见后续章节。
35
+
36
+ ## 环境和依赖
37
+
38
+ - 硬件环境请参见《[昇腾产品形态说明](https://gitee.com/link?target=https%3A%2F%2Fwww.hiascend.com%2Fdocument%2Fdetail%2Fzh%2Fcanncommercial%2F80RC22%2Fquickstart%2Fquickstart%2Fquickstart_18_0002.html)》。
39
+ - 软件环境请参见《[CANN 软件安装指南](https://gitee.com/link?target=https%3A%2F%2Fwww.hiascend.com%2Fdocument%2Fdetail%2Fzh%2Fcanncommercial%2F80RC22%2Fsoftwareinst%2Finstg%2Finstg_0000.html%3FMode%3DPmIns%26OS%3DUbuntu%26Software%3DcannToolKit)》安装昇腾设备开发或运行环境,即toolkit软件包。
40
+
41
+ 以上环境依赖请根据实际环境选择适配的版本。
42
+
43
+ ## 版本配套说明
44
+
45
+ - msprobe支持AscendPyTorch 1.11.0或更高版本,支持的PyTorch和CANN以及PyTorch和python软件版本配套关系请参见《[Ascend Extension for PyTorch插件](https://gitee.com/ascend/pytorch)》。
46
+ - msprobe支持MindSpore 2.4.0或更高版本,支持的MindSpore和CANN以及MindSpore和python软件版本配套关系请参见《[MindSpore版本发布列表](https://www.mindspore.cn/versions)》。
47
+ - msprobe支持的固件驱动版本与配套CANN软件支持的固件驱动版本相同,开发者可通过“[昇腾社区-固件与驱动](https://gitee.com/link?target=https%3A%2F%2Fwww.hiascend.com%2Fhardware%2Ffirmware-drivers%2Fcommunity%3Fproduct%3D2%26model%3D28%26cann%3D8.0.RC3.alpha003%26driver%3D1.0.25.alpha)”页面根据产品型号与CANN软件版本获取配套的固件与驱动。
48
+
49
+
50
+ ## 🚨 工具限制与注意事项
51
+
52
+ **1. PyTorch 框架下,工具暂不支持 Fully Sharded Data Parallel(FSDP)。**
53
+
54
+ ## ⚙️ [安装](./docs/01.installation.md)
55
+
56
+ ## 🛠️ config.json [介绍](./docs/02.config_introduction.md) 和 [示例](./docs/03.config_examples.md)
57
+
58
+ ## 🧰 主要功能
59
+
60
+ ### 0 用前必看
61
+
62
+ 使用工具前,建议先浏览[**工具功能模块简介、适用场景和当前版本局限性**](./docs/23.tool_function_introduction.md),了解功能特性。
63
+
64
+ ### 1 数据采集
65
+
66
+ msprobe 通过在训练脚本中添加 PrecisionDebugger 接口的方式对 API 执行精度数据 dump 操作,对应 config.json 中的 task 为 statistics 或 tensor。
67
+
68
+ [PyTorch 场景的数据采集](./docs/05.data_dump_PyTorch.md)
69
+
70
+ [MindSpore 场景的数据采集](./docs/06.data_dump_MindSpore.md)
71
+
72
+ ### 2 精度预检
73
+
74
+ 精度预检旨在昇腾 NPU 上扫描训练模型中的所有 API 进行 API 复现,给出精度情况的诊断和分析。对应 config.json 中的 task 为 run_ut。
75
+
76
+ PyTorch 场景的[离线预检](./docs/07.accuracy_checker_PyTorch.md)和[在线预检](./docs/08.accuracy_checker_online_PyTorch.md)
77
+
78
+ MindSpore 动态图场景的[离线预检](./docs/09.accuracy_checker_MindSpore.md)
79
+
80
+ ### 3 精度比对
81
+
82
+ 该功能进行 PyTorch 整网 API 粒度的数据 dump、精度比对,进而定位训练场景下的精度问题。
83
+
84
+ [PyTorch 场景的精度比对](./docs/10.accuracy_compare_PyTorch.md)
85
+
86
+ [MindSpore 场景的精度比对](./docs/11.accuracy_compare_MindSpore.md)
87
+
88
+ ### 4 溢出检测与解析
89
+
90
+ 溢出检测与解析是在执行精度数据 dump 时,判断是否存在输入正常但输出存在溢出的 API,从而判断是否为正常溢出。对应 config.json 中的 task 为 overflow_check。
91
+
92
+ [PyTorch 场景的溢出检测与解析](./docs/12.overflow_check_PyTorch.md)
93
+
94
+ [MindSpore 场景的溢出检测与解析](./docs/13.overflow_check_MindSpore.md)
95
+
96
+ ### 5 数据解析
97
+
98
+ 该功能用于比对前后两次 NPU ACL 层级 dump 数据的一致性。
99
+
100
+ [PyTorch 场景的数据解析](./docs/14.data_parse_PyTorch.md)
101
+
102
+ ### 6 无标杆比对
103
+
104
+ [PyTorch 场景的无标杆比对](./docs/15.free_benchmarking_PyTorch.md)
105
+
106
+ [MindSpore 场景的无标杆比对](./docs/16.free_benchmarking_MindSpore.md)
107
+
108
+ ### 7 梯度状态监测
109
+
110
+ 本功能用于采集梯度数据并进行梯度相似度比对,可以精准定位出现问题的 step。
111
+
112
+ [兼容 PyTorch 和 MindSpore 框架的梯度监测](./docs/17.grad_probe.md)
113
+
114
+ ### 8 在线精度比对
115
+
116
+ 在线精度比对是实现在PyTorch训练过程中直接完成精度比对并输出比对结果的功能,是NPU与CPU之间的精度比对。
117
+
118
+ [PyTorch 场景的在线精度比对](./docs/18.online_dispatch.md)
119
+
120
+ ### 9 训练状态监控
121
+
122
+ 该功能收集和聚合模型训练过程中的网络层、优化器、通信算子的中间值,帮助诊断模型训练过程中计算、通信、优化器各部分出现的异常情况。
123
+
124
+ [PyTorch 场景的训练状态监控](./docs/19.monitor.md)
125
+
126
+ ### 10 分级可视化构图比对
127
+
128
+ 该功能将msprobe工具dump的精度数据进行解析,还原模型图结构,实现模型各个层级的精度数据比对,方便用户理解模型结构、分析精度问题。
129
+
130
+ [PyTorch 场景的分级可视化构图比对](./docs/21.visualization_PyTorch.md)
131
+
132
+ [MindSpore 场景的分级可视化构图比对](./docs/22.visualization_MindSpore.md)
133
+
134
+ ## 🌟 新版本特性
135
+
136
+ 若查看历史版本特性,请参见[安装](./docs/01.installation.md)。
137
+
138
+ 【数据采集】
139
+ - 支持 config.json 中的 step 传入范围;
140
+ - 优化了指定 step 的机制,指定 step 结束后工具不再采集数据,但训练会继续运行。工具结束运行后,日志提示信息如下:
141
+ ```bash
142
+ ****************************************
143
+ * msprobe ends successfully. *
144
+ ****************************************
145
+ ```
146
+ 注:在多卡场景,每张卡进程训练到指定 step 之后都会打印一次上述信息。
147
+
148
+ 【精度预检】
149
+ - 在 PyTorch 场景,支持部分 NPU 融合算子预检。
150
+
151
+ 【精度比对】
152
+ - 解决了使用 MindSpore 需要安装 PyTorch 的问题。
153
+
154
+ 【无标杆比对】
155
+ - 补充在 PyTorch 场景的性能基线报告;
156
+ - 支持 MindSpore 场景的 change_value 扰动模式。
157
+
158
+ ## 📑 补充材料
159
+
160
+ [无标杆比对功能在 PyTorch 场景的性能基线报告](./docs/S02.report_free_benchmarking_validation_performance_baseline.md)
161
+
162
+ ## ❗ 免责声明
163
+ 本工具建议执行用户与安装用户保持一致,如果您要使用 root 执行,请自行关注 root 高权限触及的安全风险。
164
+
165
+ ## ❓ FAQ
166
+
167
+ [FAQ for PyTorch](./docs/FAQ.md)
@@ -0,0 +1,16 @@
1
+ # Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
2
+ # All rights reserved.
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
5
+ # you may not use this file except in compliance with the License.
6
+ # You may obtain a copy of the License at
7
+ #
8
+ # http://www.apache.org/licenses/LICENSE-2.0
9
+ #
10
+ # Unless required by applicable law or agreed to in writing, software
11
+ # distributed under the License is distributed on an "AS IS" BASIS,
12
+ # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
13
+ # See the License for the specific language governing permissions and
14
+ # limitations under the License.
15
+
16
+ from msprobe.core.grad_probe.grad_compare import GradComparator
@@ -4,15 +4,11 @@
4
4
  "rank": [],
5
5
  "step": [],
6
6
  "level": "L1",
7
- "seed": 1234,
8
- "is_deterministic": false,
9
7
  "enable_dataloader": false,
10
- "acl_config": "",
11
8
  "tensor": {
12
9
  "scope": [],
13
10
  "list":[],
14
- "data_mode": ["all"],
15
- "backward_input": [],
11
+ "data_mode": ["all"],
16
12
  "file_format": "npy"
17
13
  },
18
14
  "statistics": {
@@ -1,8 +1,7 @@
1
- #!/usr/bin/env python3
2
- # -*- coding: utf-8 -*-
3
- """
4
- # Copyright (C) 2022-2024. Huawei Technologies Co., Ltd. All rights reserved.
5
- # Licensed under the Apache License, Version 2.0 (the "License");
1
+ # Copyright (c) 2022-2024, Huawei Technologies Co., Ltd.
2
+ # All rights reserved.
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
5
  # you may not use this file except in compliance with the License.
7
6
  # You may obtain a copy of the License at
8
7
  #
@@ -13,7 +12,6 @@
13
12
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
13
  # See the License for the specific language governing permissions and
15
14
  # limitations under the License.
16
- """
17
15
 
18
16
  import os
19
17
 
@@ -24,15 +22,17 @@ from msprobe.core.common.utils import CompareException
24
22
  from msprobe.core.common.file_utils import FileChecker
25
23
  from msprobe.core.common.const import Const, CompareConst, FileCheckConst
26
24
 
25
+
27
26
  class Advisor:
28
27
  """
29
28
  Class for generate advisor
30
29
  """
31
30
 
32
- def __init__(self, input_data, out_path=""):
31
+ def __init__(self, input_data, out_path="", suffix=""):
33
32
  self.input_data = input_data
34
33
  self.out_path = os.path.realpath(out_path)
35
34
  self.file_type = None
35
+ self.suffix = suffix
36
36
 
37
37
  @staticmethod
38
38
  def deterministic_advisor(message, node_name):
@@ -62,7 +62,12 @@ class Advisor:
62
62
  .format(item[CompareConst.NPU_NAME]))
63
63
 
64
64
  def gen_advisor_result(self, pd_data):
65
- first_failing_data = pd_data.iloc[0]
65
+ try:
66
+ first_failing_data = pd_data.iloc[0]
67
+ except IndexError as e:
68
+ err_msg = "index out of bounds error occurs, pd_data is empty, please check!"
69
+ logger.error(err_msg)
70
+ raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR) from e
66
71
  node_name = first_failing_data[CompareConst.NPU_NAME]
67
72
  index = first_failing_data['index']
68
73
  message = self.gen_advisor_message(node_name)
@@ -87,7 +92,7 @@ class Advisor:
87
92
  return message
88
93
 
89
94
  def analysis(self):
90
- self._check_path_vaild()
95
+ self._check_path_valid()
91
96
  analyze_data = self._parse_input_data()
92
97
  logger.info("Start analyzing the comparison result: %s" % self.file_type)
93
98
  self.analyze_unmatched(analyze_data)
@@ -103,7 +108,7 @@ class Advisor:
103
108
  else:
104
109
  result = self.gen_advisor_result(failing_data)
105
110
  message_list = result.print_advisor_log()
106
- result.gen_summary_file(self.out_path, message_list)
111
+ result.gen_summary_file(self.out_path, message_list, suffix=self.suffix)
107
112
 
108
113
  def _parse_input_data(self):
109
114
  data_columns = self.input_data.columns.values
@@ -119,6 +124,6 @@ class Advisor:
119
124
  df = self.input_data.reset_index()
120
125
  return df
121
126
 
122
- def _check_path_vaild(self):
127
+ def _check_path_valid(self):
123
128
  out_path_checker = FileChecker(self.out_path, FileCheckConst.DIR, FileCheckConst.WRITE_ABLE)
124
129
  out_path_checker.common_check()
@@ -1,8 +1,7 @@
1
- #!/usr/bin/env python3
2
- # -*- coding: utf-8 -*-
3
- """
4
- # Copyright (C) 2022-2024. Huawei Technologies Co., Ltd. All rights reserved.
5
- # Licensed under the Apache License, Version 2.0 (the "License");
1
+ # Copyright (c) 2022-2024, Huawei Technologies Co., Ltd.
2
+ # All rights reserved.
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
5
  # you may not use this file except in compliance with the License.
7
6
  # You may obtain a copy of the License at
8
7
  #
@@ -13,7 +12,6 @@
13
12
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
13
  # See the License for the specific language governing permissions and
15
14
  # limitations under the License.
16
- """
17
15
 
18
16
 
19
17
  class AdvisorConst:
@@ -35,7 +33,8 @@ class AdvisorConst:
35
33
  # advisor message
36
34
  NO_ERR_SUGGEST = "All data in comparison result meets the accuracy requirements."
37
35
  FORWARD_INPUT_SUGGEST = "1. Analyze the model to view the input source.\n" \
38
- "2. Check whether an inplace API causes the output result to overwrite the input result. That is, the fault is actually caused by a computation error.\n" \
36
+ "2. Check whether an inplace API causes the output result to overwrite the input result. "\
37
+ "That is, the fault is actually caused by a computation error.\n" \
39
38
  "3. The fault may be caused by memory corruption and further analysis is required."
40
39
  FORWARD_OUTPUT_SUGGEST = "This is a forward API computation error. Check the computation implementation."
41
40
  BACKWARD_INPUT_SUGGEST = "Check whether the forward computation result is affected."
@@ -1,8 +1,7 @@
1
- #!/usr/bin/env python3
2
- # -*- coding: utf-8 -*-
3
- """
4
- # Copyright (C) 2022-2024. Huawei Technologies Co., Ltd. All rights reserved.
5
- # Licensed under the Apache License, Version 2.0 (the "License");
1
+ # Copyright (c) 2022-2024, Huawei Technologies Co., Ltd.
2
+ # All rights reserved.
3
+ #
4
+ # Licensed under the Apache License, Version 2.0 (the "License");
6
5
  # you may not use this file except in compliance with the License.
7
6
  # You may obtain a copy of the License at
8
7
  #
@@ -13,13 +12,12 @@
13
12
  # WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
14
13
  # See the License for the specific language governing permissions and
15
14
  # limitations under the License.
16
- """
17
15
  import os
18
16
  import time
19
17
 
20
18
  from msprobe.core.advisor.advisor_const import AdvisorConst
21
19
  from msprobe.core.common.log import logger
22
- from msprobe.core.common.const import Const, FileCheckConst
20
+ from msprobe.core.common.const import FileCheckConst
23
21
  from msprobe.core.common.file_utils import change_mode, FileOpen
24
22
 
25
23
 
@@ -34,8 +32,8 @@ class AdvisorResult:
34
32
  self.advisor_message = message
35
33
 
36
34
  @staticmethod
37
- def gen_summary_file(out_path, message_list):
38
- file_name = 'advisor_{}.txt'.format(time.strftime("%Y%m%d%H%M%S", time.localtime(time.time())))
35
+ def gen_summary_file(out_path, message_list, suffix):
36
+ file_name = 'advisor{}_{}.txt'.format(suffix, time.strftime("%Y%m%d%H%M%S", time.localtime(time.time())))
39
37
  result_file = os.path.join(out_path, file_name)
40
38
  try:
41
39
  with FileOpen(result_file, 'w+') as output_file:
@@ -50,9 +48,11 @@ class AdvisorResult:
50
48
 
51
49
  def print_advisor_log(self):
52
50
  logger.info("The summary of the expert advice is as follows: ")
53
- message_list = [AdvisorConst.LINE + AdvisorConst.COLON + str(self.line),
54
- AdvisorConst.SUSPECT_NODES + AdvisorConst.COLON + self.suspect_node,
55
- AdvisorConst.ADVISOR_SUGGEST + AdvisorConst.COLON + self.advisor_message]
51
+ message_list = [
52
+ AdvisorConst.LINE + AdvisorConst.COLON + str(self.line),
53
+ AdvisorConst.SUSPECT_NODES + AdvisorConst.COLON + self.suspect_node,
54
+ AdvisorConst.ADVISOR_SUGGEST + AdvisorConst.COLON + self.advisor_message
55
+ ]
56
56
  for message in message_list:
57
57
  logger.info(message)
58
58
  return message_list