mindstudio-probe 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
Files changed (249) hide show
  1. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/METADATA +5 -1
  2. mindstudio_probe-1.0.3.dist-info/RECORD +272 -0
  3. msprobe/README.md +78 -23
  4. msprobe/__init__.py +1 -0
  5. msprobe/config/README.md +182 -40
  6. msprobe/config/config.json +22 -0
  7. msprobe/core/__init__.py +0 -0
  8. msprobe/{pytorch → core}/advisor/advisor.py +3 -3
  9. msprobe/{pytorch → core}/advisor/advisor_result.py +2 -2
  10. msprobe/core/common/const.py +82 -5
  11. msprobe/core/common/exceptions.py +30 -18
  12. msprobe/core/common/file_check.py +19 -1
  13. msprobe/core/common/log.py +15 -1
  14. msprobe/core/common/utils.py +130 -30
  15. msprobe/core/common_config.py +32 -19
  16. msprobe/core/compare/acc_compare.py +299 -0
  17. msprobe/core/compare/check.py +95 -0
  18. msprobe/core/compare/compare_cli.py +49 -0
  19. msprobe/core/compare/highlight.py +222 -0
  20. msprobe/core/compare/multiprocessing_compute.py +149 -0
  21. msprobe/{pytorch → core}/compare/npy_compare.py +55 -4
  22. msprobe/core/compare/utils.py +429 -0
  23. msprobe/core/data_dump/data_collector.py +39 -35
  24. msprobe/core/data_dump/data_processor/base.py +85 -37
  25. msprobe/core/data_dump/data_processor/factory.py +5 -7
  26. msprobe/core/data_dump/data_processor/mindspore_processor.py +198 -0
  27. msprobe/core/data_dump/data_processor/pytorch_processor.py +94 -51
  28. msprobe/core/data_dump/json_writer.py +11 -11
  29. msprobe/core/grad_probe/__init__.py +0 -0
  30. msprobe/core/grad_probe/constant.py +71 -0
  31. msprobe/core/grad_probe/grad_compare.py +175 -0
  32. msprobe/core/grad_probe/utils.py +52 -0
  33. msprobe/doc/grad_probe/grad_probe.md +207 -0
  34. msprobe/doc/grad_probe/img/image-1.png +0 -0
  35. msprobe/doc/grad_probe/img/image-2.png +0 -0
  36. msprobe/doc/grad_probe/img/image-3.png +0 -0
  37. msprobe/doc/grad_probe/img/image-4.png +0 -0
  38. msprobe/doc/grad_probe/img/image.png +0 -0
  39. msprobe/mindspore/api_accuracy_checker/__init__.py +0 -0
  40. msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +246 -0
  41. msprobe/mindspore/api_accuracy_checker/api_info.py +69 -0
  42. msprobe/mindspore/api_accuracy_checker/api_runner.py +152 -0
  43. msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +197 -0
  44. msprobe/mindspore/api_accuracy_checker/compute_element.py +224 -0
  45. msprobe/mindspore/api_accuracy_checker/main.py +16 -0
  46. msprobe/mindspore/api_accuracy_checker/type_mapping.py +114 -0
  47. msprobe/mindspore/api_accuracy_checker/utils.py +63 -0
  48. msprobe/mindspore/cell_processor.py +34 -0
  49. msprobe/mindspore/common/const.py +87 -0
  50. msprobe/mindspore/common/log.py +38 -0
  51. msprobe/mindspore/common/utils.py +57 -0
  52. msprobe/mindspore/compare/distributed_compare.py +75 -0
  53. msprobe/mindspore/compare/ms_compare.py +117 -0
  54. msprobe/mindspore/compare/ms_graph_compare.py +317 -0
  55. msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -0
  56. msprobe/mindspore/debugger/debugger_config.py +38 -15
  57. msprobe/mindspore/debugger/precision_debugger.py +79 -4
  58. msprobe/mindspore/doc/compare.md +58 -0
  59. msprobe/mindspore/doc/dump.md +158 -6
  60. msprobe/mindspore/dump/dump_tool_factory.py +19 -22
  61. msprobe/mindspore/dump/hook_cell/api_registry.py +104 -0
  62. msprobe/mindspore/dump/hook_cell/hook_cell.py +53 -0
  63. msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +925 -0
  64. msprobe/mindspore/dump/hook_cell/wrap_functional.py +91 -0
  65. msprobe/mindspore/dump/hook_cell/wrap_tensor.py +63 -0
  66. msprobe/mindspore/dump/jit_dump.py +56 -0
  67. msprobe/mindspore/dump/kernel_kbyk_dump.py +65 -0
  68. msprobe/mindspore/free_benchmark/__init__.py +0 -0
  69. msprobe/mindspore/free_benchmark/api_pynative_self_check.py +116 -0
  70. msprobe/mindspore/free_benchmark/common/__init__.py +0 -0
  71. msprobe/mindspore/free_benchmark/common/config.py +12 -0
  72. msprobe/mindspore/free_benchmark/common/handler_params.py +17 -0
  73. msprobe/mindspore/free_benchmark/common/utils.py +71 -0
  74. msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -0
  75. msprobe/mindspore/free_benchmark/decorator/__init__.py +0 -0
  76. msprobe/mindspore/free_benchmark/decorator/dec_forward.py +42 -0
  77. msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +107 -0
  78. msprobe/mindspore/free_benchmark/handler/__init__.py +0 -0
  79. msprobe/mindspore/free_benchmark/handler/base_handler.py +90 -0
  80. msprobe/mindspore/free_benchmark/handler/check_handler.py +41 -0
  81. msprobe/mindspore/free_benchmark/handler/fix_handler.py +36 -0
  82. msprobe/mindspore/free_benchmark/handler/handler_factory.py +21 -0
  83. msprobe/mindspore/free_benchmark/perturbation/add_noise.py +67 -0
  84. msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +21 -0
  85. msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +63 -0
  86. msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +34 -0
  87. msprobe/mindspore/free_benchmark/perturbation/no_change.py +12 -0
  88. msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +27 -0
  89. msprobe/mindspore/free_benchmark/self_check_tool_factory.py +33 -0
  90. msprobe/mindspore/grad_probe/__init__.py +0 -0
  91. msprobe/mindspore/grad_probe/global_context.py +91 -0
  92. msprobe/mindspore/grad_probe/grad_analyzer.py +231 -0
  93. msprobe/mindspore/grad_probe/grad_monitor.py +27 -0
  94. msprobe/mindspore/grad_probe/grad_stat_csv.py +132 -0
  95. msprobe/mindspore/grad_probe/hook.py +92 -0
  96. msprobe/mindspore/grad_probe/utils.py +29 -0
  97. msprobe/mindspore/ms_config.py +63 -15
  98. msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +17 -15
  99. msprobe/mindspore/runtime.py +4 -0
  100. msprobe/mindspore/service.py +354 -0
  101. msprobe/mindspore/task_handler_factory.py +7 -4
  102. msprobe/msprobe.py +66 -26
  103. msprobe/pytorch/__init__.py +1 -1
  104. msprobe/pytorch/api_accuracy_checker/common/config.py +21 -16
  105. msprobe/pytorch/api_accuracy_checker/common/utils.py +1 -60
  106. msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +2 -5
  107. msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +46 -10
  108. msprobe/pytorch/api_accuracy_checker/compare/compare.py +84 -48
  109. msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +8 -12
  110. msprobe/pytorch/api_accuracy_checker/config.yaml +7 -1
  111. msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +15 -11
  112. msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +11 -15
  113. msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +16 -9
  114. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +193 -105
  115. msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +68 -1
  116. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/__init__.py +0 -0
  117. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +202 -0
  118. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +324 -0
  119. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +204 -0
  120. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +218 -0
  121. msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +10 -0
  122. msprobe/pytorch/bench_functions/__init__.py +15 -0
  123. msprobe/pytorch/bench_functions/apply_adam_w.py +28 -0
  124. msprobe/pytorch/bench_functions/confusion_transpose.py +19 -0
  125. msprobe/pytorch/bench_functions/fast_gelu.py +55 -0
  126. msprobe/pytorch/bench_functions/layer_norm_eval.py +6 -0
  127. msprobe/pytorch/bench_functions/linear.py +12 -0
  128. msprobe/pytorch/bench_functions/matmul_backward.py +48 -0
  129. msprobe/pytorch/bench_functions/npu_fusion_attention.py +421 -0
  130. msprobe/pytorch/bench_functions/rms_norm.py +15 -0
  131. msprobe/pytorch/bench_functions/rotary_mul.py +52 -0
  132. msprobe/pytorch/bench_functions/scaled_mask_softmax.py +26 -0
  133. msprobe/pytorch/bench_functions/swiglu.py +55 -0
  134. msprobe/pytorch/common/parse_json.py +3 -1
  135. msprobe/pytorch/common/utils.py +83 -7
  136. msprobe/pytorch/compare/distributed_compare.py +19 -64
  137. msprobe/pytorch/compare/match.py +3 -6
  138. msprobe/pytorch/compare/pt_compare.py +40 -0
  139. msprobe/pytorch/debugger/debugger_config.py +11 -2
  140. msprobe/pytorch/debugger/precision_debugger.py +34 -4
  141. msprobe/pytorch/doc/api_accuracy_checker.md +57 -13
  142. msprobe/pytorch/doc/api_accuracy_checker_online.md +187 -0
  143. msprobe/pytorch/doc/dump.md +73 -20
  144. msprobe/pytorch/doc/ptdbg_ascend_compare.md +75 -11
  145. msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +3 -3
  146. msprobe/pytorch/doc/run_overflow_check.md +1 -1
  147. msprobe/pytorch/doc//321/206/320/247/320/260/321/206/320/260/320/227/321/206/320/255/320/226/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/205/320/254/342/225/221/321/206/320/251/320/277/321/211/320/272/320/234/321/210/320/277/320/221/321/205/320/242/320/234/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +151 -0
  148. msprobe/pytorch/free_benchmark/common/constant.py +3 -0
  149. msprobe/pytorch/free_benchmark/common/utils.py +4 -0
  150. msprobe/pytorch/free_benchmark/compare/grad_saver.py +22 -26
  151. msprobe/pytorch/free_benchmark/main.py +7 -4
  152. msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +1 -1
  153. msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +1 -1
  154. msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +1 -1
  155. msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +3 -3
  156. msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +1 -1
  157. msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +1 -1
  158. msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +43 -29
  159. msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +0 -1
  160. msprobe/pytorch/function_factory.py +75 -0
  161. msprobe/pytorch/functional/dump_module.py +4 -4
  162. msprobe/pytorch/grad_probe/__init__.py +0 -0
  163. msprobe/pytorch/grad_probe/grad_monitor.py +90 -0
  164. msprobe/pytorch/grad_probe/grad_stat_csv.py +129 -0
  165. msprobe/pytorch/hook_module/hook_module.py +14 -3
  166. msprobe/pytorch/hook_module/support_wrap_ops.yaml +2 -1
  167. msprobe/pytorch/hook_module/utils.py +9 -9
  168. msprobe/pytorch/hook_module/wrap_aten.py +20 -10
  169. msprobe/pytorch/hook_module/wrap_distributed.py +10 -7
  170. msprobe/pytorch/hook_module/wrap_functional.py +4 -7
  171. msprobe/pytorch/hook_module/wrap_npu_custom.py +21 -10
  172. msprobe/pytorch/hook_module/wrap_tensor.py +5 -6
  173. msprobe/pytorch/hook_module/wrap_torch.py +5 -7
  174. msprobe/pytorch/hook_module/wrap_vf.py +6 -8
  175. msprobe/pytorch/module_processer.py +53 -13
  176. msprobe/pytorch/online_dispatch/compare.py +4 -4
  177. msprobe/pytorch/online_dispatch/dispatch.py +39 -41
  178. msprobe/pytorch/online_dispatch/dump_compare.py +17 -47
  179. msprobe/pytorch/online_dispatch/single_compare.py +5 -5
  180. msprobe/pytorch/online_dispatch/utils.py +2 -43
  181. msprobe/pytorch/parse_tool/lib/compare.py +31 -19
  182. msprobe/pytorch/parse_tool/lib/config.py +2 -1
  183. msprobe/pytorch/parse_tool/lib/parse_tool.py +4 -4
  184. msprobe/pytorch/parse_tool/lib/utils.py +34 -80
  185. msprobe/pytorch/parse_tool/lib/visualization.py +4 -3
  186. msprobe/pytorch/pt_config.py +100 -6
  187. msprobe/pytorch/service.py +104 -19
  188. mindstudio_probe-1.0.1.dist-info/RECORD +0 -228
  189. msprobe/mindspore/dump/api_kbk_dump.py +0 -55
  190. msprobe/pytorch/compare/acc_compare.py +0 -1024
  191. msprobe/pytorch/compare/highlight.py +0 -100
  192. msprobe/test/core_ut/common/test_utils.py +0 -345
  193. msprobe/test/core_ut/data_dump/test_data_collector.py +0 -47
  194. msprobe/test/core_ut/data_dump/test_json_writer.py +0 -183
  195. msprobe/test/core_ut/data_dump/test_scope.py +0 -151
  196. msprobe/test/core_ut/test_common_config.py +0 -152
  197. msprobe/test/core_ut/test_file_check.py +0 -218
  198. msprobe/test/core_ut/test_log.py +0 -109
  199. msprobe/test/mindspore_ut/test_api_kbk_dump.py +0 -51
  200. msprobe/test/mindspore_ut/test_debugger_config.py +0 -42
  201. msprobe/test/mindspore_ut/test_dump_tool_factory.py +0 -51
  202. msprobe/test/mindspore_ut/test_kernel_graph_dump.py +0 -66
  203. msprobe/test/mindspore_ut/test_kernel_graph_overflow_check.py +0 -63
  204. msprobe/test/mindspore_ut/test_ms_config.py +0 -69
  205. msprobe/test/mindspore_ut/test_overflow_check_tool_factory.py +0 -51
  206. msprobe/test/mindspore_ut/test_precision_debugger.py +0 -56
  207. msprobe/test/mindspore_ut/test_task_handler_factory.py +0 -58
  208. msprobe/test/pytorch_ut/advisor/test_advisor.py +0 -83
  209. msprobe/test/pytorch_ut/api_accuracy_checker/common/test_common_utils.py +0 -108
  210. msprobe/test/pytorch_ut/api_accuracy_checker/common/test_config.py +0 -39
  211. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_algorithm.py +0 -112
  212. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_api_precision_compare.py +0 -77
  213. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare.py +0 -125
  214. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_column.py +0 -10
  215. msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_utils.py +0 -43
  216. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/dump.json +0 -179
  217. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/forward.json +0 -63
  218. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_data_generate.py +0 -99
  219. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_multi_run_ut.py +0 -115
  220. msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_run_ut.py +0 -72
  221. msprobe/test/pytorch_ut/compare/test_acc_compare.py +0 -17
  222. msprobe/test/pytorch_ut/free_benchmark/perturbed_layers/test_perturbed_layser.py +0 -105
  223. msprobe/test/pytorch_ut/free_benchmark/result_handlers/test_result_handler.py +0 -121
  224. msprobe/test/pytorch_ut/free_benchmark/test_main.py +0 -101
  225. msprobe/test/pytorch_ut/functional/test_dump_module.py +0 -15
  226. msprobe/test/pytorch_ut/hook_module/test_api_registry.py +0 -130
  227. msprobe/test/pytorch_ut/hook_module/test_hook_module.py +0 -42
  228. msprobe/test/pytorch_ut/hook_module/test_wrap_aten.py +0 -65
  229. msprobe/test/pytorch_ut/hook_module/test_wrap_distributed.py +0 -35
  230. msprobe/test/pytorch_ut/hook_module/test_wrap_functional.py +0 -20
  231. msprobe/test/pytorch_ut/hook_module/test_wrap_tensor.py +0 -35
  232. msprobe/test/pytorch_ut/hook_module/test_wrap_torch.py +0 -43
  233. msprobe/test/pytorch_ut/hook_module/test_wrap_vf.py +0 -11
  234. msprobe/test/pytorch_ut/test_pt_config.py +0 -69
  235. msprobe/test/pytorch_ut/test_service.py +0 -59
  236. msprobe/test/resources/advisor.txt +0 -3
  237. msprobe/test/resources/compare_result_20230703104808.csv +0 -9
  238. msprobe/test/resources/compare_result_without_accuracy.csv +0 -9
  239. msprobe/test/resources/config.yaml +0 -3
  240. msprobe/test/resources/npu_test.pkl +0 -8
  241. msprobe/test/run_test.sh +0 -30
  242. msprobe/test/run_ut.py +0 -58
  243. msprobe/test/test_module_processer.py +0 -64
  244. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/LICENSE +0 -0
  245. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/WHEEL +0 -0
  246. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/entry_points.txt +0 -0
  247. {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/top_level.txt +0 -0
  248. /msprobe/{pytorch → core}/advisor/advisor_const.py +0 -0
  249. /msprobe/pytorch/doc/{atat → msprobe}/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md" +0 -0
File without changes
@@ -0,0 +1,42 @@
1
+ from msprobe.mindspore.free_benchmark.common.config import Config
2
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
3
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
4
+ from msprobe.mindspore.free_benchmark.handler.handler_factory import HandlerFactory
5
+ from msprobe.mindspore.free_benchmark.perturbation.perturbation_factory import PerturbationFactory
6
+
7
+
8
+ class ForwardSelfChecker:
9
+
10
+ def __init__(self, api_name: str):
11
+ self.api_name = api_name
12
+
13
+ def handle(self, params: HandlerParams):
14
+ """
15
+ 装饰器实际执行逻辑
16
+
17
+ """
18
+ perturbation = PerturbationFactory.create(self.api_name)
19
+ params.fuzzed_result = perturbation.handle(params)
20
+ params.original_result = params.original_func(*params.args, **params.kwargs)
21
+ if params.fuzzed_result is not False:
22
+ return self.deal_fuzzed_and_original_result(params)
23
+ return params.original_result
24
+
25
+ def get_compare_data(self, params: HandlerParams):
26
+ if self.api_name not in FreeBenchmarkConst.COMMUNICATION_API_LIST:
27
+ return
28
+ # 以下为通讯类api处理逻辑
29
+ params.fuzzed_result = params.fuzzed_value
30
+ if Config.pert_type == FreeBenchmarkConst.IMPROVE_PRECISION:
31
+ params.original_result = params.args
32
+ else:
33
+ params.original_result = params.args[params.index]
34
+
35
+ def deal_fuzzed_and_original_result(self, params: HandlerParams):
36
+ original_result = params.original_result
37
+ self.get_compare_data(params)
38
+ handler = HandlerFactory.create(self.api_name)
39
+ result = handler.handle(params)
40
+ if self.api_name in FreeBenchmarkConst.COMMUNICATION_API_LIST:
41
+ result = original_result
42
+ return result
@@ -0,0 +1,107 @@
1
+ import os
2
+ import sys
3
+ import traceback
4
+ from functools import wraps
5
+ from typing import Tuple, Dict, List
6
+
7
+ from mindspore import ops
8
+
9
+ from msprobe.mindspore.runtime import Runtime
10
+ from msprobe.mindspore.common.log import logger
11
+ from msprobe.mindspore.free_benchmark.common.config import Config
12
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
13
+ from .dec_forward import ForwardSelfChecker
14
+
15
+
16
+ def decorate(original_func, decorate_func, api_name=None):
17
+ """
18
+ 总装饰器
19
+ """
20
+ @wraps(original_func)
21
+ def fuzz_wrapper(*args, **kwargs):
22
+
23
+ def __exec_decorate_func():
24
+ params = data_pre_deal(api_name, original_func, *args, **kwargs)
25
+ result = decorate_func(params)
26
+ return result
27
+
28
+ try:
29
+ if Runtime.rank_id == -1:
30
+ Runtime.rank_id = os.environ.get("RANK_ID", -1)
31
+ if need_wrapper_func():
32
+ logger.info(f"[{api_name}] is checking.")
33
+ return __exec_decorate_func()
34
+ except Exception as e:
35
+ logger.error(f"[{api_name}] Error: {str(e)}")
36
+ logger.error(f"[{api_name}] Error detail: {traceback.format_exc()}")
37
+
38
+ return original_func(*args, **kwargs)
39
+
40
+ return fuzz_wrapper
41
+
42
+
43
+ def decorate_forward_function(func, api_name=None):
44
+ """
45
+ 前向装饰器
46
+ """
47
+
48
+ if not api_name:
49
+ api_name = func.__name__
50
+
51
+ def forward_func(params: HandlerParams):
52
+ forward = ForwardSelfChecker(api_name)
53
+ result = forward.handle(params)
54
+ return result
55
+
56
+ return decorate(func, forward_func, api_name)
57
+
58
+
59
+ def stack_depth_check() -> bool:
60
+ nested_depth = 1
61
+ frame = sys._getframe(1)
62
+ while frame:
63
+ if frame.f_code.co_name == "fuzz_wrapper":
64
+ nested_depth -= 1
65
+ if nested_depth < 0:
66
+ return False
67
+ frame = frame.f_back
68
+ return True
69
+
70
+
71
+ def get_target_arg_index(args: Tuple) -> int:
72
+ """
73
+ 类型校验
74
+
75
+ """
76
+ for i, arg in enumerate(args):
77
+ if ops.is_tensor(arg):
78
+ if not ops.is_floating_point(arg):
79
+ continue
80
+ return i
81
+ if isinstance(arg, (List, Tuple, Dict)):
82
+ return i
83
+ return -1
84
+
85
+
86
+ def data_pre_deal(api_name, func, *args, **kwargs):
87
+ params = HandlerParams()
88
+ params.args = args
89
+ params.kwargs = kwargs
90
+ params.original_func = func
91
+ index = get_target_arg_index(args)
92
+ if index == -1:
93
+ raise Exception(f"{api_name} has no supported input type")
94
+ params.index = index
95
+ return params
96
+
97
+
98
+ def need_wrapper_func():
99
+ if not (Runtime.is_running and Config.is_enable):
100
+ return False
101
+ if not stack_depth_check():
102
+ return False
103
+ if Config.steps and Runtime.step_count not in Config.steps:
104
+ return False
105
+ if Config.ranks and Runtime.rank_id != -1 and Runtime.rank_id not in Config.ranks:
106
+ return False
107
+ return True
File without changes
@@ -0,0 +1,90 @@
1
+ import math
2
+ from abc import ABC, abstractmethod
3
+ from typing import Any, Tuple, Optional
4
+
5
+ import mindspore as ms
6
+ from mindspore import Tensor, ops
7
+
8
+ from msprobe.mindspore.common.log import logger
9
+ from msprobe.mindspore.free_benchmark.common.utils import Tools
10
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
11
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
12
+
13
+
14
+ class BaseHandler(ABC):
15
+
16
+ def __init__(self, api_name: str):
17
+ self.api_name = api_name
18
+
19
+ @staticmethod
20
+ def pre_calculate(original_output, fuzzed_output):
21
+ abs_tol = FreeBenchmarkConst.PERT_VALUE_DICT.get(fuzzed_output.dtype,
22
+ FreeBenchmarkConst.PERT_VALUE_DICT.get(ms.float32))
23
+
24
+ return original_output.to(fuzzed_output.dtype), fuzzed_output, abs_tol
25
+
26
+ @staticmethod
27
+ def get_threshold(dtype):
28
+ err = Tools.get_default_error_threshold(dtype)
29
+ return err
30
+
31
+ @staticmethod
32
+ def convert_overflow_ratio_to_consistent(ratio):
33
+ if math.isnan(ratio) or math.isinf(ratio):
34
+ return FreeBenchmarkConst.NO_CHANGE_ERROR_THRESHOLD
35
+ return ratio
36
+
37
+ @staticmethod
38
+ def get_endless_norm(first_tensor, second_tensor, abs_tol):
39
+ if first_tensor.dtype != ms.bfloat16 and second_tensor.dtype != ms.bfloat16:
40
+ ratio_tensor1 = ops.where(ops.abs(second_tensor) > abs_tol, ops.div(first_tensor, second_tensor), 1)
41
+ ratio_tensor2 = ops.where(ops.abs(first_tensor) > abs_tol, ops.div(second_tensor, first_tensor), 1)
42
+ else:
43
+ ratio_tensor1 = ops.where(ops.abs(second_tensor).to(ms.float32) > abs_tol,
44
+ ops.div(first_tensor.to(ms.float32), second_tensor.to(ms.float32)), 1)
45
+ ratio_tensor2 = ops.where(ops.abs(first_tensor).to(ms.float32) > abs_tol,
46
+ ops.div(second_tensor.to(ms.float32), first_tensor.to(ms.float32)), 1)
47
+ norm1 = BaseHandler.convert_overflow_ratio_to_consistent(ops.max(ratio_tensor1)[0].to(ms.float32).item())
48
+ norm2 = BaseHandler.convert_overflow_ratio_to_consistent(ops.max(ratio_tensor2)[0].to(ms.float32).item())
49
+ norm3 = BaseHandler.convert_overflow_ratio_to_consistent(ops.min(ratio_tensor1)[0].to(ms.float32).item())
50
+ ratio = FreeBenchmarkConst.SYMBOL_FLIPPING_RATIO if norm3 < 0 else max(norm1, norm2)
51
+
52
+ return ratio
53
+
54
+ @staticmethod
55
+ def ratio_calculate(original_output, fuzzed_output) -> float:
56
+ try:
57
+ original_output, fuzzed_output, abs_tol = BaseHandler.pre_calculate(original_output, fuzzed_output)
58
+ except Exception as e:
59
+ logger.error(f"When computing ratio, y1 or y2 dtype is not supported {str(e)}")
60
+ return FreeBenchmarkConst.NO_CHANGE_ERROR_THRESHOLD
61
+
62
+ abs_tol = abs_tol ** 0.5
63
+
64
+ return BaseHandler.get_endless_norm(original_output, fuzzed_output, abs_tol)
65
+
66
+ @staticmethod
67
+ def npu_compare(original_output, fuzzed_output) -> Tuple[bool, Optional[float]]:
68
+ if not isinstance(fuzzed_output, Tensor):
69
+ logger.error(f"The compare for output type `{type(fuzzed_output)}` is not supported")
70
+ return True, 1.0
71
+
72
+ # 范数计算等
73
+ err_thd = BaseHandler.get_threshold(original_output.dtype)
74
+ ratio = BaseHandler.ratio_calculate(original_output, fuzzed_output)
75
+ is_consistent = err_thd >= ratio >= 1.0 / err_thd
76
+ return is_consistent, ratio
77
+
78
+ @staticmethod
79
+ def is_float_tensor(output) -> bool:
80
+ if isinstance(output, Tensor) and ops.is_floating_point(output):
81
+ return True
82
+ if isinstance(output, (list, tuple)):
83
+ for i in output:
84
+ if isinstance(i, Tensor) and ops.is_floating_point(i):
85
+ return True
86
+ return False
87
+
88
+ @abstractmethod
89
+ def handle(self, params: HandlerParams) -> Any:
90
+ pass
@@ -0,0 +1,41 @@
1
+ from typing import Any
2
+ from dataclasses import asdict
3
+
4
+ from mindspore import Tensor, ops
5
+
6
+ from msprobe.mindspore.common.log import logger
7
+ from msprobe.mindspore.free_benchmark.common.config import Config
8
+ from msprobe.mindspore.free_benchmark.handler.base_handler import BaseHandler
9
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
10
+ from msprobe.mindspore.free_benchmark.common.utils import make_unequal_row
11
+ from msprobe.core.data_dump.json_writer import DataWriter
12
+
13
+
14
+ class CheckHandler(BaseHandler):
15
+
16
+ def npu_compare_and_save(self, original_output, fuzzed_output, params: HandlerParams, output_index=None):
17
+ is_consistent, ratio = self.npu_compare(original_output, fuzzed_output)
18
+ params.is_consistent = params.is_consistent and is_consistent
19
+ if not is_consistent:
20
+ row = make_unequal_row(self.api_name, params, ratio, output_index)
21
+ data_dict = asdict(row)
22
+ DataWriter.write_data_to_csv(
23
+ data_dict.values(),
24
+ data_dict.keys(),
25
+ Config.dump_path
26
+ )
27
+ logger.error(f"{self.api_name} is not consistent")
28
+
29
+ def handle(self, params: HandlerParams) -> Any:
30
+ try:
31
+ if not self.is_float_tensor(params.fuzzed_result):
32
+ return params.original_result
33
+ if isinstance(params.fuzzed_result, Tensor):
34
+ self.npu_compare_and_save(params.original_result, params.fuzzed_result, params)
35
+ elif isinstance(params.fuzzed_result, (list, tuple)):
36
+ for i, item in enumerate(params.original_result):
37
+ if ops.is_tensor(item) and ops.is_floating_point(item):
38
+ self.npu_compare_and_save(item, params.fuzzed_result[i], params, output_index=i)
39
+ except Exception as e:
40
+ logger.error(str(e))
41
+ return params.original_result
@@ -0,0 +1,36 @@
1
+ from typing import Any
2
+
3
+ from mindspore import Tensor
4
+
5
+ from msprobe.mindspore.common.log import logger
6
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
7
+
8
+
9
+ class FixHandler:
10
+
11
+ def __init__(self, api_name: str):
12
+ self.api_name = api_name
13
+
14
+ @staticmethod
15
+ def use_fuzzed_result(original_result, fuzzed_result):
16
+ if isinstance(original_result, Tensor):
17
+ return fuzzed_result.to(original_result.dtype)
18
+ if isinstance(original_result, dict):
19
+ dict_fixed_result = dict()
20
+ for k, v in original_result.items():
21
+ dict_fixed_result[k] = FixHandler.use_fuzzed_result(v, fuzzed_result[k])
22
+ return dict_fixed_result
23
+ if isinstance(original_result, (tuple, list)):
24
+ list_fixed_result = list()
25
+ for i, v in enumerate(original_result):
26
+ list_fixed_result.append(FixHandler.use_fuzzed_result(v, fuzzed_result[i]))
27
+ return type(original_result)(list_fixed_result)
28
+ return original_result
29
+
30
+ def handle(self, params: HandlerParams) -> Any:
31
+ try:
32
+ return FixHandler.use_fuzzed_result(params.original_result, params.fuzzed_result)
33
+ except Exception as e:
34
+ logger.error(f"{self.api_name} failed to fix.")
35
+ logger.error(str(e))
36
+ return params.original_result
@@ -0,0 +1,21 @@
1
+ from msprobe.mindspore.common.log import logger
2
+ from msprobe.mindspore.free_benchmark.common.config import Config
3
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
4
+ from .check_handler import CheckHandler
5
+ from .fix_handler import FixHandler
6
+
7
+
8
+ class HandlerFactory:
9
+ result_handlers = {
10
+ FreeBenchmarkConst.CHECK: CheckHandler,
11
+ FreeBenchmarkConst.FIX: FixHandler,
12
+ }
13
+
14
+ @staticmethod
15
+ def create(api_name: str):
16
+ handler = HandlerFactory.result_handlers.get(Config.handler_type)
17
+ if handler:
18
+ return handler(api_name)
19
+ else:
20
+ logger.error(f"{Config.handler_type} is not supported.")
21
+ raise Exception
@@ -0,0 +1,67 @@
1
+ from typing import Any
2
+
3
+ from mindspore import Tensor, ops
4
+
5
+ from msprobe.mindspore.common.log import logger
6
+ from msprobe.mindspore.free_benchmark.perturbation.base_perturbation import BasePerturbation
7
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
8
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
9
+
10
+
11
+ class AddNoisePerturbation(BasePerturbation):
12
+
13
+ def handle(self, params: HandlerParams) -> Any:
14
+ """
15
+ 返回增加扰动后的api输出
16
+
17
+ """
18
+ params.fuzzed_value = self.add_noise(params.args[params.index])
19
+ if not self.is_fuzzed:
20
+ logger.warning(f"{self.api_name} can not add noise.")
21
+ return False
22
+ return self.get_fuzzed_result(params)
23
+
24
+ def add_noise(self, inputs) -> Any:
25
+ """
26
+ 返回增加扰动后的api输入
27
+
28
+ """
29
+ if isinstance(inputs, Tensor):
30
+ noise = self._get_noise(inputs)
31
+ if noise is not False:
32
+ result = ops.where(ops.abs(inputs) > self.perturbation_value ** 0.5,
33
+ ops.add(noise, inputs), inputs)
34
+ result = result.type(dtype=inputs.dtype)
35
+ self.is_fuzzed = True
36
+ return result
37
+
38
+ if isinstance(inputs, dict):
39
+ return {k: self.add_noise(v) for k, v in inputs.items()}
40
+
41
+ if isinstance(inputs, (list, tuple)):
42
+ return [self.add_noise(v) for v in inputs]
43
+
44
+ return inputs
45
+
46
+ def _get_noise(self, input):
47
+ """
48
+ 得到要添加的噪声值
49
+
50
+ """
51
+ if self.is_fuzzed:
52
+ return False
53
+ if not ops.is_floating_point(input) or ops.numel(input) == 0:
54
+ return False
55
+
56
+ pert_value = FreeBenchmarkConst.PERT_VALUE_DICT.get(input.dtype)
57
+ if not pert_value:
58
+ return False
59
+ else:
60
+ self.perturbation_value = pert_value
61
+
62
+ max_val = ops.max(ops.abs(input))[0].item()
63
+ if max_val < pert_value:
64
+ return False
65
+
66
+ noise = ops.full(input.shape, self.perturbation_value, dtype=input.dtype)
67
+ return noise
@@ -0,0 +1,21 @@
1
+ from typing import Any
2
+
3
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
4
+
5
+
6
+ class BasePerturbation:
7
+
8
+ def __init__(self, api_name: str):
9
+ self.api_name = api_name
10
+ self.is_fuzzed = False
11
+ self.perturbation_value = None
12
+
13
+ @staticmethod
14
+ def get_fuzzed_result(params: HandlerParams):
15
+ args_front = params.args[:params.index]
16
+ args_rear = params.args[params.index + 1:]
17
+ fuzzed_result = params.original_func(*args_front, params.fuzzed_value, *args_rear, **params.kwargs)
18
+ return fuzzed_result
19
+
20
+ def handler(self, params: HandlerParams) -> Any:
21
+ pass
@@ -0,0 +1,63 @@
1
+ from typing import Any
2
+
3
+ import numpy as np
4
+ from mindspore import Tensor, ops
5
+
6
+ from msprobe.mindspore.common.log import logger
7
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
8
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
9
+ from msprobe.mindspore.free_benchmark.perturbation.base_perturbation import BasePerturbation
10
+
11
+
12
+ class BitNoisePerturbation(BasePerturbation):
13
+
14
+ def add_bit_noise(self, inputs) -> Any:
15
+ if isinstance(inputs, Tensor):
16
+ bit_len_type = self._get_bit_len_type(inputs)
17
+ if bit_len_type is not False:
18
+ sub_normal_np = np.finfo(FreeBenchmarkConst.MS_NUMPY_DTYPE_DICT.get(inputs.dtype)).smallest_normal
19
+ sub_normal = Tensor(sub_normal_np)
20
+ noise_type = list(FreeBenchmarkConst.MS_NUMPY_DTYPE_DICT.keys())[
21
+ list(FreeBenchmarkConst.MS_NUMPY_DTYPE_DICT.values()).index(bit_len_type)]
22
+ noise = ops.full(inputs.shape, 1, dtype=noise_type)
23
+ input_np = inputs.asnumpy()
24
+ input_np_int = input_np.view(bit_len_type)
25
+ result = Tensor(input_np_int)
26
+ result = ops.where(ops.abs(inputs) > sub_normal,
27
+ ops.bitwise_xor(result, noise), result)
28
+ result_np = result.asnumpy()
29
+ result_np_float = result_np.view(FreeBenchmarkConst.MS_NUMPY_DTYPE_DICT.get(inputs.dtype))
30
+ self.is_fuzzed = True
31
+ return Tensor(result_np_float)
32
+
33
+ if isinstance(inputs, dict):
34
+ return {k: self.add_bit_noise(v) for k, v in inputs.items()}
35
+ if isinstance(inputs, (tuple, list)):
36
+ return type(inputs)([self.add_bit_noise(v) for v in inputs])
37
+ return inputs
38
+
39
+ def handle(self, params: HandlerParams) -> any:
40
+ args = params.args
41
+ params.fuzzed_value = self.add_bit_noise(params.args[params.index])
42
+ if not self.is_fuzzed:
43
+ logger.warning(f"{self.api_name} can not add bit noise.")
44
+ return False
45
+ params.args = args
46
+ return self.get_fuzzed_result(params)
47
+
48
+ def _get_bit_len_type(self, input):
49
+ if self.is_fuzzed:
50
+ return False
51
+ if not isinstance(input, Tensor) or not ops.is_floating_point(input) or \
52
+ input.numel() == 0:
53
+ return False
54
+ bit_len_type = FreeBenchmarkConst.PERT_BIT_DICT.get(input.dtype)
55
+ if not bit_len_type:
56
+ return False
57
+ pert_value = FreeBenchmarkConst.PERT_VALUE_DICT.get(input.dtype)
58
+ if not pert_value:
59
+ return False
60
+ max_val = ops.max(ops.abs(input))[0].item()
61
+ if max_val < pert_value:
62
+ return False
63
+ return bit_len_type
@@ -0,0 +1,34 @@
1
+ from typing import Any
2
+
3
+ import mindspore as ms
4
+ from mindspore import Tensor, ops
5
+
6
+ from msprobe.mindspore.free_benchmark.perturbation.base_perturbation import BasePerturbation
7
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
8
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
9
+ from msprobe.mindspore.common.log import logger
10
+
11
+
12
+ class ImprovePrecisionPerturbation(BasePerturbation):
13
+
14
+ def improve_tensor_precision(self, target_tensor):
15
+ if isinstance(target_tensor, Tensor) and ops.is_floating_point(target_tensor) and \
16
+ target_tensor.dtype not in [ms.float64, ms.float32]:
17
+ self.is_fuzzed = True
18
+ return target_tensor.to(ms.float32)
19
+ if isinstance(target_tensor, dict):
20
+ return {k: self.improve_tensor_precision(v) for k, v in target_tensor.items()}
21
+ if isinstance(target_tensor, (tuple, list)):
22
+ return type(target_tensor)([self.improve_tensor_precision(v) for v in target_tensor])
23
+ return target_tensor
24
+
25
+ def handle(self, params: HandlerParams) -> Any:
26
+ args = self.improve_tensor_precision(params.args)
27
+ kwargs = self.improve_tensor_precision(params.kwargs)
28
+ fuzzed_value = args
29
+ if self.api_name in FreeBenchmarkConst.COMMUNICATION_API_LIST:
30
+ params.fuzzed_value = fuzzed_value
31
+ if not self.is_fuzzed:
32
+ logger.warning(f"{self.api_name} can not improve precision.")
33
+ return False
34
+ return params.original_func(*args, **kwargs)
@@ -0,0 +1,12 @@
1
+ from typing import Any
2
+
3
+ from msprobe.mindspore.free_benchmark.perturbation.base_perturbation import BasePerturbation
4
+ from msprobe.mindspore.free_benchmark.common.handler_params import HandlerParams
5
+
6
+
7
+ class NoChangePerturbation(BasePerturbation):
8
+
9
+ def handle(self, params: HandlerParams) -> Any:
10
+ params.fuzzed_value = params.args[params.index]
11
+ self.is_fuzzed = True
12
+ return self.get_fuzzed_result(params)
@@ -0,0 +1,27 @@
1
+ from msprobe.mindspore.common.const import FreeBenchmarkConst
2
+ from msprobe.mindspore.free_benchmark.common.config import Config
3
+ from .add_noise import AddNoisePerturbation
4
+ from .bit_noise import BitNoisePerturbation
5
+ from .no_change import NoChangePerturbation
6
+ from .improve_precision import ImprovePrecisionPerturbation
7
+
8
+
9
+ class PerturbationFactory:
10
+ """
11
+ 扰动工厂类
12
+
13
+ """
14
+ perturbations = {
15
+ FreeBenchmarkConst.IMPROVE_PRECISION: ImprovePrecisionPerturbation,
16
+ FreeBenchmarkConst.ADD_NOISE: AddNoisePerturbation,
17
+ FreeBenchmarkConst.BIT_NOISE: BitNoisePerturbation,
18
+ FreeBenchmarkConst.NO_CHANGE: NoChangePerturbation,
19
+ }
20
+
21
+ @staticmethod
22
+ def create(api_name: str):
23
+ perturbation = PerturbationFactory.perturbations.get(Config.pert_type)
24
+ if perturbation:
25
+ return perturbation(api_name)
26
+ else:
27
+ raise Exception(f'{Config.pert_type} is a invalid perturbation type')
@@ -0,0 +1,33 @@
1
+ from msprobe.mindspore.common.const import Const
2
+ from msprobe.mindspore.debugger.debugger_config import DebuggerConfig
3
+ from msprobe.mindspore.free_benchmark.api_pynative_self_check import ApiPyNativeSelFCheck
4
+
5
+
6
+ class SelfCheckToolFactory:
7
+ tools = {
8
+ Const.CELL: {
9
+ Const.GRAPH_KBYK_MODE: None,
10
+ Const.GRAPH_GE_MODE: None,
11
+ Const.PYNATIVE_MODE: None
12
+ },
13
+ Const.API: {
14
+ Const.GRAPH_KBYK_MODE: None,
15
+ Const.GRAPH_GE_MODE: None,
16
+ Const.PYNATIVE_MODE: ApiPyNativeSelFCheck
17
+ },
18
+ Const.KERNEL: {
19
+ Const.GRAPH_KBYK_MODE: None,
20
+ Const.GRAPH_GE_MODE: None,
21
+ Const.PYNATIVE_MODE: None
22
+ }
23
+ }
24
+
25
+ @staticmethod
26
+ def create(config: DebuggerConfig):
27
+ tool = SelfCheckToolFactory.tools.get(config.level)
28
+ if not tool:
29
+ raise Exception(f"{config.level} is not supported.")
30
+ tool = tool.get(config.execution_mode)
31
+ if not tool:
32
+ raise Exception(f"Task free_benchmark is not supported in this mode: {config.execution_mode}.")
33
+ return tool(config)
File without changes