mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/LICENSE +201 -201
- {mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/METADATA +36 -34
- mindstudio_probe-1.1.0.dist-info/RECORD +287 -0
- {mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/WHEEL +1 -1
- {mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/entry_points.txt +1 -0
- msprobe/README.md +131 -237
- msprobe/__init__.py +16 -1
- msprobe/{config/config.json → config.json} +47 -49
- msprobe/core/advisor/advisor.py +124 -124
- msprobe/core/advisor/advisor_const.py +58 -59
- msprobe/core/advisor/advisor_result.py +58 -58
- msprobe/core/common/const.py +402 -318
- msprobe/core/common/exceptions.py +99 -99
- msprobe/core/common/{file_check.py → file_utils.py} +523 -283
- msprobe/core/common/inplace_op_checker.py +38 -0
- msprobe/core/common/inplace_ops.yaml +251 -0
- msprobe/core/common/log.py +86 -69
- msprobe/core/common/utils.py +371 -616
- msprobe/core/common_config.py +78 -71
- msprobe/core/compare/acc_compare.py +472 -298
- msprobe/core/compare/check.py +180 -95
- msprobe/core/compare/compare_cli.py +69 -49
- msprobe/core/compare/highlight.py +259 -222
- msprobe/core/compare/multiprocessing_compute.py +174 -149
- msprobe/core/compare/npy_compare.py +310 -295
- msprobe/core/compare/utils.py +464 -429
- msprobe/core/data_dump/data_collector.py +153 -144
- msprobe/core/data_dump/data_processor/base.py +337 -293
- msprobe/core/data_dump/data_processor/factory.py +76 -59
- msprobe/core/data_dump/data_processor/mindspore_processor.py +192 -198
- msprobe/core/data_dump/data_processor/pytorch_processor.py +383 -389
- msprobe/core/data_dump/json_writer.py +117 -116
- msprobe/core/data_dump/scope.py +194 -178
- msprobe/core/grad_probe/constant.py +74 -70
- msprobe/core/grad_probe/grad_compare.py +170 -175
- msprobe/core/grad_probe/utils.py +77 -52
- msprobe/docs/01.installation.md +99 -0
- msprobe/docs/02.config_introduction.md +137 -0
- msprobe/docs/03.config_examples.md +237 -0
- msprobe/docs/04.acl_config_examples.md +78 -0
- msprobe/docs/05.data_dump_PyTorch.md +326 -0
- msprobe/docs/06.data_dump_MindSpore.md +285 -0
- msprobe/docs/07.accuracy_checker_PyTorch.md +297 -0
- msprobe/docs/08.accuracy_checker_online_PyTorch.md +238 -0
- msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
- msprobe/docs/10.accuracy_compare_PyTorch.md +327 -0
- msprobe/docs/11.accuracy_compare_MindSpore.md +333 -0
- msprobe/docs/12.overflow_check_PyTorch.md +79 -0
- msprobe/docs/13.overflow_check_MindSpore.md +31 -0
- msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
- msprobe/docs/15.free_benchmarking_PyTorch.md +170 -0
- msprobe/docs/16.free_benchmarking_MindSpore.md +140 -0
- msprobe/{doc/grad_probe/grad_probe.md → docs/17.grad_probe.md} +205 -207
- msprobe/{pytorch/doc//321/205/320/254/320/270/321/207/342/225/221/342/224/220/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/206/320/277/320/244/321/205/320/277/342/225/243.md → docs/18.online_dispatch.md} +89 -90
- msprobe/docs/FAQ.md +189 -0
- msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
- msprobe/docs/img/free_benchmark_framework.png +0 -0
- msprobe/docs/img/ms_dump.png +0 -0
- msprobe/docs/img/ms_layer.png +0 -0
- msprobe/docs/img/pt_dump.png +0 -0
- msprobe/mindspore/__init__.py +2 -1
- msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +278 -245
- msprobe/mindspore/api_accuracy_checker/api_info.py +76 -69
- msprobe/mindspore/api_accuracy_checker/api_runner.py +155 -151
- msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +196 -196
- msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
- msprobe/mindspore/api_accuracy_checker/compute_element.py +238 -223
- msprobe/mindspore/api_accuracy_checker/main.py +8 -15
- msprobe/mindspore/api_accuracy_checker/type_mapping.py +113 -113
- msprobe/mindspore/api_accuracy_checker/utils.py +79 -62
- msprobe/mindspore/cell_processor.py +58 -34
- msprobe/mindspore/common/const.py +108 -87
- msprobe/mindspore/common/log.py +37 -37
- msprobe/mindspore/common/utils.py +97 -57
- msprobe/mindspore/compare/distributed_compare.py +62 -75
- msprobe/mindspore/compare/layer_mapping.py +146 -0
- msprobe/mindspore/compare/modify_mapping.py +107 -0
- msprobe/mindspore/compare/ms_compare.py +357 -117
- msprobe/mindspore/compare/ms_graph_compare.py +364 -317
- msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -399
- msprobe/mindspore/debugger/debugger_config.py +69 -74
- msprobe/mindspore/debugger/precision_debugger.py +150 -107
- msprobe/mindspore/dump/dump_tool_factory.py +50 -35
- msprobe/mindspore/dump/hook_cell/api_registry.py +128 -104
- msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -53
- msprobe/mindspore/dump/hook_cell/primitive_hooks.py +206 -0
- msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +994 -925
- msprobe/mindspore/dump/hook_cell/wrap_api.py +121 -0
- msprobe/mindspore/dump/jit_dump.py +96 -56
- msprobe/mindspore/dump/kernel_graph_dump.py +75 -60
- msprobe/mindspore/dump/kernel_kbyk_dump.py +79 -65
- msprobe/mindspore/free_benchmark/api_pynative_self_check.py +131 -116
- msprobe/mindspore/free_benchmark/common/config.py +27 -12
- msprobe/mindspore/free_benchmark/common/handler_params.py +32 -17
- msprobe/mindspore/free_benchmark/common/utils.py +85 -71
- msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -842
- msprobe/mindspore/free_benchmark/decorator/dec_forward.py +57 -42
- msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +122 -107
- msprobe/mindspore/free_benchmark/handler/base_handler.py +105 -90
- msprobe/mindspore/free_benchmark/handler/check_handler.py +56 -41
- msprobe/mindspore/free_benchmark/handler/fix_handler.py +51 -36
- msprobe/mindspore/free_benchmark/handler/handler_factory.py +36 -21
- msprobe/mindspore/free_benchmark/perturbation/add_noise.py +82 -67
- msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +36 -21
- msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +78 -63
- msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +77 -0
- msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +49 -34
- msprobe/mindspore/free_benchmark/perturbation/no_change.py +27 -12
- msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +44 -27
- msprobe/mindspore/free_benchmark/self_check_tool_factory.py +48 -33
- msprobe/mindspore/grad_probe/global_context.py +100 -91
- msprobe/mindspore/grad_probe/grad_analyzer.py +231 -231
- msprobe/mindspore/grad_probe/grad_monitor.py +27 -27
- msprobe/mindspore/grad_probe/grad_stat_csv.py +131 -131
- msprobe/mindspore/grad_probe/hook.py +94 -92
- msprobe/mindspore/grad_probe/utils.py +29 -28
- msprobe/mindspore/ms_config.py +128 -126
- msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +60 -45
- msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +49 -34
- msprobe/mindspore/runtime.py +4 -4
- msprobe/mindspore/service.py +297 -354
- msprobe/mindspore/task_handler_factory.py +24 -24
- msprobe/msprobe.py +105 -107
- msprobe/pytorch/__init__.py +23 -4
- msprobe/pytorch/api_accuracy_checker/common/config.py +70 -55
- msprobe/pytorch/api_accuracy_checker/common/utils.py +246 -165
- msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +230 -213
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +632 -581
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
- msprobe/pytorch/api_accuracy_checker/compare/compare.py +416 -381
- msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +90 -73
- msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +265 -244
- msprobe/pytorch/api_accuracy_checker/config.yaml +10 -10
- msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +370 -332
- msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +221 -199
- msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +150 -134
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +518 -581
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +213 -74
- msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +218 -202
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +370 -324
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +227 -204
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +110 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +244 -218
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/torch_ops_config.yaml +63 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +44 -0
- msprobe/pytorch/bench_functions/__init__.py +30 -15
- msprobe/pytorch/bench_functions/apply_adam_w.py +43 -28
- msprobe/pytorch/bench_functions/confusion_transpose.py +34 -19
- msprobe/pytorch/bench_functions/fast_gelu.py +70 -55
- msprobe/pytorch/bench_functions/layer_norm_eval.py +21 -6
- msprobe/pytorch/bench_functions/linear.py +27 -12
- msprobe/pytorch/bench_functions/matmul_backward.py +63 -48
- msprobe/pytorch/bench_functions/npu_fusion_attention.py +538 -421
- msprobe/pytorch/bench_functions/rms_norm.py +30 -15
- msprobe/pytorch/bench_functions/rotary_mul.py +71 -52
- msprobe/pytorch/bench_functions/scaled_mask_softmax.py +41 -26
- msprobe/pytorch/bench_functions/swiglu.py +70 -55
- msprobe/pytorch/common/__init__.py +17 -2
- msprobe/pytorch/common/compare_script.template +14 -14
- msprobe/pytorch/common/log.py +33 -32
- msprobe/pytorch/common/parse_json.py +54 -39
- msprobe/pytorch/common/utils.py +310 -300
- msprobe/pytorch/compare/distributed_compare.py +66 -66
- msprobe/pytorch/compare/mapping.yaml +607 -607
- msprobe/pytorch/compare/match.py +49 -33
- msprobe/pytorch/compare/pt_compare.py +82 -40
- msprobe/pytorch/debugger/debugger_config.py +108 -95
- msprobe/pytorch/debugger/precision_debugger.py +173 -125
- msprobe/pytorch/free_benchmark/__init__.py +23 -8
- msprobe/pytorch/free_benchmark/common/constant.py +70 -70
- msprobe/pytorch/free_benchmark/common/counter.py +71 -71
- msprobe/pytorch/free_benchmark/common/enums.py +65 -37
- msprobe/pytorch/free_benchmark/common/params.py +144 -129
- msprobe/pytorch/free_benchmark/common/utils.py +118 -102
- msprobe/pytorch/free_benchmark/compare/grad_saver.py +200 -179
- msprobe/pytorch/free_benchmark/compare/single_benchmark.py +119 -104
- msprobe/pytorch/free_benchmark/main.py +120 -105
- msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +28 -13
- msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +56 -41
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +105 -90
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +119 -104
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +87 -63
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +83 -68
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +43 -28
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +60 -45
- msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +34 -19
- msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +256 -217
- msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +54 -39
- msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +38 -23
- msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +45 -30
- msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +185 -170
- msprobe/pytorch/function_factory.py +91 -75
- msprobe/pytorch/functional/module_dump.py +84 -0
- msprobe/pytorch/grad_probe/grad_monitor.py +91 -90
- msprobe/pytorch/grad_probe/grad_stat_csv.py +128 -128
- msprobe/pytorch/hook_module/__init__.py +16 -1
- msprobe/pytorch/hook_module/api_registry.py +166 -161
- msprobe/pytorch/hook_module/hook_module.py +118 -120
- msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1877
- msprobe/pytorch/hook_module/utils.py +28 -29
- msprobe/pytorch/hook_module/wrap_aten.py +111 -110
- msprobe/pytorch/hook_module/wrap_distributed.py +77 -78
- msprobe/pytorch/hook_module/wrap_functional.py +104 -105
- msprobe/pytorch/hook_module/wrap_npu_custom.py +85 -84
- msprobe/pytorch/hook_module/wrap_tensor.py +69 -71
- msprobe/pytorch/hook_module/wrap_torch.py +84 -86
- msprobe/pytorch/hook_module/wrap_vf.py +60 -62
- msprobe/pytorch/module_processer.py +153 -138
- msprobe/pytorch/online_dispatch/__init__.py +20 -20
- msprobe/pytorch/online_dispatch/compare.py +235 -236
- msprobe/pytorch/online_dispatch/dispatch.py +271 -271
- msprobe/pytorch/online_dispatch/dump_compare.py +155 -156
- msprobe/pytorch/online_dispatch/single_compare.py +391 -391
- msprobe/pytorch/online_dispatch/torch_ops_config.yaml +57 -49
- msprobe/pytorch/online_dispatch/utils.py +127 -146
- msprobe/pytorch/parse.py +19 -4
- msprobe/pytorch/parse_tool/cli.py +31 -32
- msprobe/pytorch/parse_tool/lib/compare.py +259 -271
- msprobe/pytorch/parse_tool/lib/config.py +52 -52
- msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
- msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
- msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
- msprobe/pytorch/parse_tool/lib/parse_tool.py +161 -158
- msprobe/pytorch/parse_tool/lib/utils.py +320 -321
- msprobe/pytorch/parse_tool/lib/visualization.py +85 -91
- msprobe/pytorch/pt_config.py +317 -187
- msprobe/pytorch/service.py +311 -252
- mindstudio_probe-1.0.3.dist-info/RECORD +0 -272
- msprobe/config/README.md +0 -539
- msprobe/mindspore/doc/compare.md +0 -58
- msprobe/mindspore/doc/dump.md +0 -217
- msprobe/mindspore/dump/hook_cell/wrap_functional.py +0 -91
- msprobe/mindspore/dump/hook_cell/wrap_tensor.py +0 -63
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +0 -10
- msprobe/pytorch/doc/FAQ.md +0 -193
- msprobe/pytorch/doc/api_accuracy_checker.md +0 -313
- msprobe/pytorch/doc/api_accuracy_checker_online.md +0 -187
- msprobe/pytorch/doc/dump.md +0 -260
- msprobe/pytorch/doc/msprobe/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -182
- msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -240
- msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
- msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
- msprobe/pytorch/doc/run_overflow_check.md +0 -25
- msprobe/pytorch/doc//321/206/320/247/320/260/321/206/320/260/320/227/321/206/320/255/320/226/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/205/320/254/342/225/221/321/206/320/251/320/277/321/211/320/272/320/234/321/210/320/277/320/221/321/205/320/242/320/234/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -151
- msprobe/pytorch/functional/data_processor.py +0 -0
- msprobe/pytorch/functional/dump_module.py +0 -39
- {mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/top_level.txt +0 -0
- /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
- /msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
- /msprobe/{config → docs}/img/free_benchmark.png +0 -0
- /msprobe/{doc/grad_probe/img/image-1.png → docs/img/grad_probe_image-1.png} +0 -0
- /msprobe/{doc/grad_probe/img/image-2.png → docs/img/grad_probe_image-2.png} +0 -0
- /msprobe/{doc/grad_probe/img/image-3.png → docs/img/grad_probe_image-3.png} +0 -0
- /msprobe/{doc/grad_probe/img/image-4.png → docs/img/grad_probe_image-4.png} +0 -0
- /msprobe/{doc/grad_probe/img/image.png → docs/img/grad_probe_image.png} +0 -0
- /msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0
|
@@ -1,381 +1,416 @@
|
|
|
1
|
-
|
|
2
|
-
|
|
3
|
-
|
|
4
|
-
|
|
5
|
-
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
|
|
13
|
-
|
|
14
|
-
|
|
15
|
-
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
|
|
21
|
-
|
|
22
|
-
|
|
23
|
-
|
|
24
|
-
|
|
25
|
-
|
|
26
|
-
|
|
27
|
-
|
|
28
|
-
|
|
29
|
-
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
|
|
34
|
-
|
|
35
|
-
|
|
36
|
-
|
|
37
|
-
|
|
38
|
-
|
|
39
|
-
|
|
40
|
-
|
|
41
|
-
|
|
42
|
-
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
|
|
46
|
-
|
|
47
|
-
|
|
48
|
-
|
|
49
|
-
|
|
50
|
-
|
|
51
|
-
|
|
52
|
-
|
|
53
|
-
|
|
54
|
-
|
|
55
|
-
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
|
|
59
|
-
|
|
60
|
-
|
|
61
|
-
|
|
62
|
-
|
|
63
|
-
|
|
64
|
-
|
|
65
|
-
|
|
66
|
-
|
|
67
|
-
|
|
68
|
-
|
|
69
|
-
|
|
70
|
-
|
|
71
|
-
|
|
72
|
-
|
|
73
|
-
else:
|
|
74
|
-
|
|
75
|
-
|
|
76
|
-
@staticmethod
|
|
77
|
-
def
|
|
78
|
-
|
|
79
|
-
|
|
80
|
-
|
|
81
|
-
|
|
82
|
-
|
|
83
|
-
|
|
84
|
-
|
|
85
|
-
|
|
86
|
-
|
|
87
|
-
|
|
88
|
-
|
|
89
|
-
|
|
90
|
-
|
|
91
|
-
|
|
92
|
-
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
|
|
96
|
-
|
|
97
|
-
|
|
98
|
-
|
|
99
|
-
|
|
100
|
-
|
|
101
|
-
|
|
102
|
-
|
|
103
|
-
|
|
104
|
-
|
|
105
|
-
|
|
106
|
-
|
|
107
|
-
|
|
108
|
-
|
|
109
|
-
|
|
110
|
-
|
|
111
|
-
|
|
112
|
-
|
|
113
|
-
|
|
114
|
-
|
|
115
|
-
|
|
116
|
-
|
|
117
|
-
|
|
118
|
-
|
|
119
|
-
|
|
120
|
-
|
|
121
|
-
|
|
122
|
-
|
|
123
|
-
|
|
124
|
-
|
|
125
|
-
|
|
126
|
-
|
|
127
|
-
|
|
128
|
-
|
|
129
|
-
|
|
130
|
-
|
|
131
|
-
|
|
132
|
-
|
|
133
|
-
|
|
134
|
-
|
|
135
|
-
|
|
136
|
-
|
|
137
|
-
|
|
138
|
-
|
|
139
|
-
|
|
140
|
-
|
|
141
|
-
|
|
142
|
-
|
|
143
|
-
|
|
144
|
-
|
|
145
|
-
|
|
146
|
-
|
|
147
|
-
|
|
148
|
-
|
|
149
|
-
|
|
150
|
-
|
|
151
|
-
|
|
152
|
-
|
|
153
|
-
|
|
154
|
-
|
|
155
|
-
|
|
156
|
-
|
|
157
|
-
|
|
158
|
-
|
|
159
|
-
|
|
160
|
-
|
|
161
|
-
|
|
162
|
-
|
|
163
|
-
|
|
164
|
-
|
|
165
|
-
|
|
166
|
-
|
|
167
|
-
|
|
168
|
-
|
|
169
|
-
|
|
170
|
-
|
|
171
|
-
|
|
172
|
-
|
|
173
|
-
|
|
174
|
-
|
|
175
|
-
|
|
176
|
-
|
|
177
|
-
|
|
178
|
-
|
|
179
|
-
|
|
180
|
-
|
|
181
|
-
|
|
182
|
-
|
|
183
|
-
|
|
184
|
-
|
|
185
|
-
|
|
186
|
-
|
|
187
|
-
|
|
188
|
-
|
|
189
|
-
|
|
190
|
-
|
|
191
|
-
|
|
192
|
-
|
|
193
|
-
|
|
194
|
-
|
|
195
|
-
|
|
196
|
-
|
|
197
|
-
|
|
198
|
-
|
|
199
|
-
|
|
200
|
-
|
|
201
|
-
|
|
202
|
-
|
|
203
|
-
|
|
204
|
-
|
|
205
|
-
|
|
206
|
-
|
|
207
|
-
|
|
208
|
-
|
|
209
|
-
|
|
210
|
-
|
|
211
|
-
|
|
212
|
-
|
|
213
|
-
|
|
214
|
-
|
|
215
|
-
|
|
216
|
-
|
|
217
|
-
|
|
218
|
-
|
|
219
|
-
|
|
220
|
-
|
|
221
|
-
|
|
222
|
-
|
|
223
|
-
|
|
224
|
-
|
|
225
|
-
|
|
226
|
-
|
|
227
|
-
|
|
228
|
-
|
|
229
|
-
|
|
230
|
-
|
|
231
|
-
|
|
232
|
-
|
|
233
|
-
|
|
234
|
-
|
|
235
|
-
|
|
236
|
-
|
|
237
|
-
|
|
238
|
-
|
|
239
|
-
|
|
240
|
-
|
|
241
|
-
|
|
242
|
-
|
|
243
|
-
|
|
244
|
-
|
|
245
|
-
|
|
246
|
-
|
|
247
|
-
|
|
248
|
-
|
|
249
|
-
|
|
250
|
-
|
|
251
|
-
|
|
252
|
-
|
|
253
|
-
|
|
254
|
-
|
|
255
|
-
|
|
256
|
-
|
|
257
|
-
|
|
258
|
-
|
|
259
|
-
|
|
260
|
-
|
|
261
|
-
|
|
262
|
-
|
|
263
|
-
|
|
264
|
-
|
|
265
|
-
|
|
266
|
-
|
|
267
|
-
|
|
268
|
-
|
|
269
|
-
|
|
270
|
-
|
|
271
|
-
|
|
272
|
-
|
|
273
|
-
|
|
274
|
-
|
|
275
|
-
|
|
276
|
-
|
|
277
|
-
|
|
278
|
-
|
|
279
|
-
|
|
280
|
-
|
|
281
|
-
|
|
282
|
-
|
|
283
|
-
|
|
284
|
-
|
|
285
|
-
|
|
286
|
-
|
|
287
|
-
|
|
288
|
-
|
|
289
|
-
|
|
290
|
-
|
|
291
|
-
|
|
292
|
-
|
|
293
|
-
|
|
294
|
-
|
|
295
|
-
def
|
|
296
|
-
|
|
297
|
-
|
|
298
|
-
|
|
299
|
-
|
|
300
|
-
|
|
301
|
-
|
|
302
|
-
|
|
303
|
-
|
|
304
|
-
|
|
305
|
-
|
|
306
|
-
|
|
307
|
-
|
|
308
|
-
|
|
309
|
-
|
|
310
|
-
|
|
311
|
-
|
|
312
|
-
|
|
313
|
-
|
|
314
|
-
|
|
315
|
-
|
|
316
|
-
|
|
317
|
-
|
|
318
|
-
|
|
319
|
-
|
|
320
|
-
|
|
321
|
-
|
|
322
|
-
|
|
323
|
-
|
|
324
|
-
|
|
325
|
-
|
|
326
|
-
|
|
327
|
-
|
|
328
|
-
|
|
329
|
-
|
|
330
|
-
|
|
331
|
-
|
|
332
|
-
|
|
333
|
-
|
|
334
|
-
|
|
335
|
-
|
|
336
|
-
|
|
337
|
-
|
|
338
|
-
|
|
339
|
-
|
|
340
|
-
|
|
341
|
-
|
|
342
|
-
|
|
343
|
-
|
|
344
|
-
|
|
345
|
-
|
|
346
|
-
|
|
347
|
-
|
|
348
|
-
|
|
349
|
-
|
|
350
|
-
|
|
351
|
-
|
|
352
|
-
|
|
353
|
-
|
|
354
|
-
|
|
355
|
-
|
|
356
|
-
|
|
357
|
-
|
|
358
|
-
|
|
359
|
-
|
|
360
|
-
|
|
361
|
-
|
|
362
|
-
|
|
363
|
-
|
|
364
|
-
|
|
365
|
-
|
|
366
|
-
|
|
367
|
-
|
|
368
|
-
|
|
369
|
-
|
|
370
|
-
|
|
371
|
-
|
|
372
|
-
|
|
373
|
-
|
|
374
|
-
|
|
375
|
-
|
|
376
|
-
|
|
377
|
-
|
|
378
|
-
|
|
379
|
-
|
|
380
|
-
|
|
381
|
-
|
|
1
|
+
#!/usr/bin/env python3
|
|
2
|
+
# -*- coding: utf-8 -*-
|
|
3
|
+
# Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
|
|
4
|
+
# All rights reserved.
|
|
5
|
+
#
|
|
6
|
+
# Licensed under the Apache License, Version 2.0 (the "License");
|
|
7
|
+
# you may not use this file except in compliance with the License.
|
|
8
|
+
# You may obtain a copy of the License at
|
|
9
|
+
#
|
|
10
|
+
# http://www.apache.org/licenses/LICENSE-2.0
|
|
11
|
+
#
|
|
12
|
+
# Unless required by applicable law or agreed to in writing, software
|
|
13
|
+
# distributed under the License is distributed on an "AS IS" BASIS,
|
|
14
|
+
# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
|
|
15
|
+
# See the License for the specific language governing permissions and
|
|
16
|
+
# limitations under the License.
|
|
17
|
+
|
|
18
|
+
# 进行比对及结果展示
|
|
19
|
+
import os
|
|
20
|
+
from collections import namedtuple
|
|
21
|
+
|
|
22
|
+
import numpy as np
|
|
23
|
+
from msprobe.core.common.utils import CompareException
|
|
24
|
+
from msprobe.core.common.file_utils import get_json_contents, write_csv
|
|
25
|
+
import torch
|
|
26
|
+
from msprobe.core.common.const import CompareConst
|
|
27
|
+
from msprobe.pytorch.api_accuracy_checker.compare.algorithm import get_rmse, get_error_balance, get_max_rel_err, \
|
|
28
|
+
get_mean_rel_err, get_rel_err, get_abs_err, get_max_abs_err, get_rel_err_ratio, cosine_sim, get_rel_err_origin, \
|
|
29
|
+
get_small_value_err_ratio, get_finite_and_infinite_mask, get_small_value_mask, check_inf_nan_value, \
|
|
30
|
+
check_small_value, check_norm_value, get_abs_bench_with_eps, get_ulp_err
|
|
31
|
+
from msprobe.pytorch.api_accuracy_checker.common.config import msCheckerConfig
|
|
32
|
+
from msprobe.pytorch.api_accuracy_checker.compare.compare_column import CompareColumn
|
|
33
|
+
from msprobe.pytorch.api_accuracy_checker.compare.compare_utils import check_dtype_comparable, \
|
|
34
|
+
DETAIL_TEST_ROWS, precision_configs, BENCHMARK_COMPARE_SUPPORT_LIST, absolute_standard_api, binary_standard_api, \
|
|
35
|
+
ulp_standard_api, thousandth_standard_api, apis_threshold
|
|
36
|
+
from msprobe.pytorch.api_accuracy_checker.common.utils import extract_basic_api_segments
|
|
37
|
+
from msprobe.pytorch.common.log import logger
|
|
38
|
+
|
|
39
|
+
|
|
40
|
+
# Field order matters: code in this module reads result tuples by position
# (index 3 is the forward compare results, index 4 the backward ones).
_RESULT_INFO_FIELDS = (
    'full_api_name',
    'fwd_success_status',
    'bwd_success_status',
    'fwd_compare_alg_results',
    'bwd_compare_alg_results',
    'rank',
)
ResultInfo = namedtuple('ResultInfo', _RESULT_INFO_FIELDS)


# Positional indices used when reading a test-result tuple.
INDEX_TEST_RESULT_GROUP = 3  # first slot after (name, forward status, backward status)
INDEX_FIRST_GROUP = 0  # first entry inside a result group
INDEX_MESSAGE = -1  # the message is the last element of a result entry
|
|
47
|
+
|
|
48
|
+
|
|
49
|
+
class Comparator:
|
|
50
|
+
# consts for result csv
|
|
51
|
+
COLUMN_API_NAME = "API name"
|
|
52
|
+
COLUMN_FORWARD_SUCCESS = "Forward Test Success"
|
|
53
|
+
COLUMN_BACKWARD_SUCCESS = "Backward Test Success"
|
|
54
|
+
COLUMN_STACK_INFO = "Traceback callstack info"
|
|
55
|
+
|
|
56
|
+
def __init__(self, result_csv_path, details_csv_path, is_continue_run_ut, stack_info_json_path=None, config=None):
    """Prepare the summary/detail CSV targets and optional stack information.

    Args:
        result_csv_path: Path of the summary CSV.
        details_csv_path: Path of the detail CSV.
        is_continue_run_ut: When falsy, ``write_csv_title`` is called to write
            the CSV headers.
        stack_info_json_path: Optional JSON path; when truthy its contents are
            loaded with ``get_json_contents`` into ``self.stack_info``.
        config: Optional object exposing ``online_config.is_online`` and
            ``online_config.rank_list``. In online mode one CSV per rank is used.
    """
    summary_pattern, detail_pattern = result_csv_path, details_csv_path
    summary_paths, detail_paths = [result_csv_path], [details_csv_path]

    if config and config.online_config.is_online:
        # Online mode: turn each path into a "..._rank{}.csv" template and
        # expand it once per configured rank.
        ranks = config.online_config.rank_list
        summary_pattern = result_csv_path.replace(".csv", "_rank{}.csv")
        detail_pattern = details_csv_path.replace(".csv", "_rank{}.csv")
        summary_paths = [summary_pattern.format(rank) for rank in ranks]
        detail_paths = [detail_pattern.format(rank) for rank in ranks]

    self.save_path_str = summary_pattern
    self.detail_save_path_str = detail_pattern
    self.save_path_list = summary_paths
    self.detail_save_path_list = detail_paths

    if not is_continue_run_ut:
        self.write_csv_title()

    self.stack_info = get_json_contents(stack_info_json_path) if stack_info_json_path else None
|
|
75
|
+
|
|
76
|
+
@staticmethod
|
|
77
|
+
def get_path_from_rank(rank, path_list, path_pattern):
    """Return the CSV path to use for ``rank``.

    If exactly one path is configured it is returned whatever the rank;
    otherwise the path is built by formatting ``rank`` into ``path_pattern``.
    """
    if len(path_list) != 1:
        return path_pattern.format(rank)
    return path_list[0]
|
|
79
|
+
|
|
80
|
+
@staticmethod
|
|
81
|
+
def print_pretest_result():
    """Log an info message saying that run_ut/multi_run_ut completed."""
    completion_message = "Successfully completed run_ut/multi_run_ut."
    logger.info(completion_message)
|
|
83
|
+
|
|
84
|
+
@staticmethod
|
|
85
|
+
def _compare_dropout(bench_output, device_output):
    """Compare dropout outputs by how many elements are zero on each side.

    Tensors with fewer than 100 elements always pass. Otherwise the result
    passes when the absolute difference in zero counts, divided by the number
    of benchmark elements, is below 0.1.

    Returns:
        ``(CompareConst.PASS, 1)`` on success, ``(CompareConst.ERROR, 0)`` otherwise.
    """
    element_count = bench_output.numel()
    if element_count < 100:
        return CompareConst.PASS, 1

    bench_zero_count = (bench_output == 0).sum()
    # The device result is moved to the CPU before counting so both counts can be subtracted.
    device_zero_count = (device_output == 0).cpu().sum()
    zero_count_gap = abs(bench_zero_count - device_zero_count) / element_count
    if zero_count_gap < 0.1:
        return CompareConst.PASS, 1
    return CompareConst.ERROR, 0
|
|
94
|
+
|
|
95
|
+
@staticmethod
|
|
96
|
+
def _compare_builtin_type(bench_output, device_output, compare_column):
    """Compare two outputs when the benchmark value is a bool, int, float or str.

    Benchmark values of any other type are reported as PASS without touching
    ``compare_column``. For the supported types, a mismatch gives ERROR and a
    match sets ``compare_column.error_rate`` to 0 and gives PASS.

    Returns:
        ``(status, compare_column, "")``.
    """
    status = CompareConst.PASS
    if isinstance(bench_output, (bool, int, float, str)):
        if bench_output != device_output:
            status = CompareConst.ERROR
        else:
            compare_column.error_rate = 0
    return status, compare_column, ""
|
|
103
|
+
|
|
104
|
+
@staticmethod
|
|
105
|
+
def _compare_bool_tensor(bench_output, device_output):
    """Compute the fraction of elements that differ between two boolean outputs.

    Returns:
        ``(error_rate, status, message)``. For an empty benchmark the rate is
        ``CompareConst.NAN`` and the status is ERROR with an explanatory
        message; otherwise the status is PASS only when no element differs.
    """
    # presumably numpy arrays: ``.size`` is read as an attribute — TODO confirm
    mismatch_count = (bench_output != device_output).sum()
    total = bench_output.size
    if total == 0:
        return CompareConst.NAN, CompareConst.ERROR, "There is not bench calculation result."

    mismatch_ratio = float(mismatch_count / total)
    if mismatch_ratio == 0:
        return mismatch_ratio, CompareConst.PASS, ""
    return mismatch_ratio, CompareConst.ERROR, ""
|
|
112
|
+
|
|
113
|
+
@staticmethod
|
|
114
|
+
def _get_absolute_threshold_attribute(api_name, dtype):
    """Look up the absolute-threshold settings for ``api_name`` and ``dtype``.

    Returns:
        ``(small_value, small_value_atol, rtol)`` read from ``apis_threshold``.
        A key missing at the innermost level yields ``None`` for that entry.
    """
    # NOTE(review): an unknown api_name or dtype makes .get() return None, so the
    # chained access raises AttributeError — callers presumably pre-filter; confirm.
    dtype_thresholds = apis_threshold.get(api_name).get(dtype)
    return (
        dtype_thresholds.get('small_value'),
        dtype_thresholds.get('small_value_atol'),
        dtype_thresholds.get('rtol'),
    )
|
|
119
|
+
|
|
120
|
+
@staticmethod
|
|
121
|
+
def _get_run_ut_detail(test_result):
    """Build the detail-CSV rows for one API test result.

    ``test_result[0]`` is the row-name prefix, ``test_result[3]`` the forward
    results and ``test_result[4]`` the backward results. Each entry of a
    list-typed result becomes one row named
    ``<prefix>.forward.output.<i>`` or ``<prefix>.backward.output.<i>``.
    Float values are rendered as fixed-point strings with
    ``msCheckerConfig.precision`` decimals.

    Raises:
        CompareException: If ``test_result`` is too short to index.
    """
    try:
        subject_prefix, fwd_result, bwd_result = test_result[0], test_result[3], test_result[4]
    except IndexError as err:
        logger.error("List index out of bounds when writing detail CSV.")
        raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR, "list index out of bounds") from err

    def _rows_for(direction_tag, results):
        # Only list results are expanded; any other value contributes no rows.
        if not isinstance(results, list):
            return []
        rows = []
        for idx, columns in enumerate(results):
            subject = subject_prefix + direction_tag + str(idx)
            rendered = [
                "{:.{}f}".format(value, msCheckerConfig.precision) if isinstance(value, float) else value
                for value in columns
            ]
            rows.append([subject] + rendered)
        return rows

    return _rows_for(".forward.output.", fwd_result) + _rows_for(".backward.output.", bwd_result)
|
|
145
|
+
|
|
146
|
+
def write_csv_title(self):
    """Write header rows to every summary and detail CSV that does not exist yet.

    Files already on disk are left untouched.
    """
    summary_header_rows = [[
        self.COLUMN_API_NAME,
        self.COLUMN_FORWARD_SUCCESS,
        self.COLUMN_BACKWARD_SUCCESS,
        "Message",
    ]]
    for summary_path, detail_path in zip(self.save_path_list, self.detail_save_path_list):
        # Same rule for both files: write the header only if the file is missing.
        for header_rows, target in ((summary_header_rows, summary_path), (DETAIL_TEST_ROWS, detail_path)):
            if not os.path.exists(target):
                write_csv(header_rows, target)
|
|
158
|
+
|
|
159
|
+
def write_summary_csv(self, test_result):
    """Write one summary row for ``test_result`` to the matching summary CSV.

    The row starts with the first three fields of ``test_result``. If the
    forward status is ``CompareConst.SKIP``, the message of the first forward
    result entry is appended. If stack information was loaded, the call stack
    for this API is appended as a newline-joined string. The last element of
    ``test_result`` is the rank used to pick the output file.

    Raises:
        CompareException: If ``test_result`` is too short to index.
    """
    try:
        api_name = test_result[0]
        summary_row = list(test_result[:INDEX_TEST_RESULT_GROUP])
        if test_result[1] == CompareConst.SKIP:
            first_forward_entry = test_result[INDEX_TEST_RESULT_GROUP][INDEX_FIRST_GROUP]
            summary_row.append(first_forward_entry[INDEX_MESSAGE])
        if self.stack_info:
            # NOTE(review): only IndexError is handled below; if stack_info is a
            # dict lacking this API name, the lookup raises KeyError — confirm
            # callers guarantee the key exists.
            summary_row.append("\n".join(self.stack_info[api_name]))
        target_path = self.get_path_from_rank(test_result[-1], self.save_path_list, self.save_path_str)
    except IndexError as err:
        logger.error("List index out of bounds when writing summary CSV.")
        raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR, "list index out of bounds") from err
    write_csv([summary_row], target_path)
|
|
175
|
+
|
|
176
|
+
def write_detail_csv(self, test_result):
    """Write the detail rows for ``test_result`` to the matching detail CSV.

    Rows come from ``_get_run_ut_detail``. The last element of ``test_result``
    is the rank used to pick the output file.
    """
    detail_rows = self._get_run_ut_detail(test_result)
    rank = test_result[-1]
    target_path = self.get_path_from_rank(rank, self.detail_save_path_list, self.detail_save_path_str)
    write_csv(detail_rows, target_path)
|
|
182
|
+
|
|
183
|
+
def record_results(self, args):
    """Write ``args`` (one test result) to the summary CSV, then to the detail CSV."""
    for writer in (self.write_summary_csv, self.write_detail_csv):
        writer(args)
|
|
186
|
+
|
|
187
|
+
|
|
188
|
+
def compare_output(self, full_api_name, data_info, is_online=False):
    """Compare bench and device results of one API and record the outcome.

    Args:
        full_api_name: full API name; the basic API name is extracted from
            it with ``extract_basic_api_segments``.
        data_info: object providing ``bench_output``, ``device_output``,
            ``bench_grad``, ``device_grad``, ``backward_message`` and
            ``rank``.
        is_online: bool, default False. True: called by online api
            precision compare, only compare without writing to csv.

    Returns:
        When ``is_online`` is true, the value of ``_get_run_ut_detail`` for
        the result. Otherwise a tuple ``(forward_passed, backward_passed)``;
        the backward flag is true for both the PASS and the SPACE status.

    Raises:
        ValueError: when no API name can be extracted from ``full_api_name``.
    """
    _, api_name = extract_basic_api_segments(full_api_name)
    if not api_name:
        raise ValueError(f"API name {full_api_name} has not been adapted.")

    bench_output = data_info.bench_output
    device_output = data_info.device_output
    bench_grad = data_info.bench_grad
    device_grad = data_info.device_grad
    backward_message = data_info.backward_message

    # Forward comparison: dropout APIs use their dedicated comparison.
    if "dropout" in full_api_name:
        fwd_success_status, fwd_compare_alg_results = self._compare_dropout(bench_output, device_output)
    else:
        fwd_success_status, fwd_compare_alg_results = self._compare_core_wrapper(
            api_name, bench_output, device_output)

    # Backward comparison: only performed when both gradients are truthy.
    if not bench_grad or not device_grad:
        bwd_success_status, bwd_compare_alg_results = CompareConst.SPACE, []
    elif "dropout" in full_api_name:
        bwd_success_status, bwd_compare_alg_results = self._compare_dropout(bench_grad[0], device_grad[0])
    else:
        bwd_success_status, bwd_compare_alg_results = self._compare_core_wrapper(
            api_name, bench_grad, device_grad)

    if backward_message:
        # A backward message replaces the backward detail with one SKIP entry.
        skip_column = CompareColumn()
        bwd_compare_alg_results = [skip_column.to_column_value(CompareConst.SKIP, backward_message)]
    elif bwd_compare_alg_results is None:
        bwd_success_status = CompareConst.SPACE

    result_info = ResultInfo(
        full_api_name,
        fwd_success_status,
        bwd_success_status,
        fwd_compare_alg_results,
        bwd_compare_alg_results,
        data_info.rank,
    )
    if is_online:
        # get run_ut compare detail
        return self._get_run_ut_detail(result_info)

    self.record_results(result_info)
    forward_passed = fwd_success_status == CompareConst.PASS
    backward_passed = bwd_success_status in (CompareConst.PASS, CompareConst.SPACE)
    return forward_passed, backward_passed
|
|
228
|
+
|
|
229
|
+
def _compare_core_wrapper(self, api_name, bench_output, device_output):
    """Compare bench and device outputs and aggregate the per-output results.

    A list/tuple ``bench_output`` is compared element by element against
    the leading elements of ``device_output``; any other value is compared
    as a single output through ``_compare_core``.

    Args:
        api_name: API name forwarded to ``_compare_core``.
        bench_output: benchmark output, or a list/tuple of outputs.
        device_output: device output with the matching structure.

    Returns:
        A tuple ``(final_status, detail_rows)``. ``detail_rows`` holds one
        ``to_column_value`` result per compared output. ``final_status`` is
        ``CompareConst.ERROR`` if any output is an error, otherwise
        ``CompareConst.WARNING`` if any output is a warning, otherwise
        ``CompareConst.PASS``.
    """
    if isinstance(bench_output, (list, tuple)):
        if len(bench_output) > len(device_output):
            # Fix: the three lists must stay the same length. Previously
            # compare_result was left empty here, so the aggregation below
            # raised IndexError instead of reporting the structure error.
            status = [CompareConst.ERROR]
            compare_result = [CompareColumn()]
            message = ["bench and npu output structure is different."]
        else:
            status, compare_result, message = [], [], []
            # Extra trailing device outputs are ignored.
            device_output = device_output[:len(bench_output)]
            for b_out_i, n_out_i in zip(bench_output, device_output):
                status_i, compare_result_i, message_i = self._compare_core(api_name, b_out_i, n_out_i)
                status.append(status_i)
                compare_result.append(compare_result_i)
                message.append(message_i)
    else:
        status, compare_result, message = self._compare_core(api_name, bench_output, device_output)

    if not isinstance(status, list):
        # Single output: normalise to one-element lists so both shapes
        # share the aggregation loop.
        status, compare_result, message = [status], [compare_result], [message]

    detailed_result_total = []
    test_final_success = CompareConst.PASS
    for item_status, item_column, item_message in zip(status, compare_result, message):
        detailed_result_total.append(item_column.to_column_value(item_status, item_message))
        if item_status == CompareConst.ERROR:
            test_final_success = CompareConst.ERROR
        elif item_status == CompareConst.WARNING and test_final_success != CompareConst.ERROR:
            # Fix: a later WARNING must not downgrade an earlier ERROR.
            test_final_success = CompareConst.WARNING
    return test_final_success, detailed_result_total
|
|
260
|
+
|
|
261
|
+
def _compare_core(self, api_name, bench_output, device_output):
    """Compare one bench output with one device output, dispatching on type.

    Args:
        api_name: API name forwarded to the tensor comparison.
        bench_output: benchmark value (dict, ``torch.Tensor``, bool, int,
            float, str or None are handled explicitly).
        device_output: device value to compare against.

    Returns:
        A tuple ``(status, compare_column, message)``.
    """
    compare_column = CompareColumn()

    if not isinstance(bench_output, type(device_output)):
        return CompareConst.ERROR, compare_column, "bench and npu output type is different."

    if isinstance(bench_output, dict):
        b_keys, n_keys = set(bench_output.keys()), set(device_output.keys())
        if b_keys != n_keys:
            return CompareConst.ERROR, compare_column, "bench and npu output dict keys are different."
        # NOTE(review): the values are passed on as plain lists, and no
        # branch of this method handles a list, so this recursion ends in
        # the "Unexpected output type" result below - confirm intent.
        return self._compare_core(api_name, list(bench_output.values()), list(device_output.values()))

    if isinstance(bench_output, torch.Tensor):
        # Work on detached clones of both tensors.
        bench_copy = bench_output.detach().clone()
        device_copy = device_output.detach().clone()
        compare_column.bench_type = str(bench_copy.dtype)
        compare_column.npu_type = str(device_copy.dtype)
        compare_column.shape = tuple(device_output.shape)
        return self._compare_torch_tensor(api_name, bench_copy, device_copy, compare_column)

    if isinstance(bench_output, (bool, int, float, str)):
        compare_column.bench_type = str(type(bench_output))
        compare_column.npu_type = str(type(device_output))
        status, compare_column, message = self._compare_builtin_type(bench_output, device_output, compare_column)
        return status, compare_column, message

    if bench_output is None:
        return CompareConst.SKIP, compare_column, "Bench output is None, skip this test."

    unexpected_message = "Unexpected output type in compare_core: {}".format(type(bench_output))
    return CompareConst.ERROR, compare_column, unexpected_message
|
|
294
|
+
|
|
295
|
+
def _compare_torch_tensor(self, api_name, bench_output, device_output, compare_column):
    """Compare two tensors after converting them to numpy arrays.

    Args:
        api_name: API name forwarded to the float comparison.
        bench_output: benchmark tensor.
        device_output: device tensor.
        compare_column: column object that receives the computed metrics.

    Returns:
        A tuple ``(status, compare_column, message)``. Shape mismatches and
        non-comparable dtypes yield ``CompareConst.ERROR``.
    """
    bench_shape, device_shape = bench_output.shape, device_output.shape
    device_dtype = device_output.dtype

    # When the device tensor is bfloat16, both tensors are widened to
    # float32 before the numpy conversion.
    if device_dtype == torch.bfloat16:
        bench_output = bench_output.to(torch.float32)
        device_output = device_output.to(torch.float32)
    bench_array = bench_output.cpu().numpy()
    device_array = device_output.cpu().numpy()

    if bench_shape != device_shape:
        shape_message = f"The shape of bench{str(bench_shape)} and npu{str(device_shape)} not equal."
        return CompareConst.ERROR, compare_column, shape_message

    if not check_dtype_comparable(bench_array, device_array):
        dtype_message = (f"Bench out dtype is {bench_array.dtype} but "
                         f"npu output dtype is {device_array.dtype}, cannot compare.")
        return CompareConst.ERROR, compare_column, dtype_message

    error_rate_only_dtypes = [bool, np.uint8, np.int8, np.int16, np.uint16, np.uint32, np.int32,
                              np.int64, np.uint64]
    if bench_array.dtype not in error_rate_only_dtypes:
        # The original device dtype (not the numpy dtype) is forwarded.
        return self._compare_float_tensor(api_name, bench_array, device_array, compare_column, device_dtype)

    message = f"Compare algorithm is not supported for {bench_array.dtype} data. Only judged by Error Rate."
    err_rate, status, msg = self._compare_bool_tensor(bench_array, device_array)
    message = message + msg + "\n"
    compare_column.error_rate = err_rate
    return status, compare_column, message
|
|
323
|
+
|
|
324
|
+
def _compare_float_tensor(self, api_name, bench_output, device_output, compare_column, dtype):
    """Compute error metrics for non-integer data and derive a status.

    Args:
        api_name: API name; selects which metric family is computed.
        bench_output: benchmark data (used with numpy functions and ``.size``).
        device_output: device data in the same form.
        compare_column: column object whose metric attributes are filled in.
        dtype: dtype of the device tensor; compared against torch dtypes and
            used (as ``str(dtype)``) to look up supported benchmark dtypes.

    Returns:
        A tuple ``(status, compare_column, message)`` where ``status`` is one
        of ``CompareConst.ERROR``, ``CompareConst.WARNING`` or
        ``CompareConst.PASS``.
    """
    message = ""
    abs_bench, abs_bench_with_eps = get_abs_bench_with_eps(bench_output, dtype)
    abs_err = get_abs_err(bench_output, device_output)
    rel_err_orign = get_rel_err_origin(abs_err, abs_bench_with_eps)
    if api_name in thousandth_standard_api:
        thousand_res, thousand_status = get_rel_err_ratio(rel_err_orign, CompareConst.THOUSAND_RATIO_THRESHOLD)
        compare_column.rel_err_thousandth = thousand_res
    # Extra metrics for dtypes in the benchmark support list; the API name
    # selects exactly one metric family.
    if str(dtype) in BENCHMARK_COMPARE_SUPPORT_LIST:
        both_finite_mask, inf_nan_mask = get_finite_and_infinite_mask(bench_output, device_output)
        if api_name in binary_standard_api:
            # Only the error rate of the helper's result is kept.
            err_rate, _, _ = self._compare_bool_tensor(bench_output, device_output)
            compare_column.error_rate = err_rate
        elif api_name in absolute_standard_api:
            small_value_threshold, small_value_atol, rtol = self._get_absolute_threshold_attribute(
                api_name, str(dtype))
            rel_err = abs_err / abs_bench_with_eps
            small_value_mask = get_small_value_mask(abs_bench, both_finite_mask, small_value_threshold)
            # "Normal" values are the finite ones not flagged as small.
            normal_value_mask = np.logical_and(both_finite_mask, np.logical_not(small_value_mask))
            compare_column.inf_nan_error_ratio = check_inf_nan_value(inf_nan_mask, bench_output, device_output,
                                                                     dtype, rtol)
            compare_column.rel_err_ratio = check_norm_value(normal_value_mask, rel_err, rtol)
            compare_column.abs_err_ratio = check_small_value(abs_err, small_value_mask, small_value_atol)
        elif api_name in ulp_standard_api:
            if bench_output.size == 0:
                # Empty data: report zero ULP errors without calling get_ulp_err.
                compare_column.max_ulp_error = 0
                compare_column.mean_ulp_error = 0
                compare_column.ulp_error_proportion = 0
            else:
                ulp_err = get_ulp_err(bench_output, device_output, dtype)
                compare_column.max_ulp_error = np.max(ulp_err)
                compare_column.mean_ulp_error = np.mean(ulp_err)
                # Share of elements above the ULP threshold; float32 has its
                # own threshold, every other dtype uses the float16 one.
                if dtype == torch.float32:
                    compare_column.ulp_error_proportion = \
                        np.sum(ulp_err > CompareConst.ULP_FLOAT32_THRESHOLD) / bench_output.size
                else:
                    compare_column.ulp_error_proportion = \
                        np.sum(ulp_err > CompareConst.ULP_FLOAT16_THRESHOLD) / bench_output.size
        else:
            # NOTE(review): dtype_config is subscripted without a None check;
            # presumably every supported dtype has an entry - confirm.
            dtype_config = precision_configs.get(dtype)
            small_value_mask = get_small_value_mask(abs_bench, both_finite_mask, dtype_config['small_value'][0])
            abs_err_greater_mask = np.greater(abs_err, dtype_config['small_value_atol'][0])
            compare_column.small_value_err_ratio = get_small_value_err_ratio(small_value_mask, abs_err_greater_mask)
            rel_err = get_rel_err(abs_err, abs_bench_with_eps, small_value_mask, inf_nan_mask)
            compare_column.rmse = get_rmse(abs_err, np.logical_or(inf_nan_mask, small_value_mask))
            compare_column.eb = get_error_balance(bench_output, device_output)
            if rel_err.size == 0:
                return CompareConst.ERROR, compare_column, "Relative error result list is empty."
            compare_column.max_rel_error = get_max_rel_err(rel_err)
            compare_column.mean_rel_error = get_mean_rel_err(rel_err)

    # Status decision: a chain of checks where the first decisive one returns.
    cos_res, cos_status, msg = cosine_sim(bench_output, device_output)
    compare_column.cosine_sim = cos_res
    message += msg + "\n"
    if not cos_status:
        message += "Cosine similarity is less than 0.99, consider as error, skip other check and set to SPACE.\n"
        return CompareConst.ERROR, compare_column, message

    max_abs_res, max_abs_status = get_max_abs_err(abs_err)
    compare_column.max_abs_err = max_abs_res
    if max_abs_status:
        message += "Max abs error is less than 0.001, consider as pass, skip other check and set to SPACE.\n"
        return CompareConst.PASS, compare_column, message

    # Half-precision dtypes get an additional hundredth-ratio check first.
    if dtype in [torch.float16, torch.bfloat16]:
        hundred_res, hundred_status = get_rel_err_ratio(rel_err_orign, CompareConst.HUNDRED_RATIO_THRESHOLD)
        compare_column.rel_err_hundredth = hundred_res
        if not hundred_status:
            message += "Relative error is greater than 0.01, consider as error, " \
                       "skip other check and set to SPACE.\n"
            return CompareConst.ERROR, compare_column, message
    thousand_res, thousand_status = get_rel_err_ratio(rel_err_orign, CompareConst.THOUSAND_RATIO_THRESHOLD)
    compare_column.rel_err_thousandth = thousand_res
    # For half-precision dtypes the thousandth check is final: PASS or WARNING.
    if dtype in [torch.float16, torch.bfloat16]:
        if thousand_status:
            message += "Relative error is less than 0.001, consider as pass, skip other check and set to SPACE.\n"
            return CompareConst.PASS, compare_column, message
        message += "Relative error is greater than 0.001, consider as warning, skip other check and set to SPACE.\n"
        return CompareConst.WARNING, compare_column, message
    ten_thousand_res, ten_thousand_status = get_rel_err_ratio(
        rel_err_orign, CompareConst.TEN_THOUSAND_RATIO_THRESHOLD)
    compare_column.rel_err_ten_thousandth = ten_thousand_res
    if dtype in [torch.float32, torch.float64]:
        if not thousand_status:
            message += "Relative error is greater than 0.001, consider as error, " \
                       "skip other check and set to SPACE.\n"
            return CompareConst.ERROR, compare_column, message
        if not ten_thousand_status:
            message += "Relative error is greater than 0.0001, consider as warning, " \
                       "skip other check and set to SPACE.\n"
            return CompareConst.WARNING, compare_column, message
    # NOTE(review): a dtype outside both lists above also ends up here and is
    # reported as PASS without the ratio statuses being consulted - confirm.
    message += "Relative error is less than 0.0001, consider as pass.\n"
    return CompareConst.PASS, compare_column, message
|