PyPI - mindstudio-probe - Versions diffs - 1.0.1__py3-none-any.whl → 1.0.4__py3-none-any.whl - Mend

mindstudio-probe: mindstudio_probe-1.0.1-py3-none-any.whl → mindstudio_probe-1.0.4-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (323) hide show

{mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/LICENSE +201 -201
{mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/METADATA +36 -30
mindstudio_probe-1.0.4.dist-info/RECORD +276 -0
{mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/entry_points.txt +1 -0
msprobe/README.md +101 -182
msprobe/__init__.py +1 -0
msprobe/{config/config.json → config.json} +49 -27
msprobe/core/__init__.py +0 -0
msprobe/{pytorch → core}/advisor/advisor.py +124 -124
msprobe/{pytorch → core}/advisor/advisor_const.py +59 -59
msprobe/{pytorch → core}/advisor/advisor_result.py +58 -58
msprobe/core/common/const.py +341 -241
msprobe/core/common/exceptions.py +100 -88
msprobe/core/common/{file_check.py → file_utils.py} +478 -265
msprobe/core/common/log.py +76 -55
msprobe/core/common/utils.py +385 -516
msprobe/core/common_config.py +85 -58
msprobe/core/compare/acc_compare.py +300 -0
msprobe/core/compare/check.py +95 -0
msprobe/core/compare/compare_cli.py +49 -0
msprobe/core/compare/highlight.py +223 -0
msprobe/core/compare/multiprocessing_compute.py +149 -0
msprobe/{pytorch → core}/compare/npy_compare.py +295 -244
msprobe/core/compare/utils.py +430 -0
msprobe/core/data_dump/data_collector.py +154 -140
msprobe/core/data_dump/data_processor/base.py +314 -245
msprobe/core/data_dump/data_processor/factory.py +59 -61
msprobe/core/data_dump/data_processor/mindspore_processor.py +186 -0
msprobe/core/data_dump/data_processor/pytorch_processor.py +366 -346
msprobe/core/data_dump/json_writer.py +96 -116
msprobe/core/data_dump/scope.py +178 -178
msprobe/core/grad_probe/__init__.py +0 -0
msprobe/core/grad_probe/constant.py +71 -0
msprobe/core/grad_probe/grad_compare.py +171 -0
msprobe/core/grad_probe/utils.py +64 -0
msprobe/docs/01.installation.md +89 -0
msprobe/docs/02.config_introduction.md +165 -0
msprobe/docs/03.config_examples.md +247 -0
msprobe/docs/04.acl_config_examples.md +76 -0
msprobe/docs/05.data_dump_PyTorch.md +198 -0
msprobe/docs/06.data_dump_MindSpore.md +243 -0
msprobe/docs/07.accuracy_checker_PyTorch.md +274 -0
msprobe/docs/08.accuracy_checker_online_PyTorch.md +198 -0
msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
msprobe/docs/10.accuracy_compare_PyTorch.md +245 -0
msprobe/docs/11.accuracy_compare_MindSpore.md +202 -0
msprobe/docs/12.overflow_check_PyTorch.md +79 -0
msprobe/docs/13.overflow_check_MindSpore.md +31 -0
msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
msprobe/docs/15.free_benchmarking_PyTorch.md +164 -0
msprobe/docs/17.grad_probe.md +207 -0
msprobe/docs/FAQ_PyTorch.md +177 -0
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/grad_probe_image-1.png +0 -0
msprobe/docs/img/grad_probe_image-2.png +0 -0
msprobe/docs/img/grad_probe_image-3.png +0 -0
msprobe/docs/img/grad_probe_image-4.png +0 -0
msprobe/docs/img/grad_probe_image.png +0 -0
msprobe/mindspore/__init__.py +1 -1
msprobe/mindspore/api_accuracy_checker/__init__.py +0 -0
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +255 -0
msprobe/mindspore/api_accuracy_checker/api_info.py +69 -0
msprobe/mindspore/api_accuracy_checker/api_runner.py +156 -0
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +197 -0
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
msprobe/mindspore/api_accuracy_checker/compute_element.py +239 -0
msprobe/mindspore/api_accuracy_checker/main.py +9 -0
msprobe/mindspore/api_accuracy_checker/type_mapping.py +114 -0
msprobe/mindspore/api_accuracy_checker/utils.py +80 -0
msprobe/mindspore/cell_processor.py +34 -0
msprobe/mindspore/common/const.py +106 -0
msprobe/mindspore/common/log.py +38 -0
msprobe/mindspore/common/utils.py +81 -0
msprobe/mindspore/compare/distributed_compare.py +75 -0
msprobe/mindspore/compare/ms_compare.py +219 -0
msprobe/mindspore/compare/ms_graph_compare.py +348 -0
msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -0
msprobe/mindspore/debugger/debugger_config.py +66 -51
msprobe/mindspore/debugger/precision_debugger.py +126 -32
msprobe/mindspore/dump/dump_tool_factory.py +35 -38
msprobe/mindspore/dump/hook_cell/api_registry.py +118 -0
msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -0
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +922 -0
msprobe/mindspore/dump/hook_cell/wrap_api.py +113 -0
msprobe/mindspore/dump/jit_dump.py +72 -0
msprobe/mindspore/dump/kernel_graph_dump.py +59 -60
msprobe/mindspore/dump/kernel_kbyk_dump.py +64 -0
msprobe/mindspore/free_benchmark/__init__.py +0 -0
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +116 -0
msprobe/mindspore/free_benchmark/common/__init__.py +0 -0
msprobe/mindspore/free_benchmark/common/config.py +12 -0
msprobe/mindspore/free_benchmark/common/handler_params.py +17 -0
msprobe/mindspore/free_benchmark/common/utils.py +71 -0
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -0
msprobe/mindspore/free_benchmark/decorator/__init__.py +0 -0
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +43 -0
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +107 -0
msprobe/mindspore/free_benchmark/handler/__init__.py +0 -0
msprobe/mindspore/free_benchmark/handler/base_handler.py +90 -0
msprobe/mindspore/free_benchmark/handler/check_handler.py +41 -0
msprobe/mindspore/free_benchmark/handler/fix_handler.py +36 -0
msprobe/mindspore/free_benchmark/handler/handler_factory.py +21 -0
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +67 -0
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +21 -0
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +63 -0
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +51 -0
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +35 -0
msprobe/mindspore/free_benchmark/perturbation/no_change.py +12 -0
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +29 -0
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +33 -0
msprobe/mindspore/grad_probe/__init__.py +0 -0
msprobe/mindspore/grad_probe/global_context.py +90 -0
msprobe/mindspore/grad_probe/grad_analyzer.py +231 -0
msprobe/mindspore/grad_probe/grad_monitor.py +27 -0
msprobe/mindspore/grad_probe/grad_stat_csv.py +132 -0
msprobe/mindspore/grad_probe/hook.py +94 -0
msprobe/mindspore/grad_probe/utils.py +30 -0
msprobe/mindspore/ms_config.py +128 -78
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +44 -45
msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +34 -32
msprobe/mindspore/runtime.py +4 -0
msprobe/mindspore/service.py +378 -0
msprobe/mindspore/task_handler_factory.py +24 -21
msprobe/msprobe.py +105 -67
msprobe/pytorch/__init__.py +4 -4
msprobe/pytorch/api_accuracy_checker/common/config.py +53 -50
msprobe/pytorch/api_accuracy_checker/common/utils.py +214 -224
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +213 -216
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +606 -545
msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
msprobe/pytorch/api_accuracy_checker/compare/compare.py +386 -345
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +73 -73
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +245 -248
msprobe/pytorch/api_accuracy_checker/config.yaml +10 -4
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +335 -328
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +200 -203
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +133 -127
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +592 -493
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +70 -7
msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/__init__.py +0 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +197 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +325 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +204 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +219 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +10 -0
msprobe/pytorch/bench_functions/__init__.py +15 -0
msprobe/pytorch/bench_functions/apply_adam_w.py +28 -0
msprobe/pytorch/bench_functions/confusion_transpose.py +19 -0
msprobe/pytorch/bench_functions/fast_gelu.py +55 -0
msprobe/pytorch/bench_functions/layer_norm_eval.py +6 -0
msprobe/pytorch/bench_functions/linear.py +12 -0
msprobe/pytorch/bench_functions/matmul_backward.py +48 -0
msprobe/pytorch/bench_functions/npu_fusion_attention.py +509 -0
msprobe/pytorch/bench_functions/rms_norm.py +15 -0
msprobe/pytorch/bench_functions/rotary_mul.py +52 -0
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +26 -0
msprobe/pytorch/bench_functions/swiglu.py +55 -0
msprobe/pytorch/common/__init__.py +2 -2
msprobe/pytorch/common/compare_script.template +14 -14
msprobe/pytorch/common/log.py +20 -31
msprobe/pytorch/common/parse_json.py +39 -37
msprobe/pytorch/common/utils.py +305 -224
msprobe/pytorch/compare/distributed_compare.py +66 -111
msprobe/pytorch/compare/mapping.yaml +607 -607
msprobe/pytorch/compare/match.py +34 -36
msprobe/pytorch/compare/pt_compare.py +50 -0
msprobe/pytorch/debugger/debugger_config.py +95 -86
msprobe/pytorch/debugger/precision_debugger.py +125 -95
msprobe/pytorch/free_benchmark/__init__.py +8 -8
msprobe/pytorch/free_benchmark/common/constant.py +70 -67
msprobe/pytorch/free_benchmark/common/counter.py +71 -71
msprobe/pytorch/free_benchmark/common/enums.py +37 -37
msprobe/pytorch/free_benchmark/common/params.py +129 -129
msprobe/pytorch/free_benchmark/common/utils.py +102 -98
msprobe/pytorch/free_benchmark/compare/grad_saver.py +179 -183
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +104 -104
msprobe/pytorch/free_benchmark/main.py +105 -102
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +13 -13
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +41 -41
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +90 -90
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +104 -104
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +63 -63
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +68 -68
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +28 -28
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +45 -45
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +19 -19
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +217 -203
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +39 -39
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +23 -23
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +30 -31
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +170 -170
msprobe/pytorch/function_factory.py +76 -0
msprobe/pytorch/functional/dump_module.py +39 -39
msprobe/pytorch/grad_probe/__init__.py +0 -0
msprobe/pytorch/grad_probe/grad_monitor.py +91 -0
msprobe/pytorch/grad_probe/grad_stat_csv.py +129 -0
msprobe/pytorch/hook_module/api_registry.py +161 -161
msprobe/pytorch/hook_module/hook_module.py +120 -109
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1876
msprobe/pytorch/hook_module/utils.py +30 -29
msprobe/pytorch/hook_module/wrap_aten.py +110 -100
msprobe/pytorch/hook_module/wrap_distributed.py +78 -75
msprobe/pytorch/hook_module/wrap_functional.py +105 -108
msprobe/pytorch/hook_module/wrap_npu_custom.py +93 -73
msprobe/pytorch/hook_module/wrap_tensor.py +71 -72
msprobe/pytorch/hook_module/wrap_torch.py +86 -88
msprobe/pytorch/hook_module/wrap_vf.py +62 -64
msprobe/pytorch/module_processer.py +138 -98
msprobe/pytorch/online_dispatch/__init__.py +20 -20
msprobe/pytorch/online_dispatch/compare.py +236 -236
msprobe/pytorch/online_dispatch/dispatch.py +271 -273
msprobe/pytorch/online_dispatch/dump_compare.py +155 -186
msprobe/pytorch/online_dispatch/single_compare.py +391 -391
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +49 -49
msprobe/pytorch/online_dispatch/utils.py +130 -187
msprobe/pytorch/parse.py +4 -4
msprobe/pytorch/parse_tool/cli.py +32 -32
msprobe/pytorch/parse_tool/lib/compare.py +260 -259
msprobe/pytorch/parse_tool/lib/config.py +52 -51
msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +158 -158
msprobe/pytorch/parse_tool/lib/utils.py +316 -367
msprobe/pytorch/parse_tool/lib/visualization.py +85 -90
msprobe/pytorch/pt_config.py +188 -93
msprobe/pytorch/service.py +246 -167
mindstudio_probe-1.0.1.dist-info/RECORD +0 -228
msprobe/config/README.md +0 -397
msprobe/mindspore/doc/dump.md +0 -65
msprobe/mindspore/dump/api_kbk_dump.py +0 -55
msprobe/pytorch/compare/acc_compare.py +0 -1024
msprobe/pytorch/compare/highlight.py +0 -100
msprobe/pytorch/doc/FAQ.md +0 -193
msprobe/pytorch/doc/api_accuracy_checker.md +0 -269
msprobe/pytorch/doc/atat精度工具数据dump标准性能基线报告.md +0 -182
msprobe/pytorch/doc/dump.md +0 -207
msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -176
msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
msprobe/pytorch/doc/run_overflow_check.md +0 -25
msprobe/pytorch/doc/在线精度比对.md +0 -90
msprobe/test/core_ut/common/test_utils.py +0 -345
msprobe/test/core_ut/data_dump/test_data_collector.py +0 -47
msprobe/test/core_ut/data_dump/test_json_writer.py +0 -183
msprobe/test/core_ut/data_dump/test_scope.py +0 -151
msprobe/test/core_ut/test_common_config.py +0 -152
msprobe/test/core_ut/test_file_check.py +0 -218
msprobe/test/core_ut/test_log.py +0 -109
msprobe/test/mindspore_ut/test_api_kbk_dump.py +0 -51
msprobe/test/mindspore_ut/test_debugger_config.py +0 -42
msprobe/test/mindspore_ut/test_dump_tool_factory.py +0 -51
msprobe/test/mindspore_ut/test_kernel_graph_dump.py +0 -66
msprobe/test/mindspore_ut/test_kernel_graph_overflow_check.py +0 -63
msprobe/test/mindspore_ut/test_ms_config.py +0 -69
msprobe/test/mindspore_ut/test_overflow_check_tool_factory.py +0 -51
msprobe/test/mindspore_ut/test_precision_debugger.py +0 -56
msprobe/test/mindspore_ut/test_task_handler_factory.py +0 -58
msprobe/test/pytorch_ut/advisor/test_advisor.py +0 -83
msprobe/test/pytorch_ut/api_accuracy_checker/common/test_common_utils.py +0 -108
msprobe/test/pytorch_ut/api_accuracy_checker/common/test_config.py +0 -39
msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_algorithm.py +0 -112
msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_api_precision_compare.py +0 -77
msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare.py +0 -125
msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_column.py +0 -10
msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_utils.py +0 -43
msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/dump.json +0 -179
msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/forward.json +0 -63
msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_data_generate.py +0 -99
msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_multi_run_ut.py +0 -115
msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_run_ut.py +0 -72
msprobe/test/pytorch_ut/compare/test_acc_compare.py +0 -17
msprobe/test/pytorch_ut/free_benchmark/perturbed_layers/test_perturbed_layser.py +0 -105
msprobe/test/pytorch_ut/free_benchmark/result_handlers/test_result_handler.py +0 -121
msprobe/test/pytorch_ut/free_benchmark/test_main.py +0 -101
msprobe/test/pytorch_ut/functional/test_dump_module.py +0 -15
msprobe/test/pytorch_ut/hook_module/test_api_registry.py +0 -130
msprobe/test/pytorch_ut/hook_module/test_hook_module.py +0 -42
msprobe/test/pytorch_ut/hook_module/test_wrap_aten.py +0 -65
msprobe/test/pytorch_ut/hook_module/test_wrap_distributed.py +0 -35
msprobe/test/pytorch_ut/hook_module/test_wrap_functional.py +0 -20
msprobe/test/pytorch_ut/hook_module/test_wrap_tensor.py +0 -35
msprobe/test/pytorch_ut/hook_module/test_wrap_torch.py +0 -43
msprobe/test/pytorch_ut/hook_module/test_wrap_vf.py +0 -11
msprobe/test/pytorch_ut/test_pt_config.py +0 -69
msprobe/test/pytorch_ut/test_service.py +0 -59
msprobe/test/resources/advisor.txt +0 -3
msprobe/test/resources/compare_result_20230703104808.csv +0 -9
msprobe/test/resources/compare_result_without_accuracy.csv +0 -9
msprobe/test/resources/config.yaml +0 -3
msprobe/test/resources/npu_test.pkl +0 -8
msprobe/test/run_test.sh +0 -30
msprobe/test/run_ut.py +0 -58
msprobe/test/test_module_processer.py +0 -64
{mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.4.dist-info}/top_level.txt +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
/msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
/msprobe/{config → docs}/img/free_benchmark.png +0 -0
/msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0

msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py CHANGED Viewed

@@ -1,545 +1,606 @@
-import argparse
-import math
-import os
-import sys
-from collections import namedtuple
-import torch
-import pandas as pd
-from msprobe.pytorch.api_accuracy_checker.common.utils import write_csv
-from msprobe.pytorch.api_accuracy_checker.common.config import msCheckerConfig
-from msprobe.pytorch.api_accuracy_checker.compare.compare_utils import API_PRECISION_COMPARE_RESULT_FILE_NAME, \
-    API_PRECISION_COMPARE_DETAILS_FILE_NAME, BENCHMARK_COMPARE_SUPPORT_LIST, API_PRECISION_COMPARE_UNSUPPORT_LIST, \
-    ApiPrecisionCompareColumn, AbsoluteStandardApi, BinaryStandardApi, ULPStandardApi, ThousandthStandardApi, \
-    BINARY_COMPARE_UNSUPPORT_LIST, ULP_COMPARE_SUPPORT_LIST, convert_str_to_float, CompareMessage, is_inf_or_nan, \
-    check_inf_or_nan
-from msprobe.pytorch.api_accuracy_checker.compare.compare_column import ApiPrecisionOutputColumn
-from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut import get_validated_result_csv_path
-from msprobe.core.common.file_check import FileChecker, change_mode, check_path_before_create, create_directory
-from msprobe.pytorch.common.log import logger
-from msprobe.core.common.utils import CompareException
-from msprobe.core.common.const import CompareConst, FileCheckConst
-CompareConfig = namedtuple('CompareConfig', ['npu_csv_path', 'gpu_csv_path', 'result_csv_path', 'details_csv_path'])
-BenchmarkInf_Nan_Consistency = namedtuple('BenchmarkInf_Nan_Consistency', ['small_value_inf_nan_consistency',
-                                                                           'rmse_inf_nan_consistency',
-                                                                           'max_rel_inf_nan_consistency',
-                                                                           'mean_rel_inf_nan_consistency',
-                                                                           'eb_inf_nan_consistency'])
-unsupported_message = 'This data type does not support benchmark compare.'
-DEFAULT_THRESHOLD = 1
-benchmark_algorithms_thresholds = {
-    'small_value': {
-        'error_threshold': 2,
-        'warning_threshold': 1
-    },
-    'rmse': {
-        'error_threshold': 2,
-        'warning_threshold': 1
-    },
-    'max_rel_err': {
-        'error_threshold': 10,
-        'warning_threshold': 1
-    },
-    'mean_rel_err': {
-        'error_threshold': 2,
-        'warning_threshold': 1
-    },
-    'eb': {
-        'error_threshold': 2,
-        'warning_threshold': 1
-    }
-}
-benchmark_message = {
-    "small_value_err_status": {
-        CompareConst.ERROR: "ERROR: 小值域错误比值超过阈值\n",
-        CompareConst.WARNING: "WARNING: 小值域错误比值超过阈值\n"
-    },
-    "rmse_status": {
-        CompareConst.ERROR: "ERROR: 均方根误差比值超过阈值\n",
-        CompareConst.WARNING: "WARNING: 均方根误差比值超过阈值\n"
-    },
-    "max_rel_err_status": {
-        CompareConst.ERROR: "ERROR: 相对误差最大值比值超过阈值\n",
-        CompareConst.WARNING: "WARNING: 相对误差最大值比值超过阈值\n"
-    },
-    "mean_rel_err_status": {
-        CompareConst.ERROR: "ERROR: 相对误差平均值比值超过阈值\n",
-        CompareConst.WARNING: "WARNING: 相对误差平均值比值超过阈值\n"
-    }
-}
-class Standard:
-    @staticmethod
-    def _calc_ratio(column_name, x, y, default_value):
-        '''
-        计算npu侧和gpu侧统计量的比值
-        输入：
-            column_name：统计量名称
-            x：npu侧统计量
-            y：gpu侧统计量
-            default：当x不接近0，y接近0，设置的比值默认值
-        输出：
-            ratio：统计量x和y的比值
-            inf_nan_consistency：不出现inf或nan时为True，出现inf或nan时必须同时为inf或-inf或nan才为True，否则为False
-            message：当出现inf或nan时的提示信息
-        '''
-        x, y = convert_str_to_float(x), convert_str_to_float(y)
-        if is_inf_or_nan(x) or is_inf_or_nan(y):
-            return check_inf_or_nan(x, y, column_name)
-        inf_nan_consistency = True
-        message = ""
-        if math.isclose(y, 0.0):
-            if math.isclose(x, 0.0):
-                return 1.0, inf_nan_consistency, message
-            else:
-                return default_value, inf_nan_consistency, message
-        else:
-            return abs(x / y), inf_nan_consistency, message
-class BenchmarkStandard(Standard):
-    def __init__(self, api_name, npu_precision, gpu_precision):
-        self.api_name = api_name
-        self.npu_precision = npu_precision
-        self.gpu_precision = gpu_precision
-        self.small_value_err_ratio = 1
-        self.rmse_ratio = 1
-        self.max_rel_err_ratio = 1
-        self.mean_rel_err_ratio = 1
-        self.eb_ratio = 1
-        self.small_value_err_status = CompareConst.PASS
-        self.rmse_status = CompareConst.PASS
-        self.max_rel_err_status = CompareConst.PASS
-        self.mean_rel_err_status = CompareConst.PASS
-        self.eb_status = CompareConst.PASS
-        self.check_result_list = []
-        self.final_result = CompareConst.PASS
-        self.compare_message = ""
-    def __str__(self):
-        return "%s" % (self.api_name)
-    @staticmethod
-    def _get_status(ratio, algorithm):
-        if math.isnan(ratio) or math.isinf(ratio):
-            return CompareConst.PASS
-        error_threshold = benchmark_algorithms_thresholds.get(algorithm, {}).get('error_threshold', DEFAULT_THRESHOLD)
-        warning_threshold = benchmark_algorithms_thresholds.get(algorithm, {}).get('warning_threshold',
-                                                                                   DEFAULT_THRESHOLD)
-        if ratio > error_threshold:
-            return CompareConst.ERROR
-        elif ratio > warning_threshold:
-            return CompareConst.WARNING
-        return CompareConst.PASS
-    def get_result(self):
-        inf_nan_consistency = self._compare_ratio()
-        small_value_inf_nan_consistency = inf_nan_consistency.small_value_inf_nan_consistency
-        rmse_inf_nan_consistency = inf_nan_consistency.rmse_inf_nan_consistency
-        max_rel_inf_nan_consistency = inf_nan_consistency.max_rel_inf_nan_consistency
-        mean_rel_inf_nan_consistency = inf_nan_consistency.mean_rel_inf_nan_consistency
-        eb_inf_nan_consistency = inf_nan_consistency.eb_inf_nan_consistency
-        self.small_value_err_status = self._get_status(self.small_value_err_ratio, 'small_value') if \
-            small_value_inf_nan_consistency else CompareConst.ERROR
-        self.check_result_list.append(self.small_value_err_status)
-        self.rmse_status = self._get_status(self.rmse_ratio, 'rmse') if rmse_inf_nan_consistency \
-            else CompareConst.ERROR
-        self.check_result_list.append(self.rmse_status)
-        self.max_rel_err_status = self._get_status(self.max_rel_err_ratio, 'max_rel_err') if max_rel_inf_nan_consistency \
-            else CompareConst.ERROR
-        self.check_result_list.append(self.max_rel_err_status)
-        self.mean_rel_err_status = self._get_status(self.mean_rel_err_ratio, 'mean_rel_err') if mean_rel_inf_nan_consistency \
-            else CompareConst.ERROR
-        self.check_result_list.append(self.mean_rel_err_status)
-        self.eb_status = self._get_status(self.eb_ratio, 'eb')
-        if CompareConst.ERROR in self.check_result_list:
-            self.final_result = CompareConst.ERROR
-        elif CompareConst.WARNING in self.check_result_list:
-            self.final_result = CompareConst.WARNING
-    def to_column_value(self):
-        return [self.small_value_err_ratio, self.small_value_err_status, self.rmse_ratio,
-                self.rmse_status, self.max_rel_err_ratio, self.max_rel_err_status, self.mean_rel_err_ratio,
-                self.mean_rel_err_status, self.eb_ratio, self.eb_status]
-    def _compare_ratio(self):
-        self.small_value_err_ratio, small_value_inf_nan_consistency, small_value_message = self._calc_ratio(
-                                    ApiPrecisionCompareColumn.SMALL_VALUE_ERROR_RATE,
-                                    self.npu_precision.get(ApiPrecisionCompareColumn.SMALL_VALUE_ERROR_RATE),
-                                    self.gpu_precision.get(ApiPrecisionCompareColumn.SMALL_VALUE_ERROR_RATE), 10000.0)
-        self.compare_message += small_value_message
-        self.rmse_ratio, rmse_inf_nan_consistency, rmse_message = self._calc_ratio(ApiPrecisionCompareColumn.RMSE,
-                                        self.npu_precision.get(ApiPrecisionCompareColumn.RMSE),
-                                        self.gpu_precision.get(ApiPrecisionCompareColumn.RMSE), 10000.0)
-        self.compare_message += rmse_message
-        self.max_rel_err_ratio, max_rel_inf_nan_consistency, max_rel_message = self._calc_ratio(
-                                        ApiPrecisionCompareColumn.MAX_REL_ERR,
-                                        self.npu_precision.get(ApiPrecisionCompareColumn.MAX_REL_ERR),
-                                        self.gpu_precision.get(ApiPrecisionCompareColumn.MAX_REL_ERR), 10000.0)
-        self.compare_message += max_rel_message
-        self.mean_rel_err_ratio, mean_rel_inf_nan_consistency, mean_rel_message = self._calc_ratio(ApiPrecisionCompareColumn.MEAN_REL_ERR,
-                                        self.npu_precision.get(ApiPrecisionCompareColumn.MEAN_REL_ERR),
-                                        self.gpu_precision.get(ApiPrecisionCompareColumn.MEAN_REL_ERR), 10000.0)
-        self.compare_message += mean_rel_message
-        self.eb_ratio, eb_inf_nan_consistency, eb_message = self._calc_ratio(ApiPrecisionCompareColumn.EB,
-                                        self.npu_precision.get(ApiPrecisionCompareColumn.EB),
-                                        self.gpu_precision.get(ApiPrecisionCompareColumn.EB), 10000.0)
-        self.compare_message += eb_message
-        return BenchmarkInf_Nan_Consistency(small_value_inf_nan_consistency, rmse_inf_nan_consistency,
-                                            max_rel_inf_nan_consistency, mean_rel_inf_nan_consistency, eb_inf_nan_consistency)
-class ULPStandard(Standard):
-    def __init__(self, api_name, npu_precision, gpu_precision):
-        self.api_name = api_name
-        self.npu_precision = npu_precision
-        self.gpu_precision = gpu_precision
-        self.mean_ulp_err = 0
-        self.ulp_err_proportion = 0
-        self.ulp_err_proportion_ratio = 1
-        self.ulp_err_status = CompareConst.PASS
-        self.compare_message = ""
-    def __str__(self):
-        return f"{self.api_name}"
-    def get_result(self):
-        self.mean_ulp_err = convert_str_to_float(self.npu_precision.get(ApiPrecisionCompareColumn.MEAN_ULP_ERR))
-        gpu_mean_ulp_err = convert_str_to_float(self.gpu_precision.get(ApiPrecisionCompareColumn.MEAN_ULP_ERR))
-        inf_nan_consistency = True
-        if is_inf_or_nan(self.mean_ulp_err) or is_inf_or_nan(gpu_mean_ulp_err):
-            _, inf_nan_consistency, message = check_inf_or_nan(self.mean_ulp_err, gpu_mean_ulp_err,
-                                                                 ApiPrecisionCompareColumn.MEAN_ULP_ERR)
-            self.compare_message += message
-        self.ulp_err_proportion = convert_str_to_float(
-                                                self.npu_precision.get(ApiPrecisionCompareColumn.ULP_ERR_PROPORTION))
-        self.ulp_err_proportion_ratio, ulp_inf_nan_consistency, message = self._calc_ratio(
-                    ApiPrecisionCompareColumn.ULP_ERR_PROPORTION,
-                    self.npu_precision.get(ApiPrecisionCompareColumn.ULP_ERR_PROPORTION),
-                    self.gpu_precision.get(ApiPrecisionCompareColumn.ULP_ERR_PROPORTION), 10000.0)
-        inf_nan_consistency = inf_nan_consistency and ulp_inf_nan_consistency
-        self.compare_message += message
-        if inf_nan_consistency:
-            self.ulp_err_status = self._get_ulp_status(self.npu_precision.get(ApiPrecisionCompareColumn.DEVICE_DTYPE))
-        else:
-            self.ulp_err_status = CompareConst.ERROR
-    def _get_ulp_status(self, dtype):
-        """Judge the ULP comparison result for the given device dtype.
-
-        For float32 the result passes when ``self.mean_ulp_err`` is below 64, or
-        ``self.ulp_err_proportion`` is below 0.05, or
-        ``self.ulp_err_proportion_ratio`` is below 1. For any other dtype it
-        passes when ``self.ulp_err_proportion`` is below 0.001 or the ratio is
-        below 1. On failure an error line is appended to ``self.compare_message``.
-
-        Args:
-            dtype: Device dtype, either a ``torch.dtype`` or its string form
-                (e.g. ``"torch.float32"`` as read back from the detail CSV).
-
-        Returns:
-            ``CompareConst.PASS`` or ``CompareConst.ERROR``.
-        """
-        # The dtype taken from a CSV row is text, and a str never equals a
-        # torch.dtype object, so compare the string forms; otherwise float32
-        # results would always be judged by the stricter non-float32 branch.
-        if str(dtype) == str(torch.float32):
-            passed = (self.mean_ulp_err < 64
-                      or self.ulp_err_proportion < 0.05
-                      or self.ulp_err_proportion_ratio < 1)
-        else:
-            passed = self.ulp_err_proportion < 0.001 or self.ulp_err_proportion_ratio < 1
-        if passed:
-            return CompareConst.PASS
-        self.compare_message += "ERROR: ULP误差不满足标准\n"
-        return CompareConst.ERROR
-def write_detail_csv(content, save_path):
-    """Write one detail row through ``write_csv``.
-
-    Float items are rendered as fixed-point text with
-    ``msCheckerConfig.precision`` decimal places; every other item is passed
-    through unchanged.
-
-    Args:
-        content: Iterable of cell values forming a single row.
-        save_path: Destination path handed to ``write_csv``.
-    """
-    formatted_row = []
-    for item in content:
-        if isinstance(item, float):
-            formatted_row.append("{:.{}f}".format(item, msCheckerConfig.precision))
-        else:
-            formatted_row.append(item)
-    write_csv([formatted_row], save_path)
-def api_precision_compare(config):
-    """Run the offline NPU-vs-GPU precision comparison described by ``config``.
-
-    Reads both detail CSVs, validates their columns, writes the title rows of
-    the result and detail CSVs, analyses the data and finally applies
-    ``FileCheckConst.DATA_FILE_AUTHORITY`` to both output files.
-
-    Args:
-        config: Object exposing ``npu_csv_path``, ``gpu_csv_path``,
-            ``result_csv_path`` and ``details_csv_path``.
-
-    Raises:
-        Exception: Whatever ``pd.read_csv`` raised when an input CSV cannot be
-            read (logged first, then re-raised).
-        CompareException: From ``check_csv_columns`` when required columns
-            are missing.
-    """
-    logger.info("Start compare task")
-    logger.info(f"Compare task result will be saved in {config.result_csv_path}")
-    logger.info(f"Compare task detail will be saved in {config.details_csv_path}")
-    try:
-        npu_data = pd.read_csv(config.npu_csv_path)
-    except Exception as err:
-        logger.error(f"Open npu csv Error: {err}")
-        # Re-raise the real cause: carrying on would only fail on the next
-        # line with an UnboundLocalError for npu_data.
-        raise
-    check_csv_columns(npu_data.columns, "npu_csv")
-    try:
-        gpu_data = pd.read_csv(config.gpu_csv_path)
-    except Exception as err:
-        logger.error(f"Open gpu csv Error: {err}")
-        # Same reasoning as for the NPU file above.
-        raise
-    check_csv_columns(gpu_data.columns, "gpu_csv")
-    detail_csv_title = [ApiPrecisionCompareColumn.get_detail_csv_title()]
-    result_csv_title = [ApiPrecisionCompareColumn.get_result_csv_title()]
-    write_csv(result_csv_title, config.result_csv_path)
-    write_csv(detail_csv_title, config.details_csv_path)
-    try:
-        analyse_csv(npu_data, gpu_data, config)
-    except Exception as err:
-        # Best effort: keep whatever was already written and still fix the
-        # file permissions below.
-        logger.error(f"Analyse csv Error: {err}")
-    change_mode(config.result_csv_path, FileCheckConst.DATA_FILE_AUTHORITY)
-    change_mode(config.details_csv_path, FileCheckConst.DATA_FILE_AUTHORITY)
-def analyse_csv(npu_data, gpu_data, config):
-    """Compare every NPU detail row with its GPU counterpart and write both CSVs.
-
-    For each NPU row the GPU row with the same API name column value is looked
-    up, one comparison algorithm is selected, and the per-row outcome is
-    written to ``config.details_csv_path``. Forward and backward statuses are
-    accumulated per API; a summary row is written to ``config.result_csv_path``
-    each time the API name changes and once more after the loop for the last
-    API.
-
-    Args:
-        npu_data: NPU results table (iterated with ``iterrows``).
-        gpu_data: GPU results table, filtered on the API name column.
-        config: Object exposing ``details_csv_path`` and ``result_csv_path``.
-
-    Raises:
-        CompareException: If the GPU data holds more than one row for an API name.
-        ValueError: If an API name does not split into exactly six
-            "."-separated parts (tuple unpacking below).
-    """
-    forward_status, backward_status = [], []
-    last_api_name, last_api_dtype = None, None
-    for _, row_npu in npu_data.iterrows():
-        message = ''
-        compare_column = ApiPrecisionOutputColumn()
-        full_api_name_with_direction_status = row_npu[ApiPrecisionCompareColumn.API_NAME]
-        row_gpu = gpu_data[gpu_data[ApiPrecisionCompareColumn.API_NAME] == full_api_name_with_direction_status]
-        # Only the second and fourth dot-separated segments are used here.
-        _, api_name, _, direction_status, _, _ = full_api_name_with_direction_status.split(".")
-        # Rows without a GPU counterpart are dropped before any bookkeeping,
-        # so they neither reach the detail CSV nor trigger a summary flush.
-        if row_gpu.empty:
-            logger.warning(f'This API : {full_api_name_with_direction_status} does not exist in the GPU data.')
-            continue
-        if len(row_gpu) > 1:
-            msg = f'This API : {full_api_name_with_direction_status} has multiple records in the GPU data.'
-            raise CompareException(CompareException.INVALID_DATA_ERROR, msg)
-        row_gpu = row_gpu.iloc[0]
-        new_status = CompareConst.SPACE
-        # The current API has no output (e.g. requires_grad=False during backward), so skip the comparison
-        if row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE].isspace():
-            compare_column.api_name = full_api_name_with_direction_status
-            compare_column.compare_result = CompareConst.SKIP
-            compare_column.compare_message = row_npu[ApiPrecisionCompareColumn.MESSAGE]
-            new_status = CompareConst.SKIP
-            write_detail_csv(compare_column.to_column_value(), config.details_csv_path)
-        else:
-            compare_column.api_name = full_api_name_with_direction_status
-            # The first matching branch wins; if none matches, new_status
-            # stays CompareConst.SPACE and the detail row carries only the name.
-            if api_name in ThousandthStandardApi:
-                new_status = record_thousandth_threshold_result(compare_column, row_npu)
-            elif row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] not in BINARY_COMPARE_UNSUPPORT_LIST or \
-                api_name in BinaryStandardApi:
-                new_status = record_binary_consistency_result(api_name, compare_column, row_npu)
-            elif api_name in AbsoluteStandardApi:
-                new_status = record_absolute_threshold_result(compare_column, row_npu)
-            elif api_name in ULPStandardApi and \
-                row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] in ULP_COMPARE_SUPPORT_LIST:
-                us = ULPStandard(full_api_name_with_direction_status, row_npu, row_gpu)
-                new_status = record_ulp_compare_result(compare_column, us)
-            elif row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] in BENCHMARK_COMPARE_SUPPORT_LIST:
-                bs = BenchmarkStandard(full_api_name_with_direction_status, row_npu, row_gpu)
-                new_status = record_benchmark_compare_result(compare_column, bs)
-            write_detail_csv(compare_column.to_column_value(), config.details_csv_path)
-        # The API name changed: flush the summary row of the previous API and
-        # reset the accumulators before recording the current row.
-        if last_api_name is not None and api_name != last_api_name:
-            if last_api_dtype in API_PRECISION_COMPARE_UNSUPPORT_LIST:
-                message = unsupported_message
-                write_csv([[last_api_name, "skip", "skip", message]], config.result_csv_path)
-                forward_status, backward_status = [], []
-                message = ''
-            else:
-                forward_result = get_api_checker_result(forward_status)
-                backward_result = get_api_checker_result(backward_status)
-                message += CompareMessage.get(last_api_name, "") if forward_result == CompareConst.ERROR else ""
-                write_csv([[last_api_name, forward_result, backward_result, message]], config.result_csv_path)
-                forward_status, backward_status = [], []
-                message = ''
-        is_supported = row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] not in API_PRECISION_COMPARE_UNSUPPORT_LIST
-        last_api_name = api_name
-        last_api_dtype = row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE]
-        # Unsupported dtypes are remembered (for the "skip" summary row) but
-        # contribute no status.
-        if not is_supported:
-            continue
-        if direction_status == 'forward':
-            forward_status.append(new_status)
-        elif direction_status == 'backward':
-            backward_status.append(new_status)
-        else:
-            logger.error(f"Invalid direction status: {direction_status}")
-    # Flush the summary row of the last API seen in the loop.
-    if last_api_name is not None:
-        if last_api_dtype in API_PRECISION_COMPARE_UNSUPPORT_LIST:
-            message = unsupported_message
-            write_csv([[last_api_name, "skip", "skip", message]], config.result_csv_path)
-        else:
-            forward_result = get_api_checker_result(forward_status)
-            backward_result = get_api_checker_result(backward_status)
-            message += CompareMessage.get(last_api_name, "") if forward_result == CompareConst.ERROR else ""
-            write_csv([[last_api_name, forward_result, backward_result, message]], config.result_csv_path)
-def check_error_rate(npu_error_rate):
-    """Return ``CompareConst.PASS`` when the converted error rate equals 0, else ``CompareConst.ERROR``."""
-    if convert_str_to_float(npu_error_rate) == 0:
-        return CompareConst.PASS
-    return CompareConst.ERROR
-def get_absolute_threshold_result(row_npu):
-    """Evaluate the three absolute-threshold ratios of one NPU row.
-
-    Each ratio is converted with ``convert_str_to_float`` and passes only when
-    it equals 0. The overall result is ERROR as soon as any single check is
-    ERROR.
-
-    Args:
-        row_npu: Mapping-like row indexed by ``ApiPrecisionCompareColumn`` names.
-
-    Returns:
-        dict with the three ratios, their individual results and the overall
-        ``absolute_threshold_result``.
-    """
-    def _judge(ratio):
-        return CompareConst.PASS if ratio == 0 else CompareConst.ERROR
-
-    inf_nan_error_ratio = convert_str_to_float(row_npu[ApiPrecisionCompareColumn.INF_NAN_ERROR_RATIO])
-    rel_err_ratio = convert_str_to_float(row_npu[ApiPrecisionCompareColumn.REL_ERR_RATIO])
-    abs_err_ratio = convert_str_to_float(row_npu[ApiPrecisionCompareColumn.ABS_ERR_RATIO])
-
-    outcome = {
-        "inf_nan_error_ratio": inf_nan_error_ratio,
-        "inf_nan_result": _judge(inf_nan_error_ratio),
-        "rel_err_ratio": rel_err_ratio,
-        "rel_err_result": _judge(rel_err_ratio),
-        "abs_err_ratio": abs_err_ratio,
-        "abs_err_result": _judge(abs_err_ratio),
-    }
-    any_failed = any(
-        outcome[key] == CompareConst.ERROR
-        for key in ("inf_nan_result", "rel_err_result", "abs_err_result")
-    )
-    outcome["absolute_threshold_result"] = CompareConst.ERROR if any_failed else CompareConst.PASS
-    return outcome
-def get_api_checker_result(status):
-    """Collapse a list of per-row statuses into a single API-level status.
-
-    Returns ``CompareConst.SPACE`` for an empty list, ``CompareConst.SKIP``
-    when every entry is SKIP, otherwise ERROR if present, else WARNING if
-    present, else PASS.
-    """
-    if not status:
-        return CompareConst.SPACE
-    if not any(item != CompareConst.SKIP for item in status):
-        return CompareConst.SKIP
-    if CompareConst.ERROR in status:
-        return CompareConst.ERROR
-    if CompareConst.WARNING in status:
-        return CompareConst.WARNING
-    return CompareConst.PASS
-def check_csv_columns(columns, csv_type):
-    """Verify that ``columns`` contains every required comparison column.
-
-    Args:
-        columns: Column collection of the loaded CSV (supports ``in``).
-        csv_type: Label of the CSV being checked, used in the error message.
-
-    Raises:
-        CompareException: With ``INVALID_DATA_ERROR`` when any column returned
-            by ``ApiPrecisionCompareColumn.to_required_columns()`` is absent.
-    """
-    required_columns = ApiPrecisionCompareColumn.to_required_columns()
-    missing_columns = [column for column in required_columns if column not in columns]
-    if missing_columns:
-        # A space was missing before the CSV label, gluing it to "in".
-        msg = f"The following columns {','.join(missing_columns)} are missing in {csv_type}"
-        raise CompareException(CompareException.INVALID_DATA_ERROR, msg)
-def record_binary_consistency_result(api_name, compare_column, row_npu):
-    """Fill ``compare_column`` with the binary-consistency verdict of one row.
-
-    The status comes from ``check_error_rate`` applied to the row's error
-    rate. On ERROR the message carries a fixed error line followed by
-    ``CompareMessage.get(api_name, "")``.
-
-    Returns:
-        The status that was stored as the compare result.
-    """
-    verdict = check_error_rate(row_npu[ApiPrecisionCompareColumn.ERROR_RATE])
-    compare_column.error_rate = row_npu[ApiPrecisionCompareColumn.ERROR_RATE]
-    compare_column.error_rate_status = verdict
-    compare_column.compare_result = verdict
-    compare_column.compare_algorithm = "二进制一致法"
-    if compare_column.error_rate_status == CompareConst.ERROR:
-        compare_column.compare_message = "ERROR: 二进制一致错误率超过阈值\n" + CompareMessage.get(api_name, "")
-    else:
-        compare_column.compare_message = ''
-    return verdict
-def record_absolute_threshold_result(compare_column, row_npu):
-    """Fill ``compare_column`` with the absolute-threshold verdict of one row.
-
-    Copies the ratios and statuses produced by
-    ``get_absolute_threshold_result`` onto ``compare_column`` and builds a
-    message containing one error line per failed check.
-
-    Returns:
-        The overall compare result stored on ``compare_column``.
-    """
-    outcome = get_absolute_threshold_result(row_npu)
-    # (attribute on compare_column, key in the outcome dict)
-    field_sources = (
-        ("inf_nan_error_ratio", "inf_nan_error_ratio"),
-        ("inf_nan_error_ratio_status", "inf_nan_result"),
-        ("rel_err_ratio", "rel_err_ratio"),
-        ("rel_err_ratio_status", "rel_err_result"),
-        ("abs_err_ratio", "abs_err_ratio"),
-        ("abs_err_ratio_status", "abs_err_result"),
-        ("compare_result", "absolute_threshold_result"),
-    )
-    for attr_name, key in field_sources:
-        setattr(compare_column, attr_name, outcome.get(key))
-    compare_column.compare_algorithm = "绝对阈值法"
-    failure_texts = (
-        ("inf_nan_error_ratio_status", "ERROR: inf/nan错误率超过阈值\n"),
-        ("rel_err_ratio_status", "ERROR: 相对误差错误率超过阈值\n"),
-        ("abs_err_ratio_status", "ERROR: 绝对误差错误率超过阈值\n"),
-    )
-    compare_column.compare_message = ''.join(
-        text for attr_name, text in failure_texts
-        if getattr(compare_column, attr_name) == CompareConst.ERROR
-    )
-    return compare_column.compare_result
-def record_benchmark_compare_result(compare_column, bs):
-    """Run the benchmark standard ``bs`` and copy its outcome onto ``compare_column``.
-
-    After ``bs.get_result()`` the five ratio/status pairs, the final result
-    and the message are copied over; then, for every status attribute listed
-    in ``benchmark_message``, the text registered for its current value (if
-    any) is appended to the message.
-
-    Returns:
-        The compare result stored on ``compare_column``.
-    """
-    bs.get_result()
-    copied_fields = (
-        "small_value_err_ratio", "small_value_err_status",
-        "rmse_ratio", "rmse_status",
-        "max_rel_err_ratio", "max_rel_err_status",
-        "mean_rel_err_ratio", "mean_rel_err_status",
-        "eb_ratio", "eb_status",
-    )
-    for field_name in copied_fields:
-        setattr(compare_column, field_name, getattr(bs, field_name))
-    compare_column.compare_result = bs.final_result
-    compare_column.compare_algorithm = "标杆比对法"
-    compare_column.compare_message = bs.compare_message
-    for status_attr, messages in benchmark_message.items():
-        current_status = getattr(compare_column, status_attr)
-        if current_status not in messages:
-            continue
-        compare_column.compare_message += messages[current_status]
-    return compare_column.compare_result
-def record_ulp_compare_result(compare_column, us):
-    """Run the ULP standard ``us`` and copy its outcome onto ``compare_column``.
-
-    Returns:
-        The compare result stored on ``compare_column`` (the ULP status).
-    """
-    us.get_result()
-    for field_name in ("mean_ulp_err", "ulp_err_proportion", "ulp_err_proportion_ratio", "ulp_err_status"):
-        setattr(compare_column, field_name, getattr(us, field_name))
-    compare_column.compare_result = us.ulp_err_status
-    compare_column.compare_algorithm = "ULP误差比对法"
-    compare_column.compare_message = us.compare_message
-    return compare_column.compare_result
-def check_thousandth_rate(thousandth_rate):
-    """Return ``CompareConst.PASS`` when the converted rate is at least 0.999, else ``CompareConst.ERROR``."""
-    if convert_str_to_float(thousandth_rate) >= 0.999:
-        return CompareConst.PASS
-    return CompareConst.ERROR
-def record_thousandth_threshold_result(compare_column, row_npu):
-    """Fill ``compare_column`` with the thousandth-threshold verdict of one row.
-
-    The status comes from ``check_thousandth_rate`` applied to the row's
-    ``REL_ERR_THOUSANDTH`` value; on ERROR a fixed error line becomes the
-    message.
-
-    Returns:
-        The compare result stored on ``compare_column``.
-    """
-    verdict = check_thousandth_rate(row_npu[ApiPrecisionCompareColumn.REL_ERR_THOUSANDTH])
-    compare_column.rel_err_thousandth = row_npu[ApiPrecisionCompareColumn.REL_ERR_THOUSANDTH]
-    compare_column.rel_err_thousandth_status = verdict
-    compare_column.compare_result = verdict
-    compare_column.compare_algorithm = "双千指标法"
-    failed = compare_column.rel_err_thousandth_status == CompareConst.ERROR
-    compare_column.compare_message = "ERROR: 双千指标不达标\n" if failed else ''
-    return compare_column.compare_result
-def _api_precision_compare(parser=None):
-    """Command-line entry: register the options, parse ``sys.argv`` and run the comparison.
-
-    Args:
-        parser: Optional existing argument parser; a fresh
-            ``argparse.ArgumentParser`` is created when it is falsy.
-    """
-    parser = parser or argparse.ArgumentParser()
-    _api_precision_compare_parser(parser)
-    cli_args = parser.parse_args(sys.argv[1:])
-    _api_precision_compare_command(cli_args)
-def _api_precision_compare_command(args):
-    """Validate the parsed arguments, prepare the output directory and start the comparison.
-
-    Args:
-        args: Parsed namespace providing ``npu_csv_path``, ``gpu_csv_path``
-            and ``out_path``.
-    """
-    npu_csv_path = get_validated_result_csv_path(args.npu_csv_path, 'detail')
-    gpu_csv_path = get_validated_result_csv_path(args.gpu_csv_path, 'detail')
-    # An empty out_path falls back to the current directory.
-    if args.out_path:
-        out_path = os.path.realpath(args.out_path)
-    else:
-        out_path = "./"
-    check_path_before_create(out_path)
-    create_directory(out_path)
-    out_path = FileChecker(out_path, FileCheckConst.DIR, ability=FileCheckConst.WRITE_ABLE).common_check()
-    compare_config = CompareConfig(
-        npu_csv_path,
-        gpu_csv_path,
-        os.path.join(out_path, API_PRECISION_COMPARE_RESULT_FILE_NAME),
-        os.path.join(out_path, API_PRECISION_COMPARE_DETAILS_FILE_NAME),
-    )
-    api_precision_compare(compare_config)
-def _api_precision_compare_parser(parser):
-    """Register the api-precision-compare command-line options on ``parser``.
-
-    Options:
-        -npu / --npu_csv_path: required, detail CSV generated on the NPU.
-        -gpu / --gpu_csv_path: required, detail CSV generated on the GPU.
-        -o / --out_path: optional output directory (defaults to "").
-
-    Args:
-        parser: An ``argparse.ArgumentParser`` (or sub-parser) to extend.
-    """
-    parser.add_argument("-npu", "--npu_csv_path", dest="npu_csv_path", default="", type=str,
-                        help="<Required> , Accuracy_checking_details.csv generated on the NPU by using the "
-                             "api_accuracy_checker tool.",
-                        required=True)
-    # The GPU CSV is documented as required and is always validated by the
-    # command, so let argparse reject a missing value up front instead of
-    # passing an empty path downstream.
-    parser.add_argument("-gpu", "--gpu_csv_path", dest="gpu_csv_path", default="", type=str,
-                        help="<Required> Accuracy_checking_details.csv generated on the GPU by using the "
-                             "api_accuracy_checker tool.",
-                        required=True)
-    parser.add_argument("-o", "--out_path", dest="out_path", default="", type=str,
-                        help="<optional> The api precision compare task result out path.",
-                        required=False)
-# Script entry point: run the command-line comparison, then log completion.
-if __name__ == '__main__':
-    _api_precision_compare()
-    logger.info("Compare task completed.")
+import argparse
+import math
+import os
+import sys
+from collections import namedtuple
+import torch
+import pandas as pd
+from msprobe.core.common.file_utils import write_csv
+from msprobe.pytorch.api_accuracy_checker.common.config import msCheckerConfig
+from msprobe.pytorch.api_accuracy_checker.compare.compare_utils import API_PRECISION_COMPARE_RESULT_FILE_NAME, \
+    API_PRECISION_COMPARE_DETAILS_FILE_NAME, BENCHMARK_COMPARE_SUPPORT_LIST, API_PRECISION_COMPARE_UNSUPPORT_LIST, \
+    ApiPrecisionCompareColumn, absolute_standard_api, binary_standard_api, ulp_standard_api, thousandth_standard_api, \
+    BINARY_COMPARE_UNSUPPORT_LIST, ULP_COMPARE_SUPPORT_LIST, convert_str_to_float, CompareMessage, is_inf_or_nan, \
+    check_inf_or_nan
+from msprobe.pytorch.api_accuracy_checker.compare.compare_column import ApiPrecisionOutputColumn
+from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut_utils import get_validated_result_csv_path
+from msprobe.pytorch.api_accuracy_checker.common.utils import extract_detailed_api_segments
+from msprobe.core.common.file_utils import FileChecker, change_mode, check_path_before_create, create_directory
+from msprobe.pytorch.common.log import logger
+from msprobe.core.common.utils import CompareException
+from msprobe.core.common.const import Const, CompareConst, FileCheckConst
+# Paths consumed by one comparison run: the two input CSVs and the two output CSVs.
+CompareConfig = namedtuple('CompareConfig', ['npu_csv_path', 'gpu_csv_path', 'result_csv_path', 'details_csv_path'])
+# One inf/nan-consistency flag per benchmark metric, in the order produced by
+# BenchmarkStandard._compare_ratio.
+BenchmarkInf_Nan_Consistency = namedtuple('BenchmarkInf_Nan_Consistency', ['small_value_inf_nan_consistency',
+                                                                           'rmse_inf_nan_consistency',
+                                                                           'max_rel_inf_nan_consistency',
+                                                                           'mean_rel_inf_nan_consistency',
+                                                                           'eb_inf_nan_consistency'])
+# Message written to the result CSV for APIs whose dtype is in
+# API_PRECISION_COMPARE_UNSUPPORT_LIST.
+unsupported_message = 'This data type does not support benchmark compare.'
+# Fallback threshold used by BenchmarkStandard._get_status for unknown algorithms.
+DEFAULT_THRESHOLD = 1
+# Per-algorithm ratio thresholds: a ratio above 'error_threshold' is an ERROR,
+# otherwise a ratio above 'warning_threshold' is a WARNING
+# (see BenchmarkStandard._get_status).
+benchmark_algorithms_thresholds = {
+    'small_value': {
+        'error_threshold': 2,
+        'warning_threshold': 1
+    },
+    'rmse': {
+        'error_threshold': 2,
+        'warning_threshold': 1
+    },
+    'max_rel_err': {
+        'error_threshold': 10,
+        'warning_threshold': 1
+    },
+    'mean_rel_err': {
+        'error_threshold': 2,
+        'warning_threshold': 1
+    },
+    'eb': {
+        'error_threshold': 2,
+        'warning_threshold': 1
+    }
+}
+# Message text per status attribute and status value.
+# NOTE(review): there is no "eb_status" entry, although thresholds for 'eb'
+# exist above - confirm whether EB messages are intentionally omitted.
+benchmark_message = {
+    "small_value_err_status": {
+        CompareConst.ERROR: "ERROR: 小值域错误比值超过阈值\n",
+        CompareConst.WARNING: "WARNING: 小值域错误比值超过阈值\n"
+    },
+    "rmse_status": {
+        CompareConst.ERROR: "ERROR: 均方根误差比值超过阈值\n",
+        CompareConst.WARNING: "WARNING: 均方根误差比值超过阈值\n"
+    },
+    "max_rel_err_status": {
+        CompareConst.ERROR: "ERROR: 相对误差最大值比值超过阈值\n",
+        CompareConst.WARNING: "WARNING: 相对误差最大值比值超过阈值\n"
+    },
+    "mean_rel_err_status": {
+        CompareConst.ERROR: "ERROR: 相对误差平均值比值超过阈值\n",
+        CompareConst.WARNING: "WARNING: 相对误差平均值比值超过阈值\n"
+    }
+}
+class Standard:
+    """Base class holding the ratio helper shared by the comparison standards."""
+
+    @staticmethod
+    def _calc_ratio(column_name, x, y, default_value):
+        '''
+        Compute the ratio between the NPU-side and GPU-side statistics.
+        Inputs:
+            column_name: name of the statistic
+            x: NPU-side statistic
+            y: GPU-side statistic
+            default_value: ratio to use when x is not close to 0 but y is close to 0
+        Outputs:
+            ratio: ratio of x to y
+            inf_nan_consistency: True when no inf or nan appears; when inf or nan appears it is
+                True only if both sides are inf, -inf or nan at the same time, otherwise False
+            message: hint text produced when inf or nan appears
+        '''
+        npu_value = convert_str_to_float(x)
+        gpu_value = convert_str_to_float(y)
+        if is_inf_or_nan(npu_value) or is_inf_or_nan(gpu_value):
+            return check_inf_or_nan(npu_value, gpu_value, column_name)
+        # math.isclose with its default tolerances (abs_tol=0) against 0.0 only
+        # matches an exact zero.
+        if not math.isclose(gpu_value, 0.0):
+            return abs(npu_value / gpu_value), True, ""
+        ratio = 1.0 if math.isclose(npu_value, 0.0) else default_value
+        return ratio, True, ""
+class BenchmarkStandard(Standard):
+    """Benchmark comparison of one API: NPU/GPU ratios of five metrics and their statuses."""
+    def __init__(self, api_name, npu_precision, gpu_precision):
+        """Store the API name and both precision rows; all ratios start at 1 and all statuses at PASS."""
+        self.api_name = api_name
+        self.npu_precision = npu_precision
+        self.gpu_precision = gpu_precision
+        self.small_value_err_ratio = 1
+        self.rmse_ratio = 1
+        self.max_rel_err_ratio = 1
+        self.mean_rel_err_ratio = 1
+        self.eb_ratio = 1
+        self.small_value_err_status = CompareConst.PASS
+        self.rmse_status = CompareConst.PASS
+        self.max_rel_err_status = CompareConst.PASS
+        self.mean_rel_err_status = CompareConst.PASS
+        self.eb_status = CompareConst.PASS
+        self.check_result_list = []
+        self.final_result = CompareConst.PASS
+        self.compare_message = ""
+    def __str__(self):
+        """Return the API name."""
+        return "%s" % (self.api_name)
+    @staticmethod
+    def _get_status(ratio, algorithm):
+        """Map a ratio to PASS/WARNING/ERROR using the thresholds registered for ``algorithm``.
+
+        A nan or inf ratio yields PASS here; unknown algorithms fall back to
+        ``DEFAULT_THRESHOLD`` for both thresholds.
+        """
+        if math.isnan(ratio) or math.isinf(ratio):
+            return CompareConst.PASS
+        error_threshold = benchmark_algorithms_thresholds.get(algorithm, {}).get('error_threshold', DEFAULT_THRESHOLD)
+        warning_threshold = benchmark_algorithms_thresholds.get(algorithm, {}).get('warning_threshold',
+                                                                                   DEFAULT_THRESHOLD)
+        if ratio > error_threshold:
+            return CompareConst.ERROR
+        elif ratio > warning_threshold:
+            return CompareConst.WARNING
+        return CompareConst.PASS
+    def get_result(self):
+        """Compute all ratios, derive each metric status and set ``final_result``.
+
+        A metric whose inf/nan consistency flag is False is marked ERROR
+        without consulting the thresholds. Statuses are appended to
+        ``check_result_list`` on every call (the list is not cleared here).
+        """
+        inf_nan_consistency = self._compare_ratio()
+        small_value_inf_nan_consistency = inf_nan_consistency.small_value_inf_nan_consistency
+        rmse_inf_nan_consistency = inf_nan_consistency.rmse_inf_nan_consistency
+        max_rel_inf_nan_consistency = inf_nan_consistency.max_rel_inf_nan_consistency
+        mean_rel_inf_nan_consistency = inf_nan_consistency.mean_rel_inf_nan_consistency
+        # NOTE(review): eb_inf_nan_consistency is read but never used below.
+        eb_inf_nan_consistency = inf_nan_consistency.eb_inf_nan_consistency
+        self.small_value_err_status = self._get_status(self.small_value_err_ratio, 'small_value') if \
+            small_value_inf_nan_consistency else CompareConst.ERROR
+        self.check_result_list.append(self.small_value_err_status)
+        self.rmse_status = self._get_status(self.rmse_ratio, 'rmse') if rmse_inf_nan_consistency \
+            else CompareConst.ERROR
+        self.check_result_list.append(self.rmse_status)
+        self.max_rel_err_status = self._get_status(self.max_rel_err_ratio, 'max_rel_err') if max_rel_inf_nan_consistency \
+            else CompareConst.ERROR
+        self.check_result_list.append(self.max_rel_err_status)
+        self.mean_rel_err_status = self._get_status(self.mean_rel_err_ratio, 'mean_rel_err') if mean_rel_inf_nan_consistency \
+            else CompareConst.ERROR
+        self.check_result_list.append(self.mean_rel_err_status)
+        # NOTE(review): eb_status is not appended to check_result_list, so it
+        # never influences final_result - confirm this is intended.
+        self.eb_status = self._get_status(self.eb_ratio, 'eb')
+        if CompareConst.ERROR in self.check_result_list:
+            self.final_result = CompareConst.ERROR
+        elif CompareConst.WARNING in self.check_result_list:
+            self.final_result = CompareConst.WARNING
+    def to_column_value(self):
+        """Return the five ratio/status pairs as a flat list."""
+        return [self.small_value_err_ratio, self.small_value_err_status, self.rmse_ratio,
+                self.rmse_status, self.max_rel_err_ratio, self.max_rel_err_status, self.mean_rel_err_ratio,
+                self.mean_rel_err_status, self.eb_ratio, self.eb_status]
+    def _compare_ratio(self):
+        """Compute the NPU/GPU ratio of every metric and collect the inf/nan messages.
+
+        Each ratio uses 10000.0 as the default when only the GPU value is
+        zero. Messages are appended to ``compare_message`` in metric order.
+
+        Returns:
+            BenchmarkInf_Nan_Consistency with one consistency flag per metric.
+        """
+        self.small_value_err_ratio, small_value_inf_nan_consistency, small_value_message = self._calc_ratio(
+                                    ApiPrecisionCompareColumn.SMALL_VALUE_ERROR_RATE,
+                                    self.npu_precision.get(ApiPrecisionCompareColumn.SMALL_VALUE_ERROR_RATE),
+                                    self.gpu_precision.get(ApiPrecisionCompareColumn.SMALL_VALUE_ERROR_RATE), 10000.0)
+        self.compare_message += small_value_message
+        self.rmse_ratio, rmse_inf_nan_consistency, rmse_message = self._calc_ratio(ApiPrecisionCompareColumn.RMSE,
+                                        self.npu_precision.get(ApiPrecisionCompareColumn.RMSE),
+                                        self.gpu_precision.get(ApiPrecisionCompareColumn.RMSE), 10000.0)
+        self.compare_message += rmse_message
+        self.max_rel_err_ratio, max_rel_inf_nan_consistency, max_rel_message = self._calc_ratio(
+                                        ApiPrecisionCompareColumn.MAX_REL_ERR,
+                                        self.npu_precision.get(ApiPrecisionCompareColumn.MAX_REL_ERR),
+                                        self.gpu_precision.get(ApiPrecisionCompareColumn.MAX_REL_ERR), 10000.0)
+        self.compare_message += max_rel_message
+        self.mean_rel_err_ratio, mean_rel_inf_nan_consistency, mean_rel_message = self._calc_ratio(ApiPrecisionCompareColumn.MEAN_REL_ERR,
+                                        self.npu_precision.get(ApiPrecisionCompareColumn.MEAN_REL_ERR),
+                                        self.gpu_precision.get(ApiPrecisionCompareColumn.MEAN_REL_ERR), 10000.0)
+        self.compare_message += mean_rel_message
+        self.eb_ratio, eb_inf_nan_consistency, eb_message = self._calc_ratio(ApiPrecisionCompareColumn.EB,
+                                        self.npu_precision.get(ApiPrecisionCompareColumn.EB),
+                                        self.gpu_precision.get(ApiPrecisionCompareColumn.EB), 10000.0)
+        self.compare_message += eb_message
+        return BenchmarkInf_Nan_Consistency(small_value_inf_nan_consistency, rmse_inf_nan_consistency,
+                                            max_rel_inf_nan_consistency, mean_rel_inf_nan_consistency, eb_inf_nan_consistency)
+class ULPStandard(Standard):
+    """ULP comparison of one API based on the NPU and GPU precision rows."""
+    def __init__(self, api_name, npu_precision, gpu_precision):
+        """Store the API name and both precision rows; the status starts at PASS."""
+        self.api_name = api_name
+        self.npu_precision = npu_precision
+        self.gpu_precision = gpu_precision
+        self.mean_ulp_err = 0
+        self.ulp_err_proportion = 0
+        self.ulp_err_proportion_ratio = 1
+        self.ulp_err_status = CompareConst.PASS
+        self.compare_message = ""
+    def __str__(self):
+        """Return the API name."""
+        return f"{self.api_name}"
+    def get_result(self):
+        """Read the ULP statistics, compute the proportion ratio and set ``ulp_err_status``.
+
+        If the inf/nan check of the mean ULP error or of the proportion ratio
+        reports an inconsistency, the status is ERROR; otherwise it is decided
+        by ``_get_ulp_status`` for the NPU row's device dtype.
+        """
+        self.mean_ulp_err = convert_str_to_float(self.npu_precision.get(ApiPrecisionCompareColumn.MEAN_ULP_ERR))
+        gpu_mean_ulp_err = convert_str_to_float(self.gpu_precision.get(ApiPrecisionCompareColumn.MEAN_ULP_ERR))
+        inf_nan_consistency = True
+        if is_inf_or_nan(self.mean_ulp_err) or is_inf_or_nan(gpu_mean_ulp_err):
+            _, inf_nan_consistency, message = check_inf_or_nan(self.mean_ulp_err, gpu_mean_ulp_err,
+                                                                 ApiPrecisionCompareColumn.MEAN_ULP_ERR)
+            self.compare_message += message
+        self.ulp_err_proportion = convert_str_to_float(
+            self.npu_precision.get(ApiPrecisionCompareColumn.ULP_ERR_PROPORTION))
+        self.ulp_err_proportion_ratio, ulp_inf_nan_consistency, message = self._calc_ratio(
+            ApiPrecisionCompareColumn.ULP_ERR_PROPORTION,
+            self.npu_precision.get(ApiPrecisionCompareColumn.ULP_ERR_PROPORTION),
+            self.gpu_precision.get(ApiPrecisionCompareColumn.ULP_ERR_PROPORTION), 10000.0)
+        inf_nan_consistency = inf_nan_consistency and ulp_inf_nan_consistency
+        self.compare_message += message
+        if inf_nan_consistency:
+            self.ulp_err_status = self._get_ulp_status(self.npu_precision.get(ApiPrecisionCompareColumn.DEVICE_DTYPE))
+        else:
+            self.ulp_err_status = CompareConst.ERROR
+    def _get_ulp_status(self, dtype):
+        """Judge the ULP result for the given device dtype.
+
+        float32 passes when ``mean_ulp_err`` is below 64, or
+        ``ulp_err_proportion`` is below 0.05, or ``ulp_err_proportion_ratio``
+        is below 1. Any other dtype passes when ``ulp_err_proportion`` is below
+        0.001 or the ratio is below 1. On failure an error line is appended to
+        ``compare_message``.
+
+        Args:
+            dtype: Device dtype, either a ``torch.dtype`` or its string form
+                (e.g. ``"torch.float32"`` when the row was loaded from a CSV).
+
+        Returns:
+            ``CompareConst.PASS`` or ``CompareConst.ERROR``.
+        """
+        # A str never equals a torch.dtype object, so compare the string forms;
+        # otherwise a textual "torch.float32" would always be judged by the
+        # stricter non-float32 branch.
+        if str(dtype) == str(torch.float32):
+            passed = (self.mean_ulp_err < 64
+                      or self.ulp_err_proportion < 0.05
+                      or self.ulp_err_proportion_ratio < 1)
+        else:
+            passed = self.ulp_err_proportion < 0.001 or self.ulp_err_proportion_ratio < 1
+        if passed:
+            return CompareConst.PASS
+        self.compare_message += "ERROR: ULP误差不满足标准\n"
+        return CompareConst.ERROR
+def write_detail_csv(content, save_path):
+    """Write one detail row through ``write_csv``.
+
+    Float items are rendered as fixed-point text with
+    ``msCheckerConfig.precision`` decimal places; every other item is passed
+    through unchanged.
+
+    Args:
+        content: Iterable of cell values forming a single row.
+        save_path: Destination path handed to ``write_csv``.
+    """
+    formatted_row = []
+    for item in content:
+        if isinstance(item, float):
+            formatted_row.append("{:.{}f}".format(item, msCheckerConfig.precision))
+        else:
+            formatted_row.append(item)
+    write_csv([formatted_row], save_path)
+def api_precision_compare(config):
+    """Run the offline NPU-vs-GPU precision comparison described by ``config``.
+
+    Reads both detail CSVs, validates their columns, writes the title rows of
+    the result and detail CSVs, analyses the data and finally applies
+    ``FileCheckConst.DATA_FILE_AUTHORITY`` to both output files.
+
+    Args:
+        config: Object exposing ``npu_csv_path``, ``gpu_csv_path``,
+            ``result_csv_path`` and ``details_csv_path``.
+
+    Raises:
+        Exception: Whatever ``pd.read_csv`` raised when an input CSV cannot be
+            read (logged first, then re-raised).
+        CompareException: From ``check_csv_columns`` when required columns
+            are missing.
+    """
+    logger.info("Start compare task")
+    logger.info(f"Compare task result will be saved in {config.result_csv_path}")
+    logger.info(f"Compare task detail will be saved in {config.details_csv_path}")
+    try:
+        npu_data = pd.read_csv(config.npu_csv_path)
+    except Exception as err:
+        logger.error(f"Open npu csv Error: {err}")
+        # Re-raise the real cause: carrying on would only fail on the next
+        # line with an UnboundLocalError for npu_data.
+        raise
+    check_csv_columns(npu_data.columns, "npu_csv")
+    try:
+        gpu_data = pd.read_csv(config.gpu_csv_path)
+    except Exception as err:
+        logger.error(f"Open gpu csv Error: {err}")
+        # Same reasoning as for the NPU file above.
+        raise
+    check_csv_columns(gpu_data.columns, "gpu_csv")
+    detail_csv_title = [ApiPrecisionCompareColumn.get_detail_csv_title()]
+    result_csv_title = [ApiPrecisionCompareColumn.get_result_csv_title()]
+    write_csv(result_csv_title, config.result_csv_path)
+    write_csv(detail_csv_title, config.details_csv_path)
+    try:
+        analyse_csv(npu_data, gpu_data, config)
+    except Exception as err:
+        # Best effort: keep whatever was already written and still fix the
+        # file permissions below.
+        logger.error(f"Analyse csv Error: {err}")
+    change_mode(config.result_csv_path, FileCheckConst.DATA_FILE_AUTHORITY)
+    change_mode(config.details_csv_path, FileCheckConst.DATA_FILE_AUTHORITY)
+def online_api_precision_compare(online_config):
+    """Run the precision comparison on in-memory data for one rank.
+
+    The output paths are built under ``Const.DEFAULT_PATH`` with the
+    ``_rank*.csv`` placeholder replaced by the actual rank. Title rows are
+    written only for files that do not exist yet. Any exception raised while
+    checking or analysing the data is logged and not propagated; the file
+    mode of both outputs is changed afterwards in every case.
+
+    Args:
+        online_config: Object exposing ``rank``, ``result_csv_path``,
+            ``details_csv_path``, ``npu_data`` and ``gpu_data``.
+    """
+    rank_suffix = f"_rank{online_config.rank}.csv"
+    result_csv_path = os.path.join(Const.DEFAULT_PATH, online_config.result_csv_path).replace(
+        "_rank*.csv", rank_suffix)
+    details_csv_path = os.path.join(Const.DEFAULT_PATH, online_config.details_csv_path).replace(
+        "_rank*.csv", rank_suffix)
+    detail_csv_title = [ApiPrecisionCompareColumn.get_detail_csv_title()]
+    result_csv_title = [ApiPrecisionCompareColumn.get_result_csv_title()]
+    pending_headers = ((result_csv_path, result_csv_title), (details_csv_path, detail_csv_title))
+    for csv_path, title_rows in pending_headers:
+        if not os.path.exists(csv_path):
+            write_csv(title_rows, csv_path)
+    config = CompareConfig("", "", result_csv_path, details_csv_path)
+    try:
+        npu_data = online_config.npu_data
+        gpu_data = online_config.gpu_data
+        check_csv_columns(npu_data.columns, "npu_csv")
+        check_csv_columns(gpu_data.columns, "gpu_csv")
+        analyse_csv(npu_data, gpu_data, config)
+    except Exception as err:
+        logger.error(f"Online api precision compare Error: {str(err)}")
+    for csv_path in (result_csv_path, details_csv_path):
+        change_mode(csv_path, FileCheckConst.DATA_FILE_AUTHORITY)
+def analyse_csv(npu_data, gpu_data, config):
+    forward_status, backward_status = [], []
+    last_api_name, last_api_dtype, last_api_full_name = None, None, None
+    for _, row_npu in npu_data.iterrows():
+        message = ''
+        compare_column = ApiPrecisionOutputColumn()
+        full_api_name_with_direction_status = row_npu[ApiPrecisionCompareColumn.API_NAME]
+        row_gpu = gpu_data[gpu_data[ApiPrecisionCompareColumn.API_NAME] == full_api_name_with_direction_status]
+        api_name, api_full_name, direction_status = extract_detailed_api_segments(full_api_name_with_direction_status)
+        if not api_full_name:
+            err_message = f"The API name {full_api_name_with_direction_status} is invalid."
+            logger.error(err_message)
+            compare_column.api_name = full_api_name_with_direction_status
+            compare_column.compare_result = CompareConst.SKIP
+            compare_column.compare_message = err_message
+            write_detail_csv(compare_column.to_column_value(), config.details_csv_path)
+            write_csv([[full_api_name_with_direction_status, CompareConst.SKIP, CompareConst.SKIP,  err_message]],
+                      config.result_csv_path)
+            continue
+        if row_gpu.empty:
+            logger.warning(f'This API : {full_api_name_with_direction_status} does not exist in the GPU data.')
+            continue
+        if len(row_gpu) > 1:
+            msg = f'This API : {full_api_name_with_direction_status} has multiple records in the GPU data.'
+            raise CompareException(CompareException.INVALID_DATA_ERROR, msg)
+        row_gpu = row_gpu.iloc[0]
+        new_status = CompareConst.SPACE
+        try:
+            new_status = get_api_status(row_npu, row_gpu, api_name, compare_column)
+        except Exception as err:
+            logger.error(f"Get api status error: {str(err)}")
+            compare_column.api_name = full_api_name_with_direction_status
+            compare_column.compare_result = CompareConst.SKIP
+            compare_column.compare_message = str(err)
+            write_detail_csv(compare_column.to_column_value(), config.details_csv_path)
+            write_csv([[full_api_name_with_direction_status, CompareConst.SKIP, CompareConst.SKIP, str(err)]],
+                      config.result_csv_path)
+            continue
+        write_detail_csv(compare_column.to_column_value(), config.details_csv_path)
+        if last_api_name is not None and api_full_name != last_api_name:
+            if last_api_dtype in API_PRECISION_COMPARE_UNSUPPORT_LIST:
+                message = unsupported_message
+                write_csv([[last_api_name, CompareConst.SKIP, CompareConst.SKIP, message]], config.result_csv_path)
+                print_test_success(last_api_name, CompareConst.SKIP, CompareConst.SKIP)
+                forward_status, backward_status = [], []
+                message = ''
+            else:
+                forward_result = get_api_checker_result(forward_status)
+                backward_result = get_api_checker_result(backward_status)
+                message += CompareMessage.get(last_api_name, "") if forward_result == CompareConst.ERROR else ""
+                write_csv([[last_api_name, forward_result, backward_result, message]], config.result_csv_path)
+                print_test_success(last_api_name, forward_result, backward_result)
+                forward_status, backward_status = [], []
+                message = ''
+        is_supported = row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] not in API_PRECISION_COMPARE_UNSUPPORT_LIST
+        last_api_name = api_full_name
+        last_api_dtype = row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE]
+        if not is_supported:
+            continue
+        if direction_status == 'forward':
+            forward_status.append(new_status)
+        elif direction_status == 'backward':
+            backward_status.append(new_status)
+        else:
+            logger.error(f"Invalid direction status: {direction_status}")
+    if last_api_name is not None:
+        if last_api_dtype in API_PRECISION_COMPARE_UNSUPPORT_LIST:
+            message = unsupported_message
+            write_csv([[last_api_name, CompareConst.SKIP, CompareConst.SKIP, message]], config.result_csv_path)
+            print_test_success(last_api_name, CompareConst.SKIP, CompareConst.SKIP)
+        else:
+            forward_result = get_api_checker_result(forward_status)
+            backward_result = get_api_checker_result(backward_status)
+            message += CompareMessage.get(last_api_name, "") if forward_result == CompareConst.ERROR else ""
+            write_csv([[last_api_name, forward_result, backward_result, message]], config.result_csv_path)
+            print_test_success(last_api_name, forward_result, backward_result)
+def get_api_status(row_npu, row_gpu, api_name, compare_column):
+    full_api_name_with_direction_status = row_npu[ApiPrecisionCompareColumn.API_NAME]
+    # 当前API的输出为空（例如反向过程中requires_grad=False）,跳过比对
+    if row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE].isspace():
+        compare_column.api_name = full_api_name_with_direction_status
+        compare_column.compare_result = CompareConst.SKIP
+        compare_column.compare_message = row_npu[ApiPrecisionCompareColumn.MESSAGE]
+        new_status = CompareConst.SKIP
+    else:
+        compare_column.api_name = full_api_name_with_direction_status
+        if api_name in thousandth_standard_api:
+            new_status = record_thousandth_threshold_result(compare_column, row_npu)
+        elif row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] not in BINARY_COMPARE_UNSUPPORT_LIST or \
+            api_name in binary_standard_api:
+            new_status = record_binary_consistency_result(api_name, compare_column, row_npu)
+        elif api_name in absolute_standard_api:
+            new_status = record_absolute_threshold_result(compare_column, row_npu)
+        elif api_name in ulp_standard_api and \
+            row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] in ULP_COMPARE_SUPPORT_LIST:
+            us = ULPStandard(full_api_name_with_direction_status, row_npu, row_gpu)
+            new_status = record_ulp_compare_result(compare_column, us)
+        elif row_npu[ApiPrecisionCompareColumn.DEVICE_DTYPE] in BENCHMARK_COMPARE_SUPPORT_LIST:
+            bs = BenchmarkStandard(full_api_name_with_direction_status, row_npu, row_gpu)
+            new_status = record_benchmark_compare_result(compare_column, bs)
+    return new_status
+def print_test_success(api_full_name, forward_result, backward_result):
+    is_fwd_success = (forward_result == CompareConst.PASS)
+    is_bwd_success = (backward_result == CompareConst.PASS or backward_result == CompareConst.SPACE)
+    logger.info(f"running api_full_name {api_full_name} compare, "
+                f"is_fwd_success: {is_fwd_success}, "
+                f"is_bwd_success: {is_bwd_success}")
+def check_error_rate(npu_error_rate):
+    return CompareConst.PASS if convert_str_to_float(npu_error_rate) == 0 else CompareConst.ERROR
+def get_absolute_threshold_result(row_npu):
+    inf_nan_error_ratio = convert_str_to_float(row_npu[ApiPrecisionCompareColumn.INF_NAN_ERROR_RATIO])
+    rel_err_ratio = convert_str_to_float(row_npu[ApiPrecisionCompareColumn.REL_ERR_RATIO])
+    abs_err_ratio = convert_str_to_float(row_npu[ApiPrecisionCompareColumn.ABS_ERR_RATIO])
+    inf_nan_result = CompareConst.PASS if inf_nan_error_ratio == 0 else CompareConst.ERROR
+    rel_err_result = CompareConst.PASS if rel_err_ratio == 0 else CompareConst.ERROR
+    abs_err_result = CompareConst.PASS if abs_err_ratio == 0 else CompareConst.ERROR
+    if CompareConst.ERROR in [inf_nan_result, rel_err_result, abs_err_result]:
+        absolute_threshold_result = CompareConst.ERROR
+    else:
+        absolute_threshold_result = CompareConst.PASS
+    return {
+        "inf_nan_error_ratio": inf_nan_error_ratio,
+        "inf_nan_result": inf_nan_result,
+        "rel_err_ratio": rel_err_ratio,
+        "rel_err_result": rel_err_result,
+        "abs_err_ratio": abs_err_ratio,
+        "abs_err_result": abs_err_result,
+        "absolute_threshold_result": absolute_threshold_result,
+    }
+def get_api_checker_result(status):
+    if not status:
+        return CompareConst.SPACE
+    if all(item == CompareConst.SKIP for item in status):
+        return CompareConst.SKIP
+    for const in (CompareConst.ERROR, CompareConst.WARNING):
+        if const in status:
+            return const
+    return CompareConst.PASS
+def check_csv_columns(columns, csv_type):
+    required_columns = ApiPrecisionCompareColumn.to_required_columns()
+    missing_columns = [column for column in required_columns if column not in columns]
+    if missing_columns:
+        msg = f"The following columns {','.join(missing_columns)} are missing in{csv_type}"
+        raise CompareException(CompareException.INVALID_DATA_ERROR, msg)
+def record_binary_consistency_result(api_name, compare_column, row_npu):
+    new_status = check_error_rate(row_npu[ApiPrecisionCompareColumn.ERROR_RATE])
+    compare_column.error_rate = row_npu[ApiPrecisionCompareColumn.ERROR_RATE]
+    compare_column.error_rate_status = new_status
+    compare_column.compare_result = new_status
+    compare_column.compare_algorithm = "二进制一致法"
+    message = ''
+    if compare_column.error_rate_status == CompareConst.ERROR:
+        message += "ERROR: 二进制一致错误率超过阈值\n"
+        message += CompareMessage.get(api_name, "")
+    compare_column.compare_message = message
+    return new_status
+def record_absolute_threshold_result(compare_column, row_npu):
+    absolute_threshold_result = get_absolute_threshold_result(row_npu)
+    compare_column.inf_nan_error_ratio = absolute_threshold_result.get("inf_nan_error_ratio")
+    compare_column.inf_nan_error_ratio_status = absolute_threshold_result.get("inf_nan_result")
+    compare_column.rel_err_ratio = absolute_threshold_result.get("rel_err_ratio")
+    compare_column.rel_err_ratio_status = absolute_threshold_result.get("rel_err_result")
+    compare_column.abs_err_ratio = absolute_threshold_result.get("abs_err_ratio")
+    compare_column.abs_err_ratio_status = absolute_threshold_result.get("abs_err_result")
+    compare_column.compare_result = absolute_threshold_result.get("absolute_threshold_result")
+    compare_column.compare_algorithm = "绝对阈值法"
+    message = ''
+    if compare_column.inf_nan_error_ratio_status == CompareConst.ERROR:
+        message += "ERROR: inf/nan错误率超过阈值\n"
+    if compare_column.rel_err_ratio_status == CompareConst.ERROR:
+        message += "ERROR: 相对误差错误率超过阈值\n"
+    if compare_column.abs_err_ratio_status == CompareConst.ERROR:
+        message += "ERROR: 绝对误差错误率超过阈值\n"
+    compare_column.compare_message = message
+    return compare_column.compare_result
+def record_benchmark_compare_result(compare_column, bs):
+    bs.get_result()
+    compare_column.small_value_err_ratio = bs.small_value_err_ratio
+    compare_column.small_value_err_status = bs.small_value_err_status
+    compare_column.rmse_ratio = bs.rmse_ratio
+    compare_column.rmse_status = bs.rmse_status
+    compare_column.max_rel_err_ratio = bs.max_rel_err_ratio
+    compare_column.max_rel_err_status = bs.max_rel_err_status
+    compare_column.mean_rel_err_ratio = bs.mean_rel_err_ratio
+    compare_column.mean_rel_err_status = bs.mean_rel_err_status
+    compare_column.eb_ratio = bs.eb_ratio
+    compare_column.eb_status = bs.eb_status
+    compare_column.compare_result = bs.final_result
+    compare_column.compare_algorithm = "标杆比对法"
+    compare_column.compare_message = bs.compare_message
+    for status_attr, messages in benchmark_message.items():
+        status_value = getattr(compare_column, status_attr)
+        if status_value in messages:
+            compare_column.compare_message += messages[status_value]
+    return compare_column.compare_result
+def record_ulp_compare_result(compare_column, us):
+    us.get_result()
+    compare_column.mean_ulp_err = us.mean_ulp_err
+    compare_column.ulp_err_proportion = us.ulp_err_proportion
+    compare_column.ulp_err_proportion_ratio = us.ulp_err_proportion_ratio
+    compare_column.ulp_err_status = us.ulp_err_status
+    compare_column.compare_result = us.ulp_err_status
+    compare_column.compare_algorithm = "ULP误差比对法"
+    compare_column.compare_message = us.compare_message
+    return compare_column.compare_result
+def check_thousandth_rate(thousandth_rate):
+    return CompareConst.PASS if convert_str_to_float(thousandth_rate) >= 0.999 else CompareConst.ERROR
+def record_thousandth_threshold_result(compare_column, row_npu):
+    new_status = check_thousandth_rate(row_npu[ApiPrecisionCompareColumn.REL_ERR_THOUSANDTH])
+    compare_column.rel_err_thousandth = row_npu[ApiPrecisionCompareColumn.REL_ERR_THOUSANDTH]
+    compare_column.rel_err_thousandth_status = new_status
+    compare_column.compare_result = new_status
+    compare_column.compare_algorithm = "双千指标法"
+    message = ''
+    if compare_column.rel_err_thousandth_status == CompareConst.ERROR:
+        message += "ERROR: 双千指标不达标\n"
+    compare_column.compare_message = message
+    return compare_column.compare_result
+def _api_precision_compare(parser=None):
+    if not parser:
+        parser = argparse.ArgumentParser()
+    _api_precision_compare_parser(parser)
+    args = parser.parse_args(sys.argv[1:])
+    _api_precision_compare_command(args)
+def _api_precision_compare_command(args):
+    npu_csv_path = get_validated_result_csv_path(args.npu_csv_path, 'detail')
+    gpu_csv_path = get_validated_result_csv_path(args.gpu_csv_path, 'detail')
+    out_path = os.path.realpath(args.out_path) if args.out_path else "./"
+    check_path_before_create(out_path)
+    create_directory(out_path)
+    out_path_checker = FileChecker(out_path, FileCheckConst.DIR, ability=FileCheckConst.WRITE_ABLE)
+    out_path = out_path_checker.common_check()
+    result_csv_path = os.path.join(out_path, API_PRECISION_COMPARE_RESULT_FILE_NAME)
+    details_csv_path = os.path.join(out_path, API_PRECISION_COMPARE_DETAILS_FILE_NAME)
+    compare_config = CompareConfig(npu_csv_path, gpu_csv_path, result_csv_path, details_csv_path)
+    api_precision_compare(compare_config)
+def _api_precision_compare_parser(parser):
+    parser.add_argument("-npu", "--npu_csv_path", dest="npu_csv_path", default="", type=str,
+                        help="<Required> , Accuracy_checking_details.csv generated on the NPU by using the "
+                             "api_accuracy_checker tool.",
+                        required=True)
+    parser.add_argument("-gpu", "--gpu_csv_path", dest="gpu_csv_path", default="", type=str,
+                        help="<Required> Accuracy_checking_details.csv generated on the GPU by using the "
+                             "api_accuracy_checker tool.",
+                        required=False)
+    parser.add_argument("-o", "--out_path", dest="out_path", default="", type=str,
+                        help="<optional> The api precision compare task result out path.",
+                        required=False)
+# Script entry point: run the comparison from the command line, then log completion.
+if __name__ == '__main__':
+    _api_precision_compare()
+    logger.info("Compare task completed.")

mindstudio-probe 1.0.1__py3-none-any.whl → 1.0.4__py3-none-any.whl

mindstudio-probe 1.0.1py3-none-any.whl → 1.0.4py3-none-any.whl