mindstudio-probe 1.0.1__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- mindstudio_probe-1.0.1.dist-info/LICENSE +201 -0
- mindstudio_probe-1.0.1.dist-info/METADATA +30 -0
- mindstudio_probe-1.0.1.dist-info/RECORD +228 -0
- mindstudio_probe-1.0.1.dist-info/WHEEL +5 -0
- mindstudio_probe-1.0.1.dist-info/entry_points.txt +2 -0
- mindstudio_probe-1.0.1.dist-info/top_level.txt +1 -0
- msprobe/README.md +182 -0
- msprobe/__init__.py +0 -0
- msprobe/config/README.md +397 -0
- msprobe/config/config.json +28 -0
- msprobe/config/img/free_benchmark.png +0 -0
- msprobe/core/common/const.py +241 -0
- msprobe/core/common/exceptions.py +88 -0
- msprobe/core/common/file_check.py +265 -0
- msprobe/core/common/log.py +55 -0
- msprobe/core/common/utils.py +516 -0
- msprobe/core/common_config.py +58 -0
- msprobe/core/data_dump/data_collector.py +140 -0
- msprobe/core/data_dump/data_processor/base.py +245 -0
- msprobe/core/data_dump/data_processor/factory.py +61 -0
- msprobe/core/data_dump/data_processor/pytorch_processor.py +346 -0
- msprobe/core/data_dump/json_writer.py +116 -0
- msprobe/core/data_dump/scope.py +178 -0
- msprobe/mindspore/__init__.py +1 -0
- msprobe/mindspore/debugger/__init__.py +0 -0
- msprobe/mindspore/debugger/debugger_config.py +51 -0
- msprobe/mindspore/debugger/precision_debugger.py +32 -0
- msprobe/mindspore/doc/dump.md +65 -0
- msprobe/mindspore/dump/__init__.py +0 -0
- msprobe/mindspore/dump/api_kbk_dump.py +55 -0
- msprobe/mindspore/dump/dump_tool_factory.py +38 -0
- msprobe/mindspore/dump/kernel_graph_dump.py +60 -0
- msprobe/mindspore/ms_config.py +78 -0
- msprobe/mindspore/overflow_check/__init__.py +0 -0
- msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +45 -0
- msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +32 -0
- msprobe/mindspore/task_handler_factory.py +21 -0
- msprobe/msprobe.py +67 -0
- msprobe/pytorch/__init__.py +4 -0
- msprobe/pytorch/advisor/advisor.py +124 -0
- msprobe/pytorch/advisor/advisor_const.py +59 -0
- msprobe/pytorch/advisor/advisor_result.py +58 -0
- msprobe/pytorch/api_accuracy_checker/.keep +0 -0
- msprobe/pytorch/api_accuracy_checker/__init__.py +0 -0
- msprobe/pytorch/api_accuracy_checker/common/.keep +0 -0
- msprobe/pytorch/api_accuracy_checker/common/__init__.py +0 -0
- msprobe/pytorch/api_accuracy_checker/common/config.py +50 -0
- msprobe/pytorch/api_accuracy_checker/common/utils.py +224 -0
- msprobe/pytorch/api_accuracy_checker/compare/__init__.py +0 -0
- msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +216 -0
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +545 -0
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +133 -0
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -0
- msprobe/pytorch/api_accuracy_checker/compare/compare.py +345 -0
- msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +74 -0
- msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +249 -0
- msprobe/pytorch/api_accuracy_checker/config.yaml +4 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/.keep +0 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/__init__.py +0 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +328 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +203 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +127 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +493 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +7 -0
- msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +5 -0
- msprobe/pytorch/common/__init__.py +2 -0
- msprobe/pytorch/common/compare_script.template +14 -0
- msprobe/pytorch/common/log.py +32 -0
- msprobe/pytorch/common/parse_json.py +37 -0
- msprobe/pytorch/common/utils.py +224 -0
- msprobe/pytorch/compare/acc_compare.py +1024 -0
- msprobe/pytorch/compare/distributed_compare.py +111 -0
- msprobe/pytorch/compare/highlight.py +100 -0
- msprobe/pytorch/compare/mapping.yaml +607 -0
- msprobe/pytorch/compare/match.py +36 -0
- msprobe/pytorch/compare/npy_compare.py +244 -0
- msprobe/pytorch/debugger/__init__.py +0 -0
- msprobe/pytorch/debugger/debugger_config.py +86 -0
- msprobe/pytorch/debugger/precision_debugger.py +95 -0
- msprobe/pytorch/doc/FAQ.md +193 -0
- msprobe/pytorch/doc/api_accuracy_checker.md +269 -0
- msprobe/pytorch/doc/atat/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +182 -0
- msprobe/pytorch/doc/dump.md +207 -0
- msprobe/pytorch/doc/img/BLOOM-7B_1.png +0 -0
- msprobe/pytorch/doc/img/BLOOM-7B_2.png +0 -0
- msprobe/pytorch/doc/img/BLOOM-7B_3.png +0 -0
- msprobe/pytorch/doc/img/BLOOM-7B_4.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_1.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_2.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_3.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_4.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_5.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_6.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_7.png +0 -0
- msprobe/pytorch/doc/img/GPT-3_8.png +0 -0
- msprobe/pytorch/doc/img/YOLOV5S_1.png +0 -0
- msprobe/pytorch/doc/img/YOLOV5S_2.png +0 -0
- msprobe/pytorch/doc/img/accuracy_checking_details.png +0 -0
- msprobe/pytorch/doc/img/accuracy_checking_result.png +0 -0
- msprobe/pytorch/doc/img/api_precision_compare_details.png +0 -0
- msprobe/pytorch/doc/img/api_precision_compare_result.png +0 -0
- msprobe/pytorch/doc/img/auto_analyze_log.png +0 -0
- msprobe/pytorch/doc/img/compare_result_pkl.png +0 -0
- msprobe/pytorch/doc/img/compare_result_pkl_md5.png.png +0 -0
- msprobe/pytorch/doc/img/cpu_info.png +0 -0
- msprobe/pytorch/doc/img/module_compare.png +0 -0
- msprobe/pytorch/doc/parse_tool.md +286 -0
- msprobe/pytorch/doc/ptdbg_ascend_compare.md +176 -0
- msprobe/pytorch/doc/ptdbg_ascend_overview.md +68 -0
- msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +381 -0
- msprobe/pytorch/doc/run_overflow_check.md +25 -0
- msprobe/pytorch/doc//321/205/320/254/320/270/321/207/342/225/221/342/224/220/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/206/320/277/320/244/321/205/320/277/342/225/243.md +90 -0
- msprobe/pytorch/free_benchmark/__init__.py +8 -0
- msprobe/pytorch/free_benchmark/common/__init__.py +0 -0
- msprobe/pytorch/free_benchmark/common/constant.py +67 -0
- msprobe/pytorch/free_benchmark/common/counter.py +72 -0
- msprobe/pytorch/free_benchmark/common/enums.py +37 -0
- msprobe/pytorch/free_benchmark/common/params.py +129 -0
- msprobe/pytorch/free_benchmark/common/utils.py +98 -0
- msprobe/pytorch/free_benchmark/compare/grad_saver.py +183 -0
- msprobe/pytorch/free_benchmark/compare/single_benchmark.py +104 -0
- msprobe/pytorch/free_benchmark/main.py +102 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/__init__.py +0 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +13 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +41 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/__init__.py +0 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +90 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +104 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +63 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +68 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +28 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +45 -0
- msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +19 -0
- msprobe/pytorch/free_benchmark/result_handlers/__init__.py +0 -0
- msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +203 -0
- msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +39 -0
- msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +24 -0
- msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +31 -0
- msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +170 -0
- msprobe/pytorch/functional/__init__.py +0 -0
- msprobe/pytorch/functional/data_processor.py +0 -0
- msprobe/pytorch/functional/dump_module.py +39 -0
- msprobe/pytorch/hook_module/__init__.py +1 -0
- msprobe/pytorch/hook_module/api_registry.py +161 -0
- msprobe/pytorch/hook_module/hook_module.py +109 -0
- msprobe/pytorch/hook_module/support_wrap_ops.yaml +1876 -0
- msprobe/pytorch/hook_module/utils.py +29 -0
- msprobe/pytorch/hook_module/wrap_aten.py +100 -0
- msprobe/pytorch/hook_module/wrap_distributed.py +75 -0
- msprobe/pytorch/hook_module/wrap_functional.py +108 -0
- msprobe/pytorch/hook_module/wrap_npu_custom.py +73 -0
- msprobe/pytorch/hook_module/wrap_tensor.py +72 -0
- msprobe/pytorch/hook_module/wrap_torch.py +88 -0
- msprobe/pytorch/hook_module/wrap_vf.py +64 -0
- msprobe/pytorch/module_processer.py +98 -0
- msprobe/pytorch/online_dispatch/__init__.py +20 -0
- msprobe/pytorch/online_dispatch/compare.py +236 -0
- msprobe/pytorch/online_dispatch/dispatch.py +274 -0
- msprobe/pytorch/online_dispatch/dump_compare.py +186 -0
- msprobe/pytorch/online_dispatch/single_compare.py +391 -0
- msprobe/pytorch/online_dispatch/torch_ops_config.yaml +50 -0
- msprobe/pytorch/online_dispatch/utils.py +187 -0
- msprobe/pytorch/parse.py +4 -0
- msprobe/pytorch/parse_tool/__init__.py +0 -0
- msprobe/pytorch/parse_tool/cli.py +32 -0
- msprobe/pytorch/parse_tool/lib/__init__.py +0 -0
- msprobe/pytorch/parse_tool/lib/compare.py +259 -0
- msprobe/pytorch/parse_tool/lib/config.py +51 -0
- msprobe/pytorch/parse_tool/lib/file_desc.py +31 -0
- msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -0
- msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -0
- msprobe/pytorch/parse_tool/lib/parse_tool.py +158 -0
- msprobe/pytorch/parse_tool/lib/utils.py +367 -0
- msprobe/pytorch/parse_tool/lib/visualization.py +90 -0
- msprobe/pytorch/pt_config.py +93 -0
- msprobe/pytorch/service.py +167 -0
- msprobe/test/core_ut/common/test_utils.py +345 -0
- msprobe/test/core_ut/data_dump/test_data_collector.py +47 -0
- msprobe/test/core_ut/data_dump/test_json_writer.py +183 -0
- msprobe/test/core_ut/data_dump/test_scope.py +151 -0
- msprobe/test/core_ut/test_common_config.py +152 -0
- msprobe/test/core_ut/test_file_check.py +218 -0
- msprobe/test/core_ut/test_log.py +109 -0
- msprobe/test/mindspore_ut/test_api_kbk_dump.py +51 -0
- msprobe/test/mindspore_ut/test_debugger_config.py +42 -0
- msprobe/test/mindspore_ut/test_dump_tool_factory.py +51 -0
- msprobe/test/mindspore_ut/test_kernel_graph_dump.py +66 -0
- msprobe/test/mindspore_ut/test_kernel_graph_overflow_check.py +63 -0
- msprobe/test/mindspore_ut/test_ms_config.py +69 -0
- msprobe/test/mindspore_ut/test_overflow_check_tool_factory.py +51 -0
- msprobe/test/mindspore_ut/test_precision_debugger.py +56 -0
- msprobe/test/mindspore_ut/test_task_handler_factory.py +58 -0
- msprobe/test/pytorch_ut/advisor/test_advisor.py +83 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/common/test_common_utils.py +108 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/common/test_config.py +39 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_algorithm.py +112 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_api_precision_compare.py +77 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare.py +125 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_column.py +10 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_utils.py +43 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/dump.json +179 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/forward.json +63 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_data_generate.py +99 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_multi_run_ut.py +115 -0
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_run_ut.py +72 -0
- msprobe/test/pytorch_ut/compare/test_acc_compare.py +17 -0
- msprobe/test/pytorch_ut/free_benchmark/perturbed_layers/test_perturbed_layser.py +105 -0
- msprobe/test/pytorch_ut/free_benchmark/result_handlers/test_result_handler.py +121 -0
- msprobe/test/pytorch_ut/free_benchmark/test_main.py +101 -0
- msprobe/test/pytorch_ut/functional/test_dump_module.py +15 -0
- msprobe/test/pytorch_ut/hook_module/test_api_registry.py +130 -0
- msprobe/test/pytorch_ut/hook_module/test_hook_module.py +42 -0
- msprobe/test/pytorch_ut/hook_module/test_wrap_aten.py +65 -0
- msprobe/test/pytorch_ut/hook_module/test_wrap_distributed.py +35 -0
- msprobe/test/pytorch_ut/hook_module/test_wrap_functional.py +20 -0
- msprobe/test/pytorch_ut/hook_module/test_wrap_tensor.py +35 -0
- msprobe/test/pytorch_ut/hook_module/test_wrap_torch.py +43 -0
- msprobe/test/pytorch_ut/hook_module/test_wrap_vf.py +11 -0
- msprobe/test/pytorch_ut/test_pt_config.py +69 -0
- msprobe/test/pytorch_ut/test_service.py +59 -0
- msprobe/test/resources/advisor.txt +3 -0
- msprobe/test/resources/compare_result_20230703104808.csv +9 -0
- msprobe/test/resources/compare_result_without_accuracy.csv +9 -0
- msprobe/test/resources/config.yaml +3 -0
- msprobe/test/resources/npu_test.pkl +8 -0
- msprobe/test/run_test.sh +30 -0
- msprobe/test/run_ut.py +58 -0
- msprobe/test/test_module_processer.py +64 -0
|
@@ -0,0 +1,493 @@
|
|
|
1
|
+
import argparse
|
|
2
|
+
import os
|
|
3
|
+
import csv
|
|
4
|
+
import re
|
|
5
|
+
import sys
|
|
6
|
+
import time
|
|
7
|
+
import gc
|
|
8
|
+
from collections import namedtuple
|
|
9
|
+
|
|
10
|
+
try:
|
|
11
|
+
import torch_npu
|
|
12
|
+
except ImportError:
|
|
13
|
+
is_gpu = True
|
|
14
|
+
current_device = "cuda"
|
|
15
|
+
else:
|
|
16
|
+
is_gpu = False
|
|
17
|
+
current_device = "npu"
|
|
18
|
+
import torch
|
|
19
|
+
from tqdm import tqdm
|
|
20
|
+
|
|
21
|
+
from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut_utils import Backward_Message, hf_32_standard_api
|
|
22
|
+
from msprobe.pytorch.api_accuracy_checker.run_ut.data_generate import gen_api_params, gen_args
|
|
23
|
+
from msprobe.pytorch.api_accuracy_checker.common.utils import get_json_contents, api_info_preprocess, \
|
|
24
|
+
initialize_save_path, UtDataProcessor
|
|
25
|
+
from msprobe.pytorch.api_accuracy_checker.compare.compare import Comparator
|
|
26
|
+
from msprobe.pytorch.api_accuracy_checker.compare.compare_column import CompareColumn
|
|
27
|
+
from msprobe.pytorch.hook_module.wrap_tensor import TensorOPTemplate
|
|
28
|
+
from msprobe.pytorch.hook_module.wrap_functional import FunctionalOPTemplate
|
|
29
|
+
from msprobe.pytorch.hook_module.wrap_torch import TorchOPTemplate
|
|
30
|
+
from msprobe.pytorch.api_accuracy_checker.common.config import msCheckerConfig
|
|
31
|
+
from msprobe.pytorch.common.parse_json import parse_json_info_forward_backward
|
|
32
|
+
from msprobe.core.common.file_check import FileOpen, FileChecker, \
|
|
33
|
+
change_mode, check_file_suffix, check_link, check_path_before_create, create_directory
|
|
34
|
+
from msprobe.pytorch.common.log import logger
|
|
35
|
+
from msprobe.core.common.const import Const, FileCheckConst, CompareConst
|
|
36
|
+
|
|
37
|
+
# Timestamp taken once at import time; it is embedded in every output name below
# so that all artifacts of one run share the same suffix.
current_time = time.strftime("%Y%m%d%H%M%S")
UT_ERROR_DATA_DIR = f"ut_error_data{current_time}"
RESULT_FILE_NAME = f"accuracy_checking_result_{current_time}.csv"
DETAILS_FILE_NAME = f"accuracy_checking_details_{current_time}.csv"

# Bundle of everything run_ut() reads from its ``config`` argument.
RunUTConfig = namedtuple(
    'RunUTConfig',
    [
        'forward_content',
        'backward_content',
        'result_csv_path',
        'details_csv_path',
        'save_error_data',
        'is_continue_run_ut',
        'real_data_path',
    ],
)

# APIs for which the backward pass is never executed.
not_backward_list = ['repeat_interleave']
# APIs whose tensor inputs are passed on without calling detach().
not_detach_set = {'resize_', 'resize_as_', 'set_', 'transpose_', 't_', 'squeeze_', 'unsqueeze_'}
# APIs whose benchmark inputs keep their original dtype.
not_raise_dtype_set = {'type_as'}

# Source dtype -> higher-precision dtype used for the benchmark inputs.
RAISE_PRECISION = {
    torch.float16: torch.float32,
    torch.bfloat16: torch.float32,
    torch.float32: torch.float64
}

tqdm_params = {
    'smoothing': 0,  # smoothing factor for the estimated remaining time, range 0 to 1
    'desc': 'Processing',  # description text shown in front of the progress bar
    'leave': True,  # keep the progress bar on screen once iteration finishes
    'ncols': 75,  # fixed width of the progress bar
    'mininterval': 0.1,  # minimum number of seconds between progress bar updates
    'maxinterval': 1.0,  # maximum number of seconds between progress bar updates
    'miniters': 1,  # minimum number of iterations between progress bar updates
    'ascii': None,  # pick ASCII or Unicode characters automatically based on the environment
    'unit': 'it',  # iteration unit
    'unit_scale': True,  # scale automatically according to the unit
    'dynamic_ncols': True,  # resize the progress bar dynamically to fit the console
    'bar_format': '{l_bar}{bar}| {n}/{total_fmt} [{elapsed}<{remaining}, {rate_fmt}]'  # custom output format
}
|
|
67
|
+
|
|
68
|
+
|
|
69
|
+
def exec_api(api_type, api_name, args, kwargs):
    """Run one API through the hook template matching its family.

    Args:
        api_type: API family name; one of "Functional", "Tensor" or "Torch".
        api_name: API name handed to the template constructor.
        args: Positional arguments forwarded to the template's ``forward``.
        kwargs: Keyword arguments forwarded to the template's ``forward``.

    Returns:
        Whatever the selected template's ``forward`` call returns.

    Raises:
        ValueError: If ``api_type`` is not one of the supported families.
            Previously this case surfaced as an UnboundLocalError on the
            final ``return`` because no branch had assigned the result.
    """
    if api_type == "Functional":
        api = FunctionalOPTemplate(api_name, str, False)
    elif api_type == "Tensor":
        api = TensorOPTemplate(api_name, str, False)
    elif api_type == "Torch":
        api = TorchOPTemplate(api_name, str, False)
    else:
        raise ValueError(
            f"Unsupported api type '{api_type}' for api '{api_name}'; "
            f"expected one of 'Functional', 'Tensor', 'Torch'."
        )
    return api.forward(*args, **kwargs)
|
|
80
|
+
|
|
81
|
+
|
|
82
|
+
def deal_detach(arg, to_detach=True):
    """Return ``arg.detach()`` when ``to_detach`` is truthy, otherwise ``arg`` itself."""
    if not to_detach:
        return arg
    return arg.detach()
|
|
84
|
+
|
|
85
|
+
|
|
86
|
+
def raise_bench_data_dtype(api_name, arg, raise_dtype=None):
    """Convert a benchmark input to ``raise_dtype`` when a conversion applies.

    Args:
        api_name: Name of the API under test.
        arg: Benchmark input; must expose ``dtype`` and ``type``.
        raise_dtype: Target dtype, or ``None`` to request no conversion.

    Returns:
        ``arg`` unchanged when the API is listed in ``hf_32_standard_api`` and
        the input is float32, when ``raise_dtype`` is ``None``, when the input
        dtype is not a key of ``RAISE_PRECISION``, or when the input already
        has ``raise_dtype``; otherwise ``arg.type(raise_dtype)``.
    """
    # float32 inputs of the hf32-standard APIs are compared as they are.
    if api_name in hf_32_standard_api and arg.dtype == torch.float32:
        return arg
    needs_cast = raise_dtype is not None and arg.dtype in RAISE_PRECISION and raise_dtype != arg.dtype
    return arg.type(raise_dtype) if needs_cast else arg
|
|
101
|
+
|
|
102
|
+
|
|
103
|
+
def generate_device_params(input_args, input_kwargs, need_backward, api_name):
    """Build the device-side copies of an API's arguments.

    Args:
        input_args: Positional arguments; lists and tuples are walked recursively.
        input_kwargs: Keyword arguments as a dict.
        need_backward: Whether a backward pass will be run afterwards.
        api_name: API name; names in ``not_detach_set`` disable detaching.

    Returns:
        A ``(device_args, device_kwargs)`` pair in which every tensor has been
        cloned and moved to ``current_device``. Non-tensor leaves are returned
        as they are.
    """
    def _to_device(value, detach):
        if isinstance(value, (list, tuple)):
            return type(value)(_to_device(item, detach) for item in value)
        if not isinstance(value, torch.Tensor):
            return value
        moved = deal_detach(value.clone(), detach).to(current_device)
        if not (need_backward and value.requires_grad):
            return moved
        leaf = moved.requires_grad_()
        # Multiply by one to obtain a tensor produced by an op, then ask
        # autograd to keep the gradient of that result after backward.
        tracked = (leaf * 1).type_as(leaf)
        tracked.retain_grad()
        return tracked

    detach_inputs = api_name not in not_detach_set
    device_args = _to_device(input_args, detach_inputs)
    device_kwargs = {}
    for key, value in input_kwargs.items():
        # The "out" keyword argument is never detached.
        device_kwargs[key] = _to_device(value, key != "out" and detach_inputs)
    return device_args, device_kwargs
|
|
124
|
+
|
|
125
|
+
|
|
126
|
+
def generate_cpu_params(input_args, input_kwargs, need_backward, api_name):
    """Build the benchmark copies of an API's arguments.

    The dtypes of the tensor inputs decide a single target dtype: none found
    means no conversion, exactly one means its ``RAISE_PRECISION`` entry, and
    several mean ``torch.float32``. APIs in ``not_raise_dtype_set`` are never
    converted.

    Args:
        input_args: Positional arguments; lists and tuples are walked recursively.
        input_kwargs: Keyword arguments as a dict.
        need_backward: Whether a backward pass will be run afterwards.
        api_name: API name; also consulted for the detach and dtype exemptions.

    Returns:
        A ``(cpu_args, cpu_kwargs)`` pair with every tensor cloned and passed
        through ``raise_bench_data_dtype``.
    """
    def _to_cpu(value, detach, raise_dtype=None):
        if isinstance(value, (list, tuple)):
            return type(value)(_to_cpu(item, detach, raise_dtype=raise_dtype) for item in value)
        if not isinstance(value, torch.Tensor):
            return value
        promoted = raise_bench_data_dtype(api_name, value.clone(), raise_dtype=raise_dtype)
        bench = deal_detach(promoted, detach)
        if not (need_backward and value.requires_grad):
            return bench
        leaf = bench.requires_grad_()
        # Multiply by one to obtain a tensor produced by an op, then ask
        # autograd to keep the gradient of that result after backward.
        tracked = (leaf * 1).type_as(leaf)
        tracked.retain_grad()
        return tracked

    def _needs_promotion(tensor, check_kwargs=False):
        if tensor.dtype in RAISE_PRECISION:
            return True
        # With RAISE_PRECISION as defined in this module, half and bfloat16
        # are already covered by the test above; kept for parity.
        if check_kwargs and tensor.dtype in [torch.half, torch.bfloat16]:
            return True
        return False

    def _collect_dtypes(value, check_kwargs=False):
        if isinstance(value, (list, tuple)):
            found = set()
            for item in value:
                found |= _collect_dtypes(item, check_kwargs=check_kwargs)
            return found
        if isinstance(value, torch.Tensor) and _needs_promotion(value, check_kwargs):
            return {value.dtype}
        # Dicts are only descended into when scanning keyword arguments.
        if isinstance(value, dict) and check_kwargs:
            found = set()
            for item in value.values():
                found |= _collect_dtypes(item, check_kwargs=True)
            return found
        return set()

    candidate_dtypes = _collect_dtypes(input_args)
    candidate_dtypes.update(_collect_dtypes(input_kwargs, check_kwargs=True))
    if not candidate_dtypes:
        raise_dtype = None
    elif len(candidate_dtypes) == 1:
        raise_dtype = RAISE_PRECISION.get(next(iter(candidate_dtypes)), torch.float32)
    else:
        raise_dtype = torch.float32
    if api_name in not_raise_dtype_set:
        raise_dtype = None

    detach_inputs = api_name not in not_detach_set
    cpu_args = _to_cpu(input_args, detach_inputs, raise_dtype=raise_dtype)
    cpu_kwargs = {}
    for key, value in input_kwargs.items():
        # The "out" keyword argument is never detached.
        cpu_kwargs[key] = _to_cpu(value, key != "out" and detach_inputs, raise_dtype=raise_dtype)
    return cpu_args, cpu_kwargs
|
|
172
|
+
|
|
173
|
+
|
|
174
|
+
def run_ut(config):
    """Run the accuracy check for every API in ``config.forward_content``.

    An API is skipped when its full name already appears in the first column
    of the result csv, when ``is_unsupported_api`` rejects it, or when a white
    list is configured and the API name is not on it. Any exception raised
    while running or comparing one API is logged and recorded as a SKIP result
    so that the remaining APIs still run. The device cache is emptied and the
    garbage collector is run after every processed API.

    Args:
        config: Object providing ``forward_content``, ``backward_content``,
            ``result_csv_path``, ``details_csv_path``, ``save_error_data``,
            ``is_continue_run_ut`` and ``real_data_path`` (see ``RunUTConfig``).
    """
    logger.info("start UT test")
    logger.info(f"UT task result will be saved in {config.result_csv_path}")
    logger.info(f"UT task details will be saved in {config.details_csv_path}")
    if config.save_error_data:
        error_data_path = os.path.abspath(os.path.join(msCheckerConfig.error_data_path, UT_ERROR_DATA_DIR))
        logger.info(f"UT task error_datas will be saved in {error_data_path}")
    compare = Comparator(config.result_csv_path, config.details_csv_path, config.is_continue_run_ut)
    with FileOpen(config.result_csv_path, 'r') as file:
        csv_reader = csv.reader(file)
        # Skip the first row; tolerate an empty file and blank rows instead of
        # failing before any API has been run.
        next(csv_reader, None)
        api_name_set = {row[0] for row in csv_reader if row}
    # Build the white-list set once rather than on every iteration.
    white_list = set(msCheckerConfig.white_list) if msCheckerConfig.white_list else None
    for api_full_name, api_info_dict in tqdm(config.forward_content.items(), **tqdm_params):
        if api_full_name in api_name_set:
            continue
        if is_unsupported_api(api_full_name):  # TODO run_ut does not support to the npu fusion api and distributed api
            continue
        try:
            if white_list is not None:
                [_, api_name, _] = api_full_name.split(Const.SEP)
                if api_name not in white_list:
                    continue
            data_info = run_torch_api(api_full_name, config.real_data_path, config.backward_content, api_info_dict)
            is_fwd_success, is_bwd_success = compare.compare_output(api_full_name, data_info)
            if config.save_error_data:
                do_save_error_data(api_full_name, data_info, is_fwd_success, is_bwd_success)
        except Exception as err:
            # The failure may itself come from a full name that does not split
            # into three parts, so the handler must not repeat the strict
            # unpacking: a second exception here would abort the whole run.
            name_parts = api_full_name.split(Const.SEP)
            api_name = name_parts[1] if len(name_parts) > 1 else api_full_name
            if "expected scalar type Long" in str(err):
                logger.warning(f"API {api_name} not support int32 tensor in CPU, please add {api_name} to CONVERT_API "
                               f"'int32_to_int64' list in accuracy_tools/api_accuracy_check/common/utils.py file.")
            else:
                logger.error(f"Run {api_full_name} UT Error: {str(err)}")
            err_column = CompareColumn()
            fwd_compare_alg_results = err_column.to_column_value(CompareConst.SKIP, str(err))
            result_info = (api_full_name, CompareConst.SKIP, CompareConst.SKIP, [fwd_compare_alg_results], None, 0)
            compare.record_results(result_info)
        finally:
            if is_gpu:
                torch.cuda.empty_cache()
            else:
                torch.npu.empty_cache()
            gc.collect()
    change_mode(compare.save_path, FileCheckConst.DATA_FILE_AUTHORITY)
    change_mode(compare.detail_save_path, FileCheckConst.DATA_FILE_AUTHORITY)
    compare.print_pretest_result()
|
|
220
|
+
|
|
221
|
+
|
|
222
|
+
def is_unsupported_api(api_name):
    """Tell whether an API belongs to a family that run_ut does not execute.

    The family is the part of ``api_name`` before the first ``Const.SEP``.
    An info message is logged when the family is ``Const.NPU`` or
    ``Const.DISTRIBUTED``.

    Returns:
        ``True`` for those two families, ``False`` otherwise.
    """
    family = api_name.split(Const.SEP)[0]
    if family not in [Const.NPU, Const.DISTRIBUTED]:
        return False
    logger.info(f"{family} api is not supported for run ut. SKIP.")
    return True
|
|
228
|
+
|
|
229
|
+
|
|
230
|
+
def do_save_error_data(api_full_name, data_info, is_fwd_success, is_bwd_success):
    """Save the inputs and outputs of an API whose forward or backward check failed.

    Nothing is written when both checks succeeded. Otherwise each forward
    input element, the forward outputs, the backward input and the backward
    outputs are handed to a ``UtDataProcessor`` rooted at the error-data
    directory of this run.

    Args:
        api_full_name: Full API name, used as the prefix of every saved item.
        data_info: Object exposing ``in_fwd_data_list``, ``bench_out``,
            ``device_out``, ``grad_in``, ``bench_grad_out`` and ``device_grad_out``.
        is_fwd_success: Result of the forward comparison.
        is_bwd_success: Result of the backward comparison.
    """
    if is_fwd_success and is_bwd_success:
        return
    processor = UtDataProcessor(os.path.join(msCheckerConfig.error_data_path, UT_ERROR_DATA_DIR))
    for fwd_input in data_info.in_fwd_data_list:
        processor.save_tensors_in_element(api_full_name + '.forward.input', fwd_input)
    # (name suffix, data_info attribute) pairs, saved in this order.
    remaining = (
        ('.forward.output.bench', 'bench_out'),
        ('.forward.output.device', 'device_out'),
        ('.backward.input', 'grad_in'),
        ('.backward.output.bench', 'bench_grad_out'),
        ('.backward.output.device', 'device_grad_out'),
    )
    for suffix, attribute in remaining:
        processor.save_tensors_in_element(api_full_name + suffix, getattr(data_info, attribute))
|
|
240
|
+
|
|
241
|
+
|
|
242
|
+
def run_torch_api(api_full_name, real_data_path, backward_content, api_info_dict):
    """Execute one API on the benchmark side and on the device, optionally with backward.

    Args:
        api_full_name: Full API name; it must split on ``Const.SEP`` into
            exactly three parts, of which the first two are the API type and name.
        real_data_path: Passed through to the argument generators.
        backward_content: Mapping of full API names to backward information;
            an API takes part in backward only when it is a key here.
        api_info_dict: Recorded forward information of the API.

    Returns:
        A ``UtDataInfo`` built from the benchmark and device gradients, the
        device and benchmark forward outputs, the benchmark grad input, the
        generated forward inputs and the accumulated backward message.
    """
    api_type, api_name, _ = api_full_name.split(Const.SEP)
    args, kwargs, need_grad = get_api_info(api_info_dict, api_name, real_data_path)
    # Holds the same objects that are used below, so the removal of "device"
    # from kwargs is visible through this list as well.
    in_fwd_data_list = [args, kwargs]
    backward_message = ''
    if not need_grad:
        logger.warning("%s %s" % (api_full_name, Backward_Message.UNSUPPORT_BACKWARD_MESSAGE))
        backward_message += Backward_Message.UNSUPPORT_BACKWARD_MESSAGE
    if api_name in not_backward_list:
        need_grad = False
        logger.warning("%s %s" % (api_full_name, Backward_Message.NO_BACKWARD_RESULT_MESSAGE))
        backward_message += Backward_Message.NO_BACKWARD_RESULT_MESSAGE
    need_backward = (api_full_name in backward_content) and need_grad
    # Only a truthy "device" entry is dropped.
    if kwargs.get("device"):
        del kwargs["device"]

    cpu_args, cpu_kwargs = generate_cpu_params(args, kwargs, need_backward, api_name)
    device_args, device_kwargs = generate_device_params(args, kwargs, need_backward, api_name)
    out = exec_api(api_type, api_name, cpu_args, cpu_kwargs)
    device_out = exec_api(api_type, api_name, device_args, device_kwargs)

    # Per-API settings live in a json file next to this module.
    module_dir = os.path.dirname(os.path.realpath(__file__))
    api_setting_dict = get_json_contents(os.path.join(module_dir, "torch_ut_setting.json"))
    api_setting = api_setting_dict.get(api_name)
    grad_index = api_setting.get('grad_index') if api_setting is not None else None

    bench_grad = None
    bench_grad_out, device_grad_out = None, None
    if need_backward:
        if need_to_backward(grad_index, out):
            backward_args = backward_content[api_full_name].get("grad_output")
            grad = gen_args(backward_args, api_name, real_data_path=real_data_path)[0]
            bench_grad, _ = generate_cpu_params(grad, {}, False, api_name)
            bench_grad_out = run_backward(cpu_args, bench_grad, grad_index, out)
            device_grad = grad.clone().detach().to(current_device)
            device_grad_out = run_backward(device_args, device_grad, grad_index, device_out)
        else:
            backward_message += Backward_Message.MULTIPLE_BACKWARD_MESSAGE

    return UtDataInfo(bench_grad_out, device_grad_out, device_out, out, bench_grad, in_fwd_data_list, backward_message)
|
|
286
|
+
|
|
287
|
+
|
|
288
|
+
def get_api_info(api_info_dict, api_name, real_data_path):
    """Generate the call arguments of an API and decide whether gradients are needed.

    Gradients are not needed when the preprocessed info has a non-empty
    ``input_kwargs`` entry containing the key ``"out"``.

    Returns:
        A ``(args, kwargs, need_grad)`` tuple.
    """
    convert_type, api_info_dict = api_info_preprocess(api_name, api_info_dict)
    input_kwargs = api_info_dict.get("input_kwargs")
    need_grad = not (input_kwargs and "out" in input_kwargs)
    args, kwargs = gen_api_params(api_info_dict, api_name, need_grad, convert_type, real_data_path)
    return args, kwargs, need_grad
|
|
295
|
+
|
|
296
|
+
|
|
297
|
+
def need_to_backward(grad_index, out):
    """Return ``False`` only when ``out`` is a list or tuple and no ``grad_index`` is given."""
    has_multiple_outputs = isinstance(out, (list, tuple))
    return not (grad_index is None and has_multiple_outputs)
|
|
301
|
+
|
|
302
|
+
|
|
303
|
+
def run_backward(args, grad, grad_index, out):
    """Back-propagate ``grad`` through ``out`` and collect the input gradients.

    Args:
        args: Iterable of forward arguments; only its direct tensor members
            are inspected.
        grad: Gradient passed to ``backward``.
        grad_index: Index of the output to differentiate, or ``None`` to call
            ``backward`` on ``out`` itself.
        out: Forward output, or an indexable collection of outputs.

    Returns:
        List holding the ``.grad`` of every tensor in ``args``, in order.
    """
    target = out if grad_index is None else out[grad_index]
    target.backward(grad)
    return [arg.grad for arg in args if isinstance(arg, torch.Tensor)]
|
|
315
|
+
|
|
316
|
+
|
|
317
|
+
def initialize_save_error_data():
    """Create and validate the configured error-data directory, then set up this run's save path.

    The path comes from ``msCheckerConfig.error_data_path``. It is checked and
    created, validated as a writable directory, and the validated path is
    passed to ``initialize_save_path`` together with ``UT_ERROR_DATA_DIR``.
    """
    configured_path = msCheckerConfig.error_data_path
    check_path_before_create(configured_path)
    create_directory(configured_path)
    checker = FileChecker(msCheckerConfig.error_data_path, FileCheckConst.DIR,
                          ability=FileCheckConst.WRITE_ABLE)
    initialize_save_path(checker.common_check(), UT_ERROR_DATA_DIR)
|
|
325
|
+
|
|
326
|
+
|
|
327
|
+
def get_validated_result_csv_path(result_csv_path, mode):
    """Validate a csv path supplied for continuing an interrupted run.

    Args:
        result_csv_path: Path of the csv file to validate.
        mode: ``'result'`` or ``'detail'``. In ``'result'`` mode the file name
            must additionally look like
            ``accuracy_checking_result_<14 digits>.csv``.

    Returns:
        The path returned by the file checker.

    Raises:
        ValueError: If ``mode`` is neither ``'result'`` nor ``'detail'``, or
            if the file name does not match the expected pattern in
            ``'result'`` mode.
    """
    if mode != 'result' and mode != 'detail':
        raise ValueError("The csv mode must be result or detail")
    checker = FileChecker(result_csv_path, FileCheckConst.FILE, ability=FileCheckConst.READ_WRITE_ABLE,
                          file_type=FileCheckConst.CSV_SUFFIX)
    checked_path = checker.common_check()
    if mode != 'result':
        return checked_path
    file_name = os.path.basename(checked_path)
    if re.match(r"^accuracy_checking_result_\d{14}\.csv$", file_name) is None:
        raise ValueError("When continue run ut, please do not modify the result csv name.")
    return checked_path
|
|
339
|
+
|
|
340
|
+
|
|
341
|
+
def get_validated_details_csv_path(validated_result_csv_path):
    """Derive and validate the details csv path that belongs to a result csv.

    The details file sits in the same directory as the result file, and its
    name is the result file name with every ``'result'`` replaced by
    ``'details'``.

    Returns:
        The path returned by the file checker for the derived details file.
    """
    parent_dir, result_csv_name = os.path.split(validated_result_csv_path)
    details_csv_path = os.path.join(parent_dir, result_csv_name.replace('result', 'details'))
    checker = FileChecker(details_csv_path, FileCheckConst.FILE,
                          ability=FileCheckConst.READ_WRITE_ABLE, file_type=FileCheckConst.CSV_SUFFIX)
    return checker.common_check()
|
|
349
|
+
|
|
350
|
+
|
|
351
|
+
def _run_ut_parser(parser):
|
|
352
|
+
parser.add_argument("-api_info", "--api_info_file", dest="api_info_file", default="", type=str,
|
|
353
|
+
help="<Required> The api param tool result file: generate from api param tool, "
|
|
354
|
+
"a json file.",
|
|
355
|
+
required=True)
|
|
356
|
+
parser.add_argument("-o", "--out_path", dest="out_path", default="", type=str,
|
|
357
|
+
help="<optional> The ut task result out path.",
|
|
358
|
+
required=False)
|
|
359
|
+
parser.add_argument('-save_error_data', dest="save_error_data", action="store_true",
|
|
360
|
+
help="<optional> Save compare failed api output.", required=False)
|
|
361
|
+
parser.add_argument("-j", "--jit_compile", dest="jit_compile", action="store_true",
|
|
362
|
+
help="<optional> whether to turn on jit compile", required=False)
|
|
363
|
+
|
|
364
|
+
class UniqueDeviceAction(argparse.Action):
|
|
365
|
+
def __call__(self, parser, namespace, values, option_string=None):
|
|
366
|
+
unique_values = set(values)
|
|
367
|
+
if len(values) != len(unique_values):
|
|
368
|
+
parser.error("device id must be unique")
|
|
369
|
+
for device_id in values:
|
|
370
|
+
if not 0 <= device_id:
|
|
371
|
+
parser.error("device id must be greater than or equal to 0")
|
|
372
|
+
setattr(namespace, self.dest, values)
|
|
373
|
+
|
|
374
|
+
parser.add_argument("-d", "--device", dest="device_id", nargs='+', type=int,
|
|
375
|
+
help="<optional> set device id to run ut, must be unique and in range 0-7",
|
|
376
|
+
default=[0], required=False, action=UniqueDeviceAction)
|
|
377
|
+
parser.add_argument("-csv_path", "--result_csv_path", dest="result_csv_path", default="", type=str,
|
|
378
|
+
help="<optional> The path of accuracy_checking_result_{timestamp}.csv, "
|
|
379
|
+
"when run ut is interrupted, enter the file path to continue run ut.",
|
|
380
|
+
required=False)
|
|
381
|
+
parser.add_argument("-real_data_path", dest="real_data_path", nargs="?", const="", default="", type=str,
|
|
382
|
+
help="<optional> In real data mode, the root directory for storing real data "
|
|
383
|
+
"must be configured.",
|
|
384
|
+
required=False)
|
|
385
|
+
parser.add_argument("-f", "--filter_api", dest="filter_api", action="store_true",
|
|
386
|
+
help="<optional> Whether to filter the api in the api_info_file.", required=False)
|
|
387
|
+
|
|
388
|
+
|
|
389
|
+
def preprocess_forward_content(forward_content):
    """Drop forward entries that repeat an earlier call of the same API.

    Keys are grouped by their "base key", i.e. everything before the last
    ``Const.SEP``. Within a group, an entry is treated as a duplicate when both
    of the following equal those of an entry that was already kept:

    * its positional args that are dicts, with the ``'Max'`` and ``'Min'``
      fields removed (non-dict positional args are ignored), and
    * its ``'kwargs'`` value, compared as is.

    Args:
        forward_content: Mapping of API call name to a dict that provides the
            ``'args'`` and ``'kwargs'`` entries.

    Returns:
        A new dict holding only the first occurrence of each distinct call, in
        the original iteration order. Values are the original objects.

    Raises:
        KeyError: If an entry lacks ``'args'`` or ``'kwargs'``.
    """
    processed_content = {}
    base_keys_variants = {}
    arg_cache = {}

    for key, value in forward_content.items():
        base_key = key.rsplit(Const.SEP, 1)[0]

        if key not in arg_cache:
            filtered_new_args = [
                {k: v for k, v in arg.items() if k not in ('Max', 'Min')}
                for arg in value['args'] if isinstance(arg, dict)
            ]
            arg_cache[key] = (filtered_new_args, value['kwargs'])
        filtered_new_args, new_kwargs = arg_cache[key]

        variants = base_keys_variants.get(base_key)
        if variants is None:
            # First call seen for this API: always kept.
            processed_content[key] = value
            base_keys_variants[base_key] = {key}
            continue

        is_duplicate = False
        for variant in variants:
            # dict.get() returns None instead of raising KeyError, so the
            # missing-entry case is handled explicitly and the variant skipped
            # rather than comparing against unbound or stale values.
            cached = arg_cache.get(variant)
            if cached is None:
                logger.error(f"KeyError: {variant!r} when processing {key}")
                continue
            existing_args, existing_kwargs = cached
            if existing_args == filtered_new_args and existing_kwargs == new_kwargs:
                is_duplicate = True
                break

        if not is_duplicate:
            processed_content[key] = value
            variants.add(key)

    return processed_content
|
|
425
|
+
|
|
426
|
+
|
|
427
|
+
def _run_ut(parser=None):
    """Parse ``sys.argv`` and run the UT command.

    Args:
        parser: Optional parser to use. When it is falsy, a fresh
            ``argparse.ArgumentParser`` is created and populated through
            ``_run_ut_parser``; a parser passed in is used as it is.
    """
    if parser:
        active_parser = parser
    else:
        active_parser = argparse.ArgumentParser()
        _run_ut_parser(active_parser)
    cli_args = active_parser.parse_args(sys.argv[1:])
    run_ut_command(cli_args)
|
|
433
|
+
|
|
434
|
+
|
|
435
|
+
def run_ut_command(args):
    """Run the UT accuracy check described by the parsed command-line ``args``.

    The function selects the device, validates the api info file and the
    output directory, parses the dump json, optionally filters duplicated
    forward calls, resolves the result/details csv paths (fresh ones under the
    output directory, or the ones of an interrupted run), optionally prepares
    the error-data directory, and finally calls ``run_ut``.

    Args:
        args: Namespace providing ``jit_compile``, ``device_id``,
            ``api_info_file``, ``out_path``, ``save_error_data``,
            ``filter_api`` and ``result_csv_path``.

    Raises:
        NotImplementedError: If selecting the device fails; the original
            exception is chained as the cause.
    """
    global UT_ERROR_DATA_DIR

    if not is_gpu:
        torch.npu.set_compile_mode(jit_compile=args.jit_compile)
    # Only the first requested device id is used here.
    used_device = current_device + ":" + str(args.device_id[0])
    try:
        if is_gpu:
            torch.cuda.set_device(used_device)
        else:
            torch.npu.set_device(used_device)
    except Exception as error:
        logger.error(f"Set device id failed. device id is: {args.device_id}")
        raise NotImplementedError from error

    check_link(args.api_info_file)
    api_info = os.path.realpath(args.api_info_file)
    check_file_suffix(api_info, FileCheckConst.JSON_SUFFIX)

    out_path = os.path.realpath(args.out_path) if args.out_path else "./"
    check_path_before_create(out_path)
    create_directory(out_path)
    out_path_checker = FileChecker(out_path, FileCheckConst.DIR, ability=FileCheckConst.WRITE_ABLE)
    out_path = out_path_checker.common_check()

    save_error_data = args.save_error_data
    forward_content, backward_content, real_data_path = parse_json_info_forward_backward(api_info)
    if args.filter_api:
        logger.info("Start filtering the api in the forward_input_file.")
        forward_content = preprocess_forward_content(forward_content)
        logger.info("Finish filtering the api in the forward_input_file.")

    result_csv_path = os.path.join(out_path, RESULT_FILE_NAME)
    details_csv_path = os.path.join(out_path, DETAILS_FILE_NAME)
    if args.result_csv_path:
        # Continue an interrupted run: reuse the existing csv files.
        result_csv_path = get_validated_result_csv_path(args.result_csv_path, 'result')
        details_csv_path = get_validated_details_csv_path(result_csv_path)

    if save_error_data:
        if args.result_csv_path:
            # Take the timestamp from the file name only. Splitting the whole
            # path on '.' breaks as soon as a directory name contains a dot.
            result_csv_stem = os.path.splitext(os.path.basename(result_csv_path))[0]
            time_info = result_csv_stem.split('_')[-1]
            UT_ERROR_DATA_DIR = 'ut_error_data' + time_info
        initialize_save_error_data()

    run_ut_config = RunUTConfig(forward_content, backward_content, result_csv_path, details_csv_path,
                                save_error_data, args.result_csv_path, real_data_path)
    run_ut(run_ut_config)
|
|
476
|
+
|
|
477
|
+
|
|
478
|
+
class UtDataInfo:
    """Plain container for the data of one UT run.

    Every constructor argument is stored unchanged on the attribute of the
    same name; ``rank`` defaults to 0.
    """

    def __init__(self, bench_grad, device_grad, device_output, bench_output, grad_in, in_fwd_data_list,
                 backward_message, rank=0):
        # Gradients of the benchmark and of the device under test.
        self.bench_grad, self.device_grad = bench_grad, device_grad
        # Outputs of the device under test and of the benchmark.
        self.device_output, self.bench_output = device_output, bench_output
        self.grad_in = grad_in
        self.in_fwd_data_list = in_fwd_data_list
        self.backward_message = backward_message
        self.rank = rank
|
|
489
|
+
|
|
490
|
+
|
|
491
|
+
# Script entry point: run the UT flow from the command line, then log completion.
if __name__ == "__main__":
    _run_ut()
    logger.info("UT task completed.")
|
|
@@ -0,0 +1,7 @@
|
|
|
1
|
+
# API names in the "hf_32_standard_api" list.
# NOTE(review): presumably the APIs compared with an hf32-specific standard - confirm against the users of this list.
hf_32_standard_api = [
    "conv1d",
    "conv2d",
]
|
|
2
|
+
|
|
3
|
+
|
|
4
|
+
class Backward_Message:
    """Message constants describing why a backward check was skipped or unsupported."""

    MULTIPLE_BACKWARD_MESSAGE = "Multiple backward is not supported."
    UNSUPPORT_BACKWARD_MESSAGE = (
        "function with out=... arguments don't support automatic differentiation, "
        "skip backward."
    )
    NO_BACKWARD_RESULT_MESSAGE = "function backward result is None, skip backward."
|
|
@@ -0,0 +1,14 @@
|
|
|
1
|
+
# Template for a standalone ptdbg_ascend comparison script.
# NOTE(review): the placeholder markers below are presumably substituted by
# whatever renders this template; keep percent signs out of comments - TODO confirm.
from ptdbg_ascend import compare

# Placeholder for the pkl path.
pkl_path = "%s"
# Placeholder for the dump data directory.
dump_data_dir = "%s"

# NOTE(review): the four path values are blank in this template, so the text is
# not valid Python until they are filled in - presumably by the user; confirm.
dump_path_param = {
    "npu_pkl_path": ,
    "bench_pkl_path": ,
    "npu_dump_data_dir": ,
    "bench_dump_data_dir": ,
    "is_print_compare_log": True
}

# The stack_mode argument is a placeholder as well.
compare(dump_path_param, output_path="", stack_mode=%s)
|
|
@@ -0,0 +1,32 @@
|
|
|
1
|
+
import os
|
|
2
|
+
import time
|
|
3
|
+
import sys
|
|
4
|
+
from msprobe.pytorch.common.utils import get_rank_if_initialized
|
|
5
|
+
from msprobe.core.common.log import BaseLogger
|
|
6
|
+
from msprobe.core.common.exceptions import DistributedNotInitializedError
|
|
7
|
+
|
|
8
|
+
|
|
9
|
+
class PyTorchLogger(BaseLogger):
    """Logger that prefixes each message with time, pid and, when available, the rank."""

    def __init__(self):
        super().__init__()

    def get_rank(self):
        """Return the current rank, or ``None`` when distributed is not initialized."""
        try:
            return get_rank_if_initialized()
        except DistributedNotInitializedError:
            return None

    def _print_log(self, level, msg, end='\n'):
        """Print ``msg`` to stdout with a time/pid/rank/level prefix and flush.

        Args:
            level: Text placed in the ``[level]`` tag.
            msg: Message body.
            end: Line terminator passed to ``print``.
        """
        rank = self.get_rank()
        timestamp = time.strftime("%Y-%m-%d %H:%M:%S", time.localtime())
        process_id = os.getpid()
        # The rank tag is left out entirely when no rank is available.
        rank_tag = "" if rank is None else f"[rank {rank}] "
        print(f"{timestamp} ({process_id}) {rank_tag}[{level}] {msg}", end=end)
        sys.stdout.flush()


# Module-level logger instance shared by importers of this module.
logger = PyTorchLogger()
|
|
@@ -0,0 +1,37 @@
|
|
|
1
|
+
import json
|
|
2
|
+
from msprobe.core.common.exceptions import ParseJsonException
|
|
3
|
+
|
|
4
|
+
|
|
5
|
+
def parse_json_info_forward_backward(json_path):
    """Split the entries of a dump json file into forward and backward data.

    The file must contain a non-empty ``"data"`` mapping. Entries whose name
    contains ``"Module"`` are skipped. For every other entry the last
    dot-separated segment of the name selects the direction (``forward`` or
    ``backward``) and the rest of the name is used as the api name.

    Args:
        json_path: Path of the dump json file (read as UTF-8).

    Returns:
        A tuple ``(forward_data, backward_data, real_data_path)`` where the two
        dicts map api name to the dumped item and ``real_data_path`` is the
        value of ``"dump_data_dir"`` (``None`` when absent).

    Raises:
        ParseJsonException: If ``"data"`` is missing or empty, or if an entry
            name does not end in ``.forward`` / ``.backward``.
    """
    # JSON text is UTF-8; do not depend on the platform default encoding.
    with open(json_path, 'r', encoding='utf-8') as f:
        dump_json = json.load(f)

    real_data_path = dump_json.get("dump_data_dir")
    dump_data = dump_json.get("data")
    if not dump_data:
        raise ParseJsonException(ParseJsonException.InvalidDumpJson, "dump数据中没有data字段")

    forward_data = {}
    backward_data = {}
    targets = {"forward": forward_data, "backward": backward_data}
    for data_name, data_item in dump_data.items():
        if "Module" in data_name:
            continue
        # Decide by the final segment, not by substring, so that an api whose
        # own name contains "forward" or "backward" is still classified correctly.
        api_name, _, direction = data_name.rpartition('.')
        target = targets.get(direction)
        if target is None:
            raise ParseJsonException(ParseJsonException.UnexpectedNameStruct,
                                     f"{data_name} in file {json_path}.")
        target[api_name] = data_item

    return forward_data, backward_data, real_data_path
|