mindstudio-probe 1.0.1__py3-none-any.whl → 1.0.3__py3-none-any.whl
This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.
- {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/METADATA +5 -1
- mindstudio_probe-1.0.3.dist-info/RECORD +272 -0
- msprobe/README.md +78 -23
- msprobe/__init__.py +1 -0
- msprobe/config/README.md +182 -40
- msprobe/config/config.json +22 -0
- msprobe/core/__init__.py +0 -0
- msprobe/{pytorch → core}/advisor/advisor.py +3 -3
- msprobe/{pytorch → core}/advisor/advisor_result.py +2 -2
- msprobe/core/common/const.py +82 -5
- msprobe/core/common/exceptions.py +30 -18
- msprobe/core/common/file_check.py +19 -1
- msprobe/core/common/log.py +15 -1
- msprobe/core/common/utils.py +130 -30
- msprobe/core/common_config.py +32 -19
- msprobe/core/compare/acc_compare.py +299 -0
- msprobe/core/compare/check.py +95 -0
- msprobe/core/compare/compare_cli.py +49 -0
- msprobe/core/compare/highlight.py +222 -0
- msprobe/core/compare/multiprocessing_compute.py +149 -0
- msprobe/{pytorch → core}/compare/npy_compare.py +55 -4
- msprobe/core/compare/utils.py +429 -0
- msprobe/core/data_dump/data_collector.py +39 -35
- msprobe/core/data_dump/data_processor/base.py +85 -37
- msprobe/core/data_dump/data_processor/factory.py +5 -7
- msprobe/core/data_dump/data_processor/mindspore_processor.py +198 -0
- msprobe/core/data_dump/data_processor/pytorch_processor.py +94 -51
- msprobe/core/data_dump/json_writer.py +11 -11
- msprobe/core/grad_probe/__init__.py +0 -0
- msprobe/core/grad_probe/constant.py +71 -0
- msprobe/core/grad_probe/grad_compare.py +175 -0
- msprobe/core/grad_probe/utils.py +52 -0
- msprobe/doc/grad_probe/grad_probe.md +207 -0
- msprobe/doc/grad_probe/img/image-1.png +0 -0
- msprobe/doc/grad_probe/img/image-2.png +0 -0
- msprobe/doc/grad_probe/img/image-3.png +0 -0
- msprobe/doc/grad_probe/img/image-4.png +0 -0
- msprobe/doc/grad_probe/img/image.png +0 -0
- msprobe/mindspore/api_accuracy_checker/__init__.py +0 -0
- msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +246 -0
- msprobe/mindspore/api_accuracy_checker/api_info.py +69 -0
- msprobe/mindspore/api_accuracy_checker/api_runner.py +152 -0
- msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +197 -0
- msprobe/mindspore/api_accuracy_checker/compute_element.py +224 -0
- msprobe/mindspore/api_accuracy_checker/main.py +16 -0
- msprobe/mindspore/api_accuracy_checker/type_mapping.py +114 -0
- msprobe/mindspore/api_accuracy_checker/utils.py +63 -0
- msprobe/mindspore/cell_processor.py +34 -0
- msprobe/mindspore/common/const.py +87 -0
- msprobe/mindspore/common/log.py +38 -0
- msprobe/mindspore/common/utils.py +57 -0
- msprobe/mindspore/compare/distributed_compare.py +75 -0
- msprobe/mindspore/compare/ms_compare.py +117 -0
- msprobe/mindspore/compare/ms_graph_compare.py +317 -0
- msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -0
- msprobe/mindspore/debugger/debugger_config.py +38 -15
- msprobe/mindspore/debugger/precision_debugger.py +79 -4
- msprobe/mindspore/doc/compare.md +58 -0
- msprobe/mindspore/doc/dump.md +158 -6
- msprobe/mindspore/dump/dump_tool_factory.py +19 -22
- msprobe/mindspore/dump/hook_cell/api_registry.py +104 -0
- msprobe/mindspore/dump/hook_cell/hook_cell.py +53 -0
- msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +925 -0
- msprobe/mindspore/dump/hook_cell/wrap_functional.py +91 -0
- msprobe/mindspore/dump/hook_cell/wrap_tensor.py +63 -0
- msprobe/mindspore/dump/jit_dump.py +56 -0
- msprobe/mindspore/dump/kernel_kbyk_dump.py +65 -0
- msprobe/mindspore/free_benchmark/__init__.py +0 -0
- msprobe/mindspore/free_benchmark/api_pynative_self_check.py +116 -0
- msprobe/mindspore/free_benchmark/common/__init__.py +0 -0
- msprobe/mindspore/free_benchmark/common/config.py +12 -0
- msprobe/mindspore/free_benchmark/common/handler_params.py +17 -0
- msprobe/mindspore/free_benchmark/common/utils.py +71 -0
- msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -0
- msprobe/mindspore/free_benchmark/decorator/__init__.py +0 -0
- msprobe/mindspore/free_benchmark/decorator/dec_forward.py +42 -0
- msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +107 -0
- msprobe/mindspore/free_benchmark/handler/__init__.py +0 -0
- msprobe/mindspore/free_benchmark/handler/base_handler.py +90 -0
- msprobe/mindspore/free_benchmark/handler/check_handler.py +41 -0
- msprobe/mindspore/free_benchmark/handler/fix_handler.py +36 -0
- msprobe/mindspore/free_benchmark/handler/handler_factory.py +21 -0
- msprobe/mindspore/free_benchmark/perturbation/add_noise.py +67 -0
- msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +21 -0
- msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +63 -0
- msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +34 -0
- msprobe/mindspore/free_benchmark/perturbation/no_change.py +12 -0
- msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +27 -0
- msprobe/mindspore/free_benchmark/self_check_tool_factory.py +33 -0
- msprobe/mindspore/grad_probe/__init__.py +0 -0
- msprobe/mindspore/grad_probe/global_context.py +91 -0
- msprobe/mindspore/grad_probe/grad_analyzer.py +231 -0
- msprobe/mindspore/grad_probe/grad_monitor.py +27 -0
- msprobe/mindspore/grad_probe/grad_stat_csv.py +132 -0
- msprobe/mindspore/grad_probe/hook.py +92 -0
- msprobe/mindspore/grad_probe/utils.py +29 -0
- msprobe/mindspore/ms_config.py +63 -15
- msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +17 -15
- msprobe/mindspore/runtime.py +4 -0
- msprobe/mindspore/service.py +354 -0
- msprobe/mindspore/task_handler_factory.py +7 -4
- msprobe/msprobe.py +66 -26
- msprobe/pytorch/__init__.py +1 -1
- msprobe/pytorch/api_accuracy_checker/common/config.py +21 -16
- msprobe/pytorch/api_accuracy_checker/common/utils.py +1 -60
- msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +2 -5
- msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +46 -10
- msprobe/pytorch/api_accuracy_checker/compare/compare.py +84 -48
- msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +8 -12
- msprobe/pytorch/api_accuracy_checker/config.yaml +7 -1
- msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +15 -11
- msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +11 -15
- msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +16 -9
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +193 -105
- msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +68 -1
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/__init__.py +0 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +202 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +324 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +204 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +218 -0
- msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +10 -0
- msprobe/pytorch/bench_functions/__init__.py +15 -0
- msprobe/pytorch/bench_functions/apply_adam_w.py +28 -0
- msprobe/pytorch/bench_functions/confusion_transpose.py +19 -0
- msprobe/pytorch/bench_functions/fast_gelu.py +55 -0
- msprobe/pytorch/bench_functions/layer_norm_eval.py +6 -0
- msprobe/pytorch/bench_functions/linear.py +12 -0
- msprobe/pytorch/bench_functions/matmul_backward.py +48 -0
- msprobe/pytorch/bench_functions/npu_fusion_attention.py +421 -0
- msprobe/pytorch/bench_functions/rms_norm.py +15 -0
- msprobe/pytorch/bench_functions/rotary_mul.py +52 -0
- msprobe/pytorch/bench_functions/scaled_mask_softmax.py +26 -0
- msprobe/pytorch/bench_functions/swiglu.py +55 -0
- msprobe/pytorch/common/parse_json.py +3 -1
- msprobe/pytorch/common/utils.py +83 -7
- msprobe/pytorch/compare/distributed_compare.py +19 -64
- msprobe/pytorch/compare/match.py +3 -6
- msprobe/pytorch/compare/pt_compare.py +40 -0
- msprobe/pytorch/debugger/debugger_config.py +11 -2
- msprobe/pytorch/debugger/precision_debugger.py +34 -4
- msprobe/pytorch/doc/api_accuracy_checker.md +57 -13
- msprobe/pytorch/doc/api_accuracy_checker_online.md +187 -0
- msprobe/pytorch/doc/dump.md +73 -20
- msprobe/pytorch/doc/ptdbg_ascend_compare.md +75 -11
- msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +3 -3
- msprobe/pytorch/doc/run_overflow_check.md +1 -1
- msprobe/pytorch/doc/无标杆工具场景验证和性能基线报告.md +151 -0
- msprobe/pytorch/free_benchmark/common/constant.py +3 -0
- msprobe/pytorch/free_benchmark/common/utils.py +4 -0
- msprobe/pytorch/free_benchmark/compare/grad_saver.py +22 -26
- msprobe/pytorch/free_benchmark/main.py +7 -4
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +1 -1
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +1 -1
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +1 -1
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +3 -3
- msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +1 -1
- msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +1 -1
- msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +43 -29
- msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +0 -1
- msprobe/pytorch/function_factory.py +75 -0
- msprobe/pytorch/functional/dump_module.py +4 -4
- msprobe/pytorch/grad_probe/__init__.py +0 -0
- msprobe/pytorch/grad_probe/grad_monitor.py +90 -0
- msprobe/pytorch/grad_probe/grad_stat_csv.py +129 -0
- msprobe/pytorch/hook_module/hook_module.py +14 -3
- msprobe/pytorch/hook_module/support_wrap_ops.yaml +2 -1
- msprobe/pytorch/hook_module/utils.py +9 -9
- msprobe/pytorch/hook_module/wrap_aten.py +20 -10
- msprobe/pytorch/hook_module/wrap_distributed.py +10 -7
- msprobe/pytorch/hook_module/wrap_functional.py +4 -7
- msprobe/pytorch/hook_module/wrap_npu_custom.py +21 -10
- msprobe/pytorch/hook_module/wrap_tensor.py +5 -6
- msprobe/pytorch/hook_module/wrap_torch.py +5 -7
- msprobe/pytorch/hook_module/wrap_vf.py +6 -8
- msprobe/pytorch/module_processer.py +53 -13
- msprobe/pytorch/online_dispatch/compare.py +4 -4
- msprobe/pytorch/online_dispatch/dispatch.py +39 -41
- msprobe/pytorch/online_dispatch/dump_compare.py +17 -47
- msprobe/pytorch/online_dispatch/single_compare.py +5 -5
- msprobe/pytorch/online_dispatch/utils.py +2 -43
- msprobe/pytorch/parse_tool/lib/compare.py +31 -19
- msprobe/pytorch/parse_tool/lib/config.py +2 -1
- msprobe/pytorch/parse_tool/lib/parse_tool.py +4 -4
- msprobe/pytorch/parse_tool/lib/utils.py +34 -80
- msprobe/pytorch/parse_tool/lib/visualization.py +4 -3
- msprobe/pytorch/pt_config.py +100 -6
- msprobe/pytorch/service.py +104 -19
- mindstudio_probe-1.0.1.dist-info/RECORD +0 -228
- msprobe/mindspore/dump/api_kbk_dump.py +0 -55
- msprobe/pytorch/compare/acc_compare.py +0 -1024
- msprobe/pytorch/compare/highlight.py +0 -100
- msprobe/test/core_ut/common/test_utils.py +0 -345
- msprobe/test/core_ut/data_dump/test_data_collector.py +0 -47
- msprobe/test/core_ut/data_dump/test_json_writer.py +0 -183
- msprobe/test/core_ut/data_dump/test_scope.py +0 -151
- msprobe/test/core_ut/test_common_config.py +0 -152
- msprobe/test/core_ut/test_file_check.py +0 -218
- msprobe/test/core_ut/test_log.py +0 -109
- msprobe/test/mindspore_ut/test_api_kbk_dump.py +0 -51
- msprobe/test/mindspore_ut/test_debugger_config.py +0 -42
- msprobe/test/mindspore_ut/test_dump_tool_factory.py +0 -51
- msprobe/test/mindspore_ut/test_kernel_graph_dump.py +0 -66
- msprobe/test/mindspore_ut/test_kernel_graph_overflow_check.py +0 -63
- msprobe/test/mindspore_ut/test_ms_config.py +0 -69
- msprobe/test/mindspore_ut/test_overflow_check_tool_factory.py +0 -51
- msprobe/test/mindspore_ut/test_precision_debugger.py +0 -56
- msprobe/test/mindspore_ut/test_task_handler_factory.py +0 -58
- msprobe/test/pytorch_ut/advisor/test_advisor.py +0 -83
- msprobe/test/pytorch_ut/api_accuracy_checker/common/test_common_utils.py +0 -108
- msprobe/test/pytorch_ut/api_accuracy_checker/common/test_config.py +0 -39
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_algorithm.py +0 -112
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_api_precision_compare.py +0 -77
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare.py +0 -125
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_column.py +0 -10
- msprobe/test/pytorch_ut/api_accuracy_checker/compare/test_compare_utils.py +0 -43
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/dump.json +0 -179
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/forward.json +0 -63
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_data_generate.py +0 -99
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_multi_run_ut.py +0 -115
- msprobe/test/pytorch_ut/api_accuracy_checker/run_ut/test_run_ut.py +0 -72
- msprobe/test/pytorch_ut/compare/test_acc_compare.py +0 -17
- msprobe/test/pytorch_ut/free_benchmark/perturbed_layers/test_perturbed_layser.py +0 -105
- msprobe/test/pytorch_ut/free_benchmark/result_handlers/test_result_handler.py +0 -121
- msprobe/test/pytorch_ut/free_benchmark/test_main.py +0 -101
- msprobe/test/pytorch_ut/functional/test_dump_module.py +0 -15
- msprobe/test/pytorch_ut/hook_module/test_api_registry.py +0 -130
- msprobe/test/pytorch_ut/hook_module/test_hook_module.py +0 -42
- msprobe/test/pytorch_ut/hook_module/test_wrap_aten.py +0 -65
- msprobe/test/pytorch_ut/hook_module/test_wrap_distributed.py +0 -35
- msprobe/test/pytorch_ut/hook_module/test_wrap_functional.py +0 -20
- msprobe/test/pytorch_ut/hook_module/test_wrap_tensor.py +0 -35
- msprobe/test/pytorch_ut/hook_module/test_wrap_torch.py +0 -43
- msprobe/test/pytorch_ut/hook_module/test_wrap_vf.py +0 -11
- msprobe/test/pytorch_ut/test_pt_config.py +0 -69
- msprobe/test/pytorch_ut/test_service.py +0 -59
- msprobe/test/resources/advisor.txt +0 -3
- msprobe/test/resources/compare_result_20230703104808.csv +0 -9
- msprobe/test/resources/compare_result_without_accuracy.csv +0 -9
- msprobe/test/resources/config.yaml +0 -3
- msprobe/test/resources/npu_test.pkl +0 -8
- msprobe/test/run_test.sh +0 -30
- msprobe/test/run_ut.py +0 -58
- msprobe/test/test_module_processer.py +0 -64
- {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/LICENSE +0 -0
- {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/WHEEL +0 -0
- {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/entry_points.txt +0 -0
- {mindstudio_probe-1.0.1.dist-info → mindstudio_probe-1.0.3.dist-info}/top_level.txt +0 -0
- /msprobe/{pytorch → core}/advisor/advisor_const.py +0 -0
- /msprobe/pytorch/doc/{atat → msprobe}精度工具数据dump标准性能基线报告.md +0 -0
|
@@ -1,99 +0,0 @@
|
|
|
1
|
-
# coding=utf-8
|
|
2
|
-
import os
|
|
3
|
-
import unittest
|
|
4
|
-
import copy
|
|
5
|
-
|
|
6
|
-
from msprobe.pytorch.api_accuracy_checker.run_ut.data_generate import *
|
|
7
|
-
from msprobe.pytorch.api_accuracy_checker.common.utils import get_json_contents
|
|
8
|
-
|
|
9
|
-
base_dir = os.path.dirname(os.path.realpath(__file__))
|
|
10
|
-
forward_file = os.path.join(base_dir, "forward.json")
|
|
11
|
-
forward_content = get_json_contents(forward_file)
|
|
12
|
-
for key, value in forward_content.items():
|
|
13
|
-
api_full_name = key
|
|
14
|
-
api_info_dict = value
|
|
15
|
-
|
|
16
|
-
max_value = 1.3945078125
|
|
17
|
-
min_value = -1.444359375
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
class TestDataGenerateMethods(unittest.TestCase):
|
|
21
|
-
def test_gen_api_params(self):
|
|
22
|
-
api_info = copy.deepcopy(api_info_dict)
|
|
23
|
-
args_params, kwargs_params = gen_api_params(api_info, True, None, None)
|
|
24
|
-
max_diff = abs(args_params[0].max() - max_value)
|
|
25
|
-
min_diff = abs(args_params[0].min() - min_value)
|
|
26
|
-
self.assertEqual(len(args_params), 2)
|
|
27
|
-
self.assertEqual(args_params[0].dtype, torch.float16)
|
|
28
|
-
self.assertEqual(args_params[1], 2)
|
|
29
|
-
self.assertLessEqual(max_diff, 0.001)
|
|
30
|
-
self.assertLessEqual(min_diff, 0.001)
|
|
31
|
-
self.assertEqual(args_params[0].shape, torch.Size([2048, 2, 1, 256]))
|
|
32
|
-
self.assertEqual(kwargs_params, {'dim': -1})
|
|
33
|
-
|
|
34
|
-
def test_gen_args(self):
|
|
35
|
-
args_result = gen_args(api_info_dict.get('input_args'), "conv2d")
|
|
36
|
-
max_diff = abs(args_result[0].max() - max_value)
|
|
37
|
-
min_diff = abs(args_result[0].min() - min_value)
|
|
38
|
-
self.assertEqual(len(args_result), 2)
|
|
39
|
-
self.assertEqual(args_result[0].dtype, torch.float16)
|
|
40
|
-
self.assertLessEqual(max_diff, 0.001)
|
|
41
|
-
self.assertLessEqual(min_diff, 0.001)
|
|
42
|
-
self.assertEqual(args_result[0].shape, torch.Size([2048, 2, 1, 256]))
|
|
43
|
-
|
|
44
|
-
def test_gen_data(self):
|
|
45
|
-
data = gen_data(api_info_dict.get('input_args')[0], "conv2d", True, None, None)
|
|
46
|
-
max_diff = abs(data.max() - max_value)
|
|
47
|
-
min_diff = abs(data.min() - min_value)
|
|
48
|
-
self.assertEqual(data.dtype, torch.float16)
|
|
49
|
-
self.assertEqual(data.requires_grad, True)
|
|
50
|
-
self.assertLessEqual(max_diff, 0.001)
|
|
51
|
-
self.assertLessEqual(min_diff, 0.001)
|
|
52
|
-
self.assertEqual(data.shape, torch.Size([2048, 2, 1, 256]))
|
|
53
|
-
|
|
54
|
-
def test_gen_kwargs(self):
|
|
55
|
-
api_info = copy.deepcopy(api_info_dict)
|
|
56
|
-
kwargs_params = gen_kwargs(api_info, None)
|
|
57
|
-
self.assertEqual(kwargs_params, {'dim': -1})
|
|
58
|
-
|
|
59
|
-
def test_gen_kwargs_2(self):
|
|
60
|
-
k_dict = {"inplace": {"type": "bool", "value": "False"}}
|
|
61
|
-
for key, value in k_dict.items():
|
|
62
|
-
gen_torch_kwargs(k_dict, key, value)
|
|
63
|
-
self.assertEqual(k_dict, {'inplace': False})
|
|
64
|
-
|
|
65
|
-
def test_gen_random_tensor(self):
|
|
66
|
-
data = gen_random_tensor(api_info_dict.get('input_args')[0], None)
|
|
67
|
-
max_diff = abs(data.max() - max_value)
|
|
68
|
-
min_diff = abs(data.min() - min_value)
|
|
69
|
-
self.assertEqual(data.dtype, torch.float16)
|
|
70
|
-
self.assertEqual(data.requires_grad, False)
|
|
71
|
-
self.assertLessEqual(max_diff, 0.001)
|
|
72
|
-
self.assertLessEqual(min_diff, 0.001)
|
|
73
|
-
self.assertEqual(data.shape, torch.Size([2048, 2, 1, 256]))
|
|
74
|
-
|
|
75
|
-
def test_gen_common_tensor(self):
|
|
76
|
-
info = api_info_dict.get('input_args')[0]
|
|
77
|
-
low, high = info.get('Min'), info.get('Max')
|
|
78
|
-
low_origin, high_origin = info.get('Min_origin'), info.get('Max_origin')
|
|
79
|
-
low_info = [low, low_origin]
|
|
80
|
-
high_info = [high, high_origin]
|
|
81
|
-
data_dtype = info.get('dtype')
|
|
82
|
-
shape = tuple(info.get('shape'))
|
|
83
|
-
data = gen_common_tensor(low_info, high_info, shape, data_dtype, None)
|
|
84
|
-
max_diff = abs(data.max() - max_value)
|
|
85
|
-
min_diff = abs(data.min() - min_value)
|
|
86
|
-
self.assertEqual(data.dtype, torch.float16)
|
|
87
|
-
self.assertEqual(data.requires_grad, False)
|
|
88
|
-
self.assertLessEqual(max_diff, 0.001)
|
|
89
|
-
self.assertLessEqual(min_diff, 0.001)
|
|
90
|
-
self.assertEqual(data.shape, torch.Size([2048, 2, 1, 256]))
|
|
91
|
-
|
|
92
|
-
def test_gen_bool_tensor(self):
|
|
93
|
-
info = {"type": "torch.Tensor", "dtype": "torch.bool", "shape": [1, 1, 160, 256], "Max": 1, "Min": 0,
|
|
94
|
-
"requires_grad": False}
|
|
95
|
-
low, high = info.get("Min"), info.get("Max")
|
|
96
|
-
shape = tuple(info.get("shape"))
|
|
97
|
-
data = gen_bool_tensor(low, high, shape)
|
|
98
|
-
self.assertEqual(data.shape, torch.Size([1, 1, 160, 256]))
|
|
99
|
-
self.assertEqual(data.dtype, torch.bool)
|
|
@@ -1,115 +0,0 @@
|
|
|
1
|
-
import os
|
|
2
|
-
import glob
|
|
3
|
-
import unittest
|
|
4
|
-
import logging
|
|
5
|
-
from unittest.mock import patch, mock_open, MagicMock
|
|
6
|
-
import json
|
|
7
|
-
import signal
|
|
8
|
-
from msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut import split_json_file, signal_handler, run_parallel_ut, \
|
|
9
|
-
prepare_config, main, ParallelUTConfig
|
|
10
|
-
|
|
11
|
-
|
|
12
|
-
class TestMultiRunUT(unittest.TestCase):
|
|
13
|
-
|
|
14
|
-
def setUp(self):
|
|
15
|
-
self.test_json_file = os.path.join(os.path.dirname(os.path.realpath(__file__)), "dump.json")
|
|
16
|
-
self.test_data = {'data': {'key1': 'TRUE', 'key2': 'TRUE', 'key3': 'TRUE'}}
|
|
17
|
-
self.test_json_content = json.dumps(self.test_data)
|
|
18
|
-
self.forward_split_files_content = [
|
|
19
|
-
{'key1': 'TRUE', 'key2': 'TRUE'},
|
|
20
|
-
{'key3': 'TRUE', 'key4': 'TRUE'}
|
|
21
|
-
]
|
|
22
|
-
|
|
23
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.FileOpen')
|
|
24
|
-
def test_split_json_file(self, mock_FileOpen):
|
|
25
|
-
mock_FileOpen.return_value.__enter__.return_value = mock_open(read_data=self.test_json_content).return_value
|
|
26
|
-
num_splits = 2
|
|
27
|
-
split_files, total_items = split_json_file(self.test_json_file, num_splits, False)
|
|
28
|
-
self.assertEqual(len(split_files), num_splits)
|
|
29
|
-
self.assertEqual(total_items, len(self.test_data.get('data')))
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
@patch('subprocess.Popen')
|
|
33
|
-
@patch('os.path.exists', return_value=True)
|
|
34
|
-
@patch('builtins.open', new_callable=mock_open)
|
|
35
|
-
@patch('json.load', side_effect=lambda f: {'key1': 'TRUE', 'key2': 'TRUE'})
|
|
36
|
-
def test_run_parallel_ut(self, mock_json_load, mock_file, mock_exists, mock_popen):
|
|
37
|
-
mock_process = MagicMock()
|
|
38
|
-
mock_process.poll.side_effect = [None, None, 1]
|
|
39
|
-
mock_process.stdout.readline.side_effect = ['[ERROR] Test Error Message\n', '']
|
|
40
|
-
mock_popen.return_value = mock_process
|
|
41
|
-
|
|
42
|
-
config = ParallelUTConfig(
|
|
43
|
-
api_files=['test.json'],
|
|
44
|
-
out_path='./',
|
|
45
|
-
num_splits=2,
|
|
46
|
-
save_error_data_flag=True,
|
|
47
|
-
jit_compile_flag=False,
|
|
48
|
-
device_id=[0, 1],
|
|
49
|
-
result_csv_path='result.csv',
|
|
50
|
-
total_items=2,
|
|
51
|
-
real_data_path=None
|
|
52
|
-
)
|
|
53
|
-
|
|
54
|
-
mock_file.side_effect = [
|
|
55
|
-
mock_open(read_data=json.dumps(self.forward_split_files_content[0])).return_value,
|
|
56
|
-
mock_open(read_data=json.dumps(self.forward_split_files_content[1])).return_value
|
|
57
|
-
]
|
|
58
|
-
|
|
59
|
-
run_parallel_ut(config)
|
|
60
|
-
|
|
61
|
-
mock_popen.assert_called()
|
|
62
|
-
mock_exists.assert_called()
|
|
63
|
-
|
|
64
|
-
@patch('os.remove')
|
|
65
|
-
@patch('os.path.realpath', side_effect=lambda x: x)
|
|
66
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.check_link')
|
|
67
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.check_file_suffix')
|
|
68
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.FileChecker')
|
|
69
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.split_json_file',
|
|
70
|
-
return_value=(['forward_split1.json', 'forward_split2.json'], 2))
|
|
71
|
-
def test_prepare_config(self, mock_split_json_file, mock_FileChecker, mock_check_file_suffix, mock_check_link,
|
|
72
|
-
mock_realpath, mock_remove):
|
|
73
|
-
mock_FileChecker_instance = MagicMock()
|
|
74
|
-
mock_FileChecker_instance.common_check.return_value = './'
|
|
75
|
-
mock_FileChecker.return_value = mock_FileChecker_instance
|
|
76
|
-
args = MagicMock()
|
|
77
|
-
args.api_info = 'forward.json'
|
|
78
|
-
args.out_path = './'
|
|
79
|
-
args.num_splits = 2
|
|
80
|
-
args.save_error_data = True
|
|
81
|
-
args.jit_compile = False
|
|
82
|
-
args.device_id = [0, 1]
|
|
83
|
-
args.result_csv_path = None
|
|
84
|
-
args.real_data_path = None
|
|
85
|
-
|
|
86
|
-
config = prepare_config(args)
|
|
87
|
-
|
|
88
|
-
self.assertEqual(config.num_splits, 2)
|
|
89
|
-
self.assertTrue(config.save_error_data_flag)
|
|
90
|
-
self.assertFalse(config.jit_compile_flag)
|
|
91
|
-
self.assertEqual(config.device_id, [0, 1])
|
|
92
|
-
self.assertEqual(config.total_items, 2)
|
|
93
|
-
|
|
94
|
-
|
|
95
|
-
@patch('argparse.ArgumentParser.parse_args')
|
|
96
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.prepare_config')
|
|
97
|
-
@patch('msprobe.pytorch.api_accuracy_checker.run_ut.multi_run_ut.run_parallel_ut')
|
|
98
|
-
def test_main(self, mock_run_parallel_ut, mock_prepare_config, mock_parse_args):
|
|
99
|
-
main()
|
|
100
|
-
mock_parse_args.assert_called()
|
|
101
|
-
mock_prepare_config.assert_called()
|
|
102
|
-
mock_run_parallel_ut.assert_called()
|
|
103
|
-
|
|
104
|
-
def tearDown(self):
|
|
105
|
-
current_directory = os.getcwd()
|
|
106
|
-
pattern = os.path.join(current_directory, 'accuracy_checking_*')
|
|
107
|
-
files = glob.glob(pattern)
|
|
108
|
-
|
|
109
|
-
for file in files:
|
|
110
|
-
try:
|
|
111
|
-
os.remove(file)
|
|
112
|
-
logging.info(f"Deleted file: {file}")
|
|
113
|
-
except Exception as e:
|
|
114
|
-
logging.error(f"Failed to delete file {file}: {e}")
|
|
115
|
-
|
|
@@ -1,72 +0,0 @@
|
|
|
1
|
-
# coding=utf-8
|
|
2
|
-
import os
|
|
3
|
-
import copy
|
|
4
|
-
import unittest
|
|
5
|
-
import torch
|
|
6
|
-
from unittest.mock import patch, DEFAULT
|
|
7
|
-
from msprobe.pytorch.api_accuracy_checker.run_ut.run_ut import *
|
|
8
|
-
from msprobe.pytorch.api_accuracy_checker.common.utils import get_json_contents
|
|
9
|
-
|
|
10
|
-
base_dir = os.path.dirname(os.path.realpath(__file__))
|
|
11
|
-
forward_file = os.path.join(base_dir, "forward.json")
|
|
12
|
-
forward_content = get_json_contents(forward_file)
|
|
13
|
-
for api_full_name, api_info_dict in forward_content.items():
|
|
14
|
-
api_full_name = api_full_name
|
|
15
|
-
api_info_dict = api_info_dict
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
class TestRunUtMethods(unittest.TestCase):
|
|
19
|
-
def test_exec_api(self):
|
|
20
|
-
api_info = copy.deepcopy(api_info_dict)
|
|
21
|
-
|
|
22
|
-
[api_type, api_name, _, _] = api_full_name.split(".")
|
|
23
|
-
args, kwargs, need_grad = get_api_info(api_info, api_name, None)
|
|
24
|
-
cpu_args, cpu_kwargs = generate_cpu_params(args, kwargs, True, '')
|
|
25
|
-
out = exec_api(api_type, api_name, cpu_args, cpu_kwargs)
|
|
26
|
-
self.assertEqual(out[0].dtype, torch.float32)
|
|
27
|
-
self.assertTrue(out[0].requires_grad)
|
|
28
|
-
self.assertEqual(out[0].shape, torch.Size([2048, 2, 1, 128]))
|
|
29
|
-
|
|
30
|
-
def test_generate_device_params(self):
|
|
31
|
-
mock_tensor = torch.rand([2, 2560, 24, 24], dtype=torch.float32, requires_grad=True)
|
|
32
|
-
|
|
33
|
-
with patch.multiple('torch.Tensor',
|
|
34
|
-
to=DEFAULT,
|
|
35
|
-
clone=DEFAULT,
|
|
36
|
-
detach=DEFAULT,
|
|
37
|
-
requires_grad_=DEFAULT,
|
|
38
|
-
type_as=DEFAULT,
|
|
39
|
-
retain_grad=DEFAULT) as mocks:
|
|
40
|
-
mocks['clone'].return_value = mock_tensor
|
|
41
|
-
mocks['detach'].return_value = mock_tensor
|
|
42
|
-
mocks['requires_grad_'].return_value = mock_tensor
|
|
43
|
-
mocks['type_as'].return_value = mock_tensor
|
|
44
|
-
mocks['retain_grad'].return_value = None
|
|
45
|
-
mocks['to'].return_value = mock_tensor
|
|
46
|
-
|
|
47
|
-
device_args, device_kwargs = generate_device_params([mock_tensor], {'inplace': False}, True, '')
|
|
48
|
-
self.assertEqual(len(device_args), 1)
|
|
49
|
-
self.assertEqual(device_args[0].dtype, torch.float32)
|
|
50
|
-
self.assertTrue(device_args[0].requires_grad)
|
|
51
|
-
self.assertEqual(device_args[0].shape, torch.Size([2, 2560, 24, 24]))
|
|
52
|
-
self.assertEqual(device_kwargs, {'inplace': False})
|
|
53
|
-
|
|
54
|
-
def test_generate_cpu_params(self):
|
|
55
|
-
api_info = copy.deepcopy(api_info_dict)
|
|
56
|
-
[api_type, api_name, _, _] = api_full_name.split(".")
|
|
57
|
-
args, kwargs, need_grad = get_api_info(api_info, api_name, None)
|
|
58
|
-
cpu_args, cpu_kwargs = generate_cpu_params(args, kwargs, True, '')
|
|
59
|
-
self.assertEqual(len(cpu_args), 2)
|
|
60
|
-
self.assertEqual(cpu_args[0].dtype, torch.float32)
|
|
61
|
-
self.assertTrue(cpu_args[0].requires_grad)
|
|
62
|
-
self.assertEqual(cpu_args[0].shape, torch.Size([2048, 2, 1, 256]))
|
|
63
|
-
self.assertEqual(cpu_kwargs, {'dim': -1})
|
|
64
|
-
|
|
65
|
-
def test_UtDataInfo(self):
|
|
66
|
-
data_info = UtDataInfo(None, None, None, None, None, None, None)
|
|
67
|
-
self.assertIsNone(data_info.bench_grad)
|
|
68
|
-
self.assertIsNone(data_info.device_grad)
|
|
69
|
-
self.assertIsNone(data_info.device_output)
|
|
70
|
-
self.assertIsNone(data_info.bench_output)
|
|
71
|
-
self.assertIsNone(data_info.grad_in)
|
|
72
|
-
self.assertIsNone(data_info.in_fwd_data_list)
|
|
@@ -1,17 +0,0 @@
|
|
|
1
|
-
# coding=utf-8
|
|
2
|
-
import unittest
|
|
3
|
-
from msprobe.pytorch.compare.acc_compare import rename_api
|
|
4
|
-
|
|
5
|
-
class TestUtilsMethods(unittest.TestCase):
|
|
6
|
-
|
|
7
|
-
def test_rename_api(self):
|
|
8
|
-
test_name_1 = "Distributed.broadcast.0.forward.input.0"
|
|
9
|
-
expect_name_1 = "Distributed.broadcast.input.0"
|
|
10
|
-
actual_name_1 = rename_api(test_name_1, "forward")
|
|
11
|
-
self.assertEqual(actual_name_1, expect_name_1)
|
|
12
|
-
|
|
13
|
-
test_name_2 = "Torch.sum.0.backward.output.0"
|
|
14
|
-
expect_name_2 = "Torch.sum.output.0"
|
|
15
|
-
actual_name_2 = rename_api(test_name_2, "backward")
|
|
16
|
-
self.assertEqual(actual_name_2, expect_name_2)
|
|
17
|
-
|
|
@@ -1,105 +0,0 @@
|
|
|
1
|
-
from unittest import TestCase
|
|
2
|
-
|
|
3
|
-
import torch
|
|
4
|
-
from msprobe.core.common.const import Const
|
|
5
|
-
from msprobe.pytorch.free_benchmark.common.enums import DeviceType, PerturbationMode
|
|
6
|
-
from msprobe.pytorch.free_benchmark.common.params import data_pre_deal
|
|
7
|
-
from msprobe.pytorch.free_benchmark.perturbed_layers.layer_factory import LayerFactory
|
|
8
|
-
|
|
9
|
-
|
|
10
|
-
class TestPerturbedLayer(TestCase):

    # When the improve-precision perturbation is applied to an operator whose
    # output precision matches its input precision, the precision of the
    # perturbed output is raised as well.
    def test_improve_precision_layer_handle_with_out_dtype_changing(self):
        api_name = "Torch.mul.0.forward"
        lhs = torch.randn(2, 3, dtype=torch.float16)
        rhs = torch.randn(2, 3, dtype=torch.float16)
        original_output = torch.mul(lhs, rhs)

        data_params = data_pre_deal(api_name, torch.mul, (lhs, rhs), {})
        data_params.fuzz_stage = Const.FORWARD
        data_params.original_result = original_output

        layer = LayerFactory.create(
            api_name,
            DeviceType.NPU,
            PerturbationMode.IMPROVE_PRECISION,
        )
        layer.handle(data_params)

        # The original result keeps float16; the perturbed one is float32.
        self.assertEqual(data_params.original_result.dtype, torch.float16)
        self.assertEqual(layer.perturbed_value, torch.float32)
        self.assertEqual(data_params.perturbed_result.dtype, torch.float32)

    # For iterable inputs, the improve-precision method walks the elements and
    # raises the precision of those whose type is supported.
    def test_improve_precision_layer_with_iterable_inputs(self):
        api_name = "iterable.0.forward"
        bf16_tensor = torch.randn(2, 3, dtype=torch.bfloat16)
        fp16_tensor = torch.randn(2, 3, dtype=torch.float16)
        fp32_tensor = torch.randn(2, 3, dtype=torch.float32)
        fp64_tensor = torch.randn(2, 3, dtype=torch.float64)
        int32_tensor = torch.randn(2, 3, dtype=torch.float64).to(torch.int32)
        inputs = [
            bf16_tensor,
            fp16_tensor,
            {"c": fp32_tensor, "d": fp64_tensor},
            int32_tensor,
        ]

        layer = LayerFactory.create(
            api_name,
            DeviceType.NPU,
            PerturbationMode.IMPROVE_PRECISION,
        )
        perturbed = layer.improve_tensor_precision(inputs)

        self.assertEqual(perturbed[0].dtype, torch.float32)
        self.assertEqual(perturbed[1].dtype, torch.float32)
        self.assertEqual(perturbed[2]["c"].dtype, torch.float32)
        self.assertEqual(perturbed[2]["d"].dtype, torch.float64)
        self.assertEqual(perturbed[3].dtype, torch.int32)

    # The no_change perturbation leaves the input unchanged.
    def test_no_change_layer(self):
        api_name = "nochange.0.forward"
        inputs = torch.as_tensor([1e-9, 1e-2], dtype=torch.float32)
        layer = LayerFactory.create(
            api_name,
            DeviceType.NPU,
            PerturbationMode.NO_CHANGE,
        )
        perturbed = layer.no_change(inputs)
        self.assertEqual(perturbed[0], 1e-9)
        self.assertEqual(perturbed[1], 1e-2)

    # For 1-D and 2-D tensors, the change_value perturbation swaps the
    # positions of the first and last values.
    def test_change_value_layer(self):
        api_name = "change.0.forward"
        inputs_1dim = torch.as_tensor([1e-9, 1e-7, 1e-2], dtype=torch.float32)
        inputs_2dim = torch.as_tensor(
            [[1e-9, 1e-7, 1e-2], [1e-9, 1e-2, 1e-7]],
            dtype=torch.float32,
        )
        layer = LayerFactory.create(
            api_name,
            DeviceType.NPU,
            PerturbationMode.CHANGE_VALUE,
        )

        perturbed_1dim = layer.change_value(inputs_1dim)
        # The flag is reset between the two calls on the same layer.
        layer.is_added = False
        perturbed_2dim = layer.change_value(inputs_2dim)

        self.assertEqual(perturbed_1dim[0], 1e-2)
        self.assertEqual(perturbed_1dim[2], 1e-9)
        self.assertEqual(perturbed_2dim[0][0], 1e-7)
        self.assertEqual(perturbed_2dim[-1][-1], 1e-9)

    # For an input tensor, the bit_noise perturbation flips the trailing bit
    # of the elements that are larger than a tiny threshold.
    def test_bit_noise_layer(self):
        api_name = "bitnoise.0.forward"
        inputs = torch.as_tensor(
            [4096.00048828125, 16777216, 1e-38],
            dtype=torch.float32,
        )
        layer = LayerFactory.create(
            api_name,
            DeviceType.NPU,
            PerturbationMode.BIT_NOISE,
        )
        perturbed = layer.add_bit_noise(inputs)
        self.assertEqual(perturbed[0], 4096.0)
        self.assertEqual(perturbed[1], 16777218)
        self.assertEqual(perturbed[2], 1e-38)

    # For an input tensor, the add_noise perturbation adds a small value to
    # the elements that are larger than a tiny threshold.
    def test_add_noise_layer(self):
        api_name = "addnoise.0.forward"
        inputs = torch.as_tensor([1e-1, 1e-2], dtype=torch.bfloat16)
        layer = LayerFactory.create(
            api_name,
            DeviceType.NPU,
            PerturbationMode.ADD_NOISE,
        )
        perturbed = layer.add_noise(inputs)
        self.assertEqual(perturbed[0], 1e-1 + 1e-4)
        self.assertEqual(perturbed[1], 1e-2)
|
|
@@ -1,121 +0,0 @@
|
|
|
1
|
-
from abc import ABC
|
|
2
|
-
from unittest import TestCase
|
|
3
|
-
|
|
4
|
-
import torch
|
|
5
|
-
from msprobe.core.common.const import Const
|
|
6
|
-
from msprobe.pytorch.free_benchmark.common.constant import PreheatConfig, ThresholdConfig
|
|
7
|
-
from msprobe.pytorch.free_benchmark.common.counter import preheat_counter
|
|
8
|
-
from msprobe.pytorch.free_benchmark.common.enums import (
|
|
9
|
-
DeviceType,
|
|
10
|
-
FuzzLevel,
|
|
11
|
-
HandlerType,
|
|
12
|
-
PerturbationMode,
|
|
13
|
-
)
|
|
14
|
-
from msprobe.pytorch.free_benchmark.common.params import DataParams, make_handler_params
|
|
15
|
-
from msprobe.pytorch.free_benchmark.result_handlers.handler_factory import (
|
|
16
|
-
FuzzHandlerFactory,
|
|
17
|
-
)
|
|
18
|
-
|
|
19
|
-
|
|
20
|
-
class Config(ABC):
    """
    Provides the parameter configuration.
    """

    def __init__(self, handler_type, preheat_config):
        # Values supplied by the caller.
        self.handler_type = handler_type
        self.preheat_config = preheat_config
        # Values that are the same for every instance.
        self.fuzz_stage = Const.FORWARD
        self.fuzz_device = DeviceType.NPU
        self.fuzz_level = FuzzLevel.BASE_LEVEL
        self.pert_mode = PerturbationMode.IMPROVE_PRECISION
|
|
31
|
-
|
|
32
|
-
|
|
33
|
-
class TestFuzzHandler(TestCase):

    def setUp(self) -> None:
        origin_inputs = [
            torch.as_tensor([3.01, 3.02], dtype=torch.float16),
            torch.as_tensor([0.02, 0.02], dtype=torch.float16),
        ]
        # Scale the inputs by a factor above the 1.002 error threshold to
        # simulate a deviation showing up in the second execution.
        perturbed_inputs = [
            (tensor * 1.0021).to(torch.float32).to("cpu")
            for tensor in origin_inputs
        ]
        origin_output = torch.add(*origin_inputs)
        perturbed_output = torch.add(*perturbed_inputs)
        # Build a data object whose original and perturbed results disagree.
        self.data_params = DataParams(
            args=origin_inputs,
            kwargs={},
            original_result=origin_output,
            perturbed_result=perturbed_output,
            origin_func=torch.add,
        )
        self.api_name = "add.0.forward"
        self.step = 0

    def _handle_once(self, config, step):
        # Build the handler params, create a handler and run it once on the
        # shared data object; returns (handler, value returned by handle).
        handler_params = make_handler_params(self.api_name, config, step)
        handler = FuzzHandlerFactory.create(handler_params)
        return handler, handler.handle(self.data_params)

    def test_result_handler_check(self):
        # For the check handler, an UnequalRow object is generated when the
        # outputs before and after perturbation are inconsistent.
        # NOTE(review): loop nesting was reconstructed from a flattened
        # listing - confirm the assertion belongs inside the loop.
        for _ in range(2):
            config = Config(
                HandlerType.CHECK,
                {PreheatConfig.IF_PREHEAT: False},
            )
            handler, _ = self._handle_once(config, self.step)
            self.assertEqual(len(handler.get_unequal_rows()), 1)

    def test_result_handler_fix(self):
        # For the fix handler, the perturbed output replaces the original
        # output: the dtype matches the original output while the values are
        # those of the new output.
        config = Config(
            HandlerType.FIX,
            {PreheatConfig.IF_PREHEAT: False},
        )
        _, result = self._handle_once(config, self.step)
        self.assertEqual(result.dtype, torch.float16)
        self.assertEqual(result.device, self.data_params.original_result.device)
        self.assertAlmostEqual(
            result[0],
            self.data_params.perturbed_result.to(torch.float16)[0],
        )
        self.assertAlmostEqual(
            result[1],
            self.data_params.perturbed_result.to(torch.float16)[1],
        )

    def test_result_handler_preheat(self):
        # For the preheat handler, the threshold after the preheat phase is
        # adjusted according to the CPU.
        config = Config(
            HandlerType.CHECK,
            {
                PreheatConfig.IF_PREHEAT: True,
                PreheatConfig.PREHEAT_STEP: 4,
                PreheatConfig.MAX_SAMPLE: 3,
            },
        )
        for _ in range(3):
            self._handle_once(config, 0)
        # preheat_counter shows whether preheat ran properly; the first step
        # records how many times the API was executed.
        self.assertEqual(preheat_counter.get_one_step_used_api("add"), 3)
        # NOTE(review): loop nesting was reconstructed from a flattened
        # listing - confirm the per-step assertions sit inside the outer loop.
        for step in range(1, 4):
            for _ in range(3):
                self._handle_once(config, step)
            # Call time records how often the API was called in this step.
            self.assertEqual(preheat_counter.get_api_called_time("add"), 3)
            # With at most three samples over three steps, exactly one case
            # should be sampled per step.
            self.assertEqual(preheat_counter.get_api_sample_time("add"), 1)
            # During preheat the API threshold should lie between the two
            # threshold hyper-parameters.
            api_threshold = preheat_counter.get_api_thd("add", "torch.float16")
            self.assertLessEqual(
                api_threshold,
                ThresholdConfig.PREHEAT_INITIAL_THD,
            )
            self.assertGreaterEqual(
                api_threshold,
                ThresholdConfig.DTYPE_PER_THD[torch.float16],
            )
|
|
@@ -1,101 +0,0 @@
|
|
|
1
|
-
import functools
|
|
2
|
-
from abc import ABC
|
|
3
|
-
from unittest import TestCase
|
|
4
|
-
|
|
5
|
-
import torch
|
|
6
|
-
import torch.nn as nn
|
|
7
|
-
from msprobe.core.common.const import Const
|
|
8
|
-
from msprobe.pytorch.free_benchmark import FreeBenchmarkCheck
|
|
9
|
-
from msprobe.pytorch.free_benchmark.common.constant import CommonField, PreheatConfig
|
|
10
|
-
from msprobe.pytorch.free_benchmark.common.enums import (
|
|
11
|
-
DeviceType,
|
|
12
|
-
FuzzLevel,
|
|
13
|
-
HandlerType,
|
|
14
|
-
PerturbationMode,
|
|
15
|
-
)
|
|
16
|
-
|
|
17
|
-
|
|
18
|
-
class Config(ABC):
    """
    Provides the parameter configuration.
    """

    def __init__(self, fuzz_stage, handler_type):
        # Values supplied by the caller.
        self.fuzz_stage = fuzz_stage
        self.handler_type = handler_type
        # Values that are the same for every instance; preheat is disabled.
        self.preheat_config = {PreheatConfig.IF_PREHEAT: False}
        self.pert_mode = PerturbationMode.IMPROVE_PRECISION
        self.fuzz_level = FuzzLevel.BASE_LEVEL
        self.fuzz_device = DeviceType.NPU
|
|
30
|
-
|
|
31
|
-
|
|
32
|
-
class WrapMul(nn.Module):
    """
    Wraps the mul operator in an nn.Module; forward calls torch.mul.
    """

    def __init__(self, op_name) -> None:
        super(WrapMul, self).__init__()
        # Stored as given; not used by forward.
        self.op_name = op_name

    def forward(self, *args, **kwargs):
        # All positional and keyword arguments go straight to torch.mul.
        product = torch.mul(*args, **kwargs)
        return product
|
|
43
|
-
|
|
44
|
-
|
|
45
|
-
class UnequalDataProcessor(ABC):
    """
    Interface class that handles detected inconsistent results.
    """

    def __init__(self) -> None:
        super(UnequalDataProcessor, self).__init__()
        # Every value passed to update_unequal_rows, in call order.
        self.unequal_rows = list()

    def update_unequal_rows(self, unequal_rows):
        # The argument is appended as one entry, whatever its type.
        collected = self.unequal_rows
        collected.append(unequal_rows)
|
|
56
|
-
|
|
57
|
-
|
|
58
|
-
class TestInterface(TestCase):
    def setUp(self):
        self.api_name = "Torch.mul.0"

    def testForwardFix(self):
        # For the forward interface, FIX is enabled in the forward hook and
        # the result is handed back as the hook's output.
        config = Config(Const.FORWARD, HandlerType.FIX)
        checker = FreeBenchmarkCheck(config)
        # Run the operator forward.
        lhs = torch.randn(2, 3).to(torch.float16)
        rhs = torch.randn(2, 3).to(torch.float16)
        mul_module = WrapMul(self.api_name)
        forward_output = mul_module(lhs, rhs)
        # Simulate the forward hook calling the free-benchmark forward check.
        result, _ = checker.forward(
            self.api_name,
            mul_module,
            args=(lhs, rhs),
            kwargs={},
            output=forward_output,
        )
        self.assertEqual(result.dtype, torch.float32)

    def testBackwardCheck(self):
        # For the backward interface, the input is stashed at pre-forward
        # time and compared after backward.
        config = Config(Const.BACKWARD, HandlerType.CHECK)
        checker = FreeBenchmarkCheck(config)
        processor = UnequalDataProcessor()
        # Initialise inputs and outputs.
        lhs = torch.tensor([2, 3], dtype=torch.float16, requires_grad=True)
        rhs = torch.tensor([2, 3], dtype=torch.float16, requires_grad=True)
        grad_output = torch.tensor([1, 1], dtype=torch.float16)
        backward_name = Const.SEP.join([self.api_name, Const.BACKWARD])
        # Run pre-forward to create the grad saver instance.
        mul_module = WrapMul(self.api_name)
        checker.pre_forward(backward_name, mul_module, processor, (lhs, rhs), {})
        # Run the operator forward and backward; the perturbed grad_input is
        # obtained during the backward pass.
        forward_output = mul_module(lhs, rhs)
        checker.backward(backward_name, mul_module, grad_output)
        forward_output.backward(torch.ones_like(forward_output))
        # Check that the saver was attached to the module and that the
        # perturbed grad_input produced by the backward hook is correct.
        self.assertTrue(hasattr(mul_module, CommonField.GRADSAVER))
        grad_saver = getattr(mul_module, CommonField.GRADSAVER)
        self.assertEqual(grad_saver.perturbed_grad_input[0][0], 2)
|
|
@@ -1,15 +0,0 @@
|
|
|
1
|
-
import unittest
|
|
2
|
-
|
|
3
|
-
import torch.nn as nn
|
|
4
|
-
from msprobe.pytorch import PrecisionDebugger
|
|
5
|
-
from msprobe.pytorch.functional.dump_module import module_dump, module_count
|
|
6
|
-
|
|
7
|
-
|
|
8
|
-
class TestDumpModule(unittest.TestCase):
    # Checks that module_dump records the given name in module_count.

    def setUp(self):
        # A small linear layer serves as the module under dump.
        self.module = nn.Linear(in_features=8, out_features=4)

    def test_module_dump(self):
        # NOTE(review): "./dump" is relative to the current working directory.
        PrecisionDebugger(dump_path="./dump")
        module_dump(self.module, "TestModule")
        # assertIn reports the missing member and the container on failure,
        # unlike assertTrue(x in y), which only reports "False is not true".
        self.assertIn("TestModule", module_count)
|