PyPI - mindstudio-probe - Versions diffs - 1.0.3__py3-none-any.whl → 1.0.4__py3-none-any.whl - Mend

mindstudio-probe 1.0.3__py3-none-any.whl → 1.0.4__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (262) hide show

{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.0.4.dist-info}/LICENSE +201 -201
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.0.4.dist-info}/METADATA +36 -34
mindstudio_probe-1.0.4.dist-info/RECORD +276 -0
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.0.4.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.0.4.dist-info}/entry_points.txt +1 -0
msprobe/README.md +101 -237
msprobe/{config/config.json → config.json} +49 -49
msprobe/core/advisor/advisor.py +124 -124
msprobe/core/advisor/advisor_const.py +59 -59
msprobe/core/advisor/advisor_result.py +58 -58
msprobe/core/common/const.py +341 -318
msprobe/core/common/exceptions.py +99 -99
msprobe/core/common/{file_check.py → file_utils.py} +478 -283
msprobe/core/common/log.py +76 -69
msprobe/core/common/utils.py +385 -616
msprobe/core/common_config.py +85 -71
msprobe/core/compare/acc_compare.py +299 -298
msprobe/core/compare/check.py +95 -95
msprobe/core/compare/compare_cli.py +49 -49
msprobe/core/compare/highlight.py +223 -222
msprobe/core/compare/multiprocessing_compute.py +149 -149
msprobe/core/compare/npy_compare.py +295 -295
msprobe/core/compare/utils.py +430 -429
msprobe/core/data_dump/data_collector.py +154 -144
msprobe/core/data_dump/data_processor/base.py +314 -293
msprobe/core/data_dump/data_processor/factory.py +59 -59
msprobe/core/data_dump/data_processor/mindspore_processor.py +186 -198
msprobe/core/data_dump/data_processor/pytorch_processor.py +366 -389
msprobe/core/data_dump/json_writer.py +96 -116
msprobe/core/data_dump/scope.py +178 -178
msprobe/core/grad_probe/constant.py +70 -70
msprobe/core/grad_probe/grad_compare.py +171 -175
msprobe/core/grad_probe/utils.py +64 -52
msprobe/docs/01.installation.md +89 -0
msprobe/docs/02.config_introduction.md +165 -0
msprobe/docs/03.config_examples.md +247 -0
msprobe/docs/04.acl_config_examples.md +76 -0
msprobe/docs/05.data_dump_PyTorch.md +198 -0
msprobe/docs/06.data_dump_MindSpore.md +243 -0
msprobe/docs/07.accuracy_checker_PyTorch.md +274 -0
msprobe/docs/08.accuracy_checker_online_PyTorch.md +198 -0
msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
msprobe/docs/10.accuracy_compare_PyTorch.md +245 -0
msprobe/docs/11.accuracy_compare_MindSpore.md +202 -0
msprobe/docs/12.overflow_check_PyTorch.md +79 -0
msprobe/docs/13.overflow_check_MindSpore.md +31 -0
msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
msprobe/docs/15.free_benchmarking_PyTorch.md +164 -0
msprobe/{doc/grad_probe/grad_probe.md → docs/17.grad_probe.md} +207 -207
msprobe/docs/FAQ_PyTorch.md +177 -0
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/mindspore/__init__.py +1 -1
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +254 -245
msprobe/mindspore/api_accuracy_checker/api_info.py +69 -69
msprobe/mindspore/api_accuracy_checker/api_runner.py +155 -151
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +196 -196
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
msprobe/mindspore/api_accuracy_checker/compute_element.py +238 -223
msprobe/mindspore/api_accuracy_checker/main.py +8 -15
msprobe/mindspore/api_accuracy_checker/type_mapping.py +113 -113
msprobe/mindspore/api_accuracy_checker/utils.py +79 -62
msprobe/mindspore/cell_processor.py +34 -34
msprobe/mindspore/common/const.py +106 -87
msprobe/mindspore/common/log.py +37 -37
msprobe/mindspore/common/utils.py +81 -57
msprobe/mindspore/compare/distributed_compare.py +75 -75
msprobe/mindspore/compare/ms_compare.py +219 -117
msprobe/mindspore/compare/ms_graph_compare.py +348 -317
msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -399
msprobe/mindspore/debugger/debugger_config.py +66 -74
msprobe/mindspore/debugger/precision_debugger.py +126 -107
msprobe/mindspore/dump/dump_tool_factory.py +35 -35
msprobe/mindspore/dump/hook_cell/api_registry.py +118 -104
msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -53
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +922 -925
msprobe/mindspore/dump/hook_cell/wrap_api.py +113 -0
msprobe/mindspore/dump/jit_dump.py +72 -56
msprobe/mindspore/dump/kernel_graph_dump.py +59 -60
msprobe/mindspore/dump/kernel_kbyk_dump.py +64 -65
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +116 -116
msprobe/mindspore/free_benchmark/common/config.py +12 -12
msprobe/mindspore/free_benchmark/common/handler_params.py +17 -17
msprobe/mindspore/free_benchmark/common/utils.py +71 -71
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -842
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +43 -42
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +107 -107
msprobe/mindspore/free_benchmark/handler/base_handler.py +90 -90
msprobe/mindspore/free_benchmark/handler/check_handler.py +41 -41
msprobe/mindspore/free_benchmark/handler/fix_handler.py +36 -36
msprobe/mindspore/free_benchmark/handler/handler_factory.py +21 -21
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +67 -67
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +21 -21
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +63 -63
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +51 -0
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +35 -34
msprobe/mindspore/free_benchmark/perturbation/no_change.py +12 -12
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +29 -27
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +33 -33
msprobe/mindspore/grad_probe/global_context.py +90 -91
msprobe/mindspore/grad_probe/grad_analyzer.py +231 -231
msprobe/mindspore/grad_probe/grad_monitor.py +27 -27
msprobe/mindspore/grad_probe/grad_stat_csv.py +131 -131
msprobe/mindspore/grad_probe/hook.py +94 -92
msprobe/mindspore/grad_probe/utils.py +29 -28
msprobe/mindspore/ms_config.py +128 -126
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +44 -45
msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +34 -34
msprobe/mindspore/runtime.py +4 -4
msprobe/mindspore/service.py +378 -354
msprobe/mindspore/task_handler_factory.py +24 -24
msprobe/msprobe.py +105 -107
msprobe/pytorch/__init__.py +3 -3
msprobe/pytorch/api_accuracy_checker/common/config.py +53 -55
msprobe/pytorch/api_accuracy_checker/common/utils.py +214 -165
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +213 -213
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +606 -581
msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
msprobe/pytorch/api_accuracy_checker/compare/compare.py +386 -381
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +73 -73
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +245 -244
msprobe/pytorch/api_accuracy_checker/config.yaml +10 -10
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +335 -332
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +200 -199
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +133 -134
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +592 -581
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +70 -74
msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +197 -202
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +325 -324
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +204 -204
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +219 -218
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +10 -10
msprobe/pytorch/bench_functions/__init__.py +15 -15
msprobe/pytorch/bench_functions/apply_adam_w.py +28 -28
msprobe/pytorch/bench_functions/confusion_transpose.py +19 -19
msprobe/pytorch/bench_functions/fast_gelu.py +55 -55
msprobe/pytorch/bench_functions/layer_norm_eval.py +6 -6
msprobe/pytorch/bench_functions/linear.py +12 -12
msprobe/pytorch/bench_functions/matmul_backward.py +48 -48
msprobe/pytorch/bench_functions/npu_fusion_attention.py +509 -421
msprobe/pytorch/bench_functions/rms_norm.py +15 -15
msprobe/pytorch/bench_functions/rotary_mul.py +52 -52
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +26 -26
msprobe/pytorch/bench_functions/swiglu.py +55 -55
msprobe/pytorch/common/__init__.py +2 -2
msprobe/pytorch/common/compare_script.template +14 -14
msprobe/pytorch/common/log.py +20 -31
msprobe/pytorch/common/parse_json.py +39 -39
msprobe/pytorch/common/utils.py +305 -300
msprobe/pytorch/compare/distributed_compare.py +66 -66
msprobe/pytorch/compare/mapping.yaml +607 -607
msprobe/pytorch/compare/match.py +34 -33
msprobe/pytorch/compare/pt_compare.py +50 -40
msprobe/pytorch/debugger/debugger_config.py +95 -95
msprobe/pytorch/debugger/precision_debugger.py +125 -125
msprobe/pytorch/free_benchmark/__init__.py +8 -8
msprobe/pytorch/free_benchmark/common/constant.py +70 -70
msprobe/pytorch/free_benchmark/common/counter.py +71 -71
msprobe/pytorch/free_benchmark/common/enums.py +37 -37
msprobe/pytorch/free_benchmark/common/params.py +129 -129
msprobe/pytorch/free_benchmark/common/utils.py +102 -102
msprobe/pytorch/free_benchmark/compare/grad_saver.py +179 -179
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +104 -104
msprobe/pytorch/free_benchmark/main.py +105 -105
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +13 -13
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +41 -41
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +90 -90
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +104 -104
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +63 -63
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +68 -68
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +28 -28
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +45 -45
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +19 -19
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +217 -217
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +39 -39
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +23 -23
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +30 -30
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +170 -170
msprobe/pytorch/function_factory.py +76 -75
msprobe/pytorch/functional/dump_module.py +39 -39
msprobe/pytorch/grad_probe/grad_monitor.py +91 -90
msprobe/pytorch/grad_probe/grad_stat_csv.py +128 -128
msprobe/pytorch/hook_module/api_registry.py +161 -161
msprobe/pytorch/hook_module/hook_module.py +120 -120
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1877
msprobe/pytorch/hook_module/utils.py +30 -29
msprobe/pytorch/hook_module/wrap_aten.py +110 -110
msprobe/pytorch/hook_module/wrap_distributed.py +78 -78
msprobe/pytorch/hook_module/wrap_functional.py +105 -105
msprobe/pytorch/hook_module/wrap_npu_custom.py +93 -84
msprobe/pytorch/hook_module/wrap_tensor.py +71 -71
msprobe/pytorch/hook_module/wrap_torch.py +86 -86
msprobe/pytorch/hook_module/wrap_vf.py +62 -62
msprobe/pytorch/module_processer.py +138 -138
msprobe/pytorch/online_dispatch/__init__.py +20 -20
msprobe/pytorch/online_dispatch/compare.py +236 -236
msprobe/pytorch/online_dispatch/dispatch.py +271 -271
msprobe/pytorch/online_dispatch/dump_compare.py +155 -156
msprobe/pytorch/online_dispatch/single_compare.py +391 -391
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +49 -49
msprobe/pytorch/online_dispatch/utils.py +130 -146
msprobe/pytorch/parse.py +4 -4
msprobe/pytorch/parse_tool/cli.py +32 -32
msprobe/pytorch/parse_tool/lib/compare.py +260 -271
msprobe/pytorch/parse_tool/lib/config.py +52 -52
msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +158 -158
msprobe/pytorch/parse_tool/lib/utils.py +316 -321
msprobe/pytorch/parse_tool/lib/visualization.py +85 -91
msprobe/pytorch/pt_config.py +188 -187
msprobe/pytorch/service.py +246 -252
mindstudio_probe-1.0.3.dist-info/RECORD +0 -272
msprobe/config/README.md +0 -539
msprobe/mindspore/doc/compare.md +0 -58
msprobe/mindspore/doc/dump.md +0 -217
msprobe/mindspore/dump/hook_cell/wrap_functional.py +0 -91
msprobe/mindspore/dump/hook_cell/wrap_tensor.py +0 -63
msprobe/pytorch/doc/FAQ.md +0 -193
msprobe/pytorch/doc/api_accuracy_checker.md +0 -313
msprobe/pytorch/doc/api_accuracy_checker_online.md +0 -187
msprobe/pytorch/doc/dump.md +0 -260
msprobe/pytorch/doc/msprobe精度工具数据dump标准性能基线报告.md +0 -182
msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -240
msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
msprobe/pytorch/doc/run_overflow_check.md +0 -25
msprobe/pytorch/doc/在线精度比对.md +0 -90
msprobe/pytorch/doc/无标杆工具场景验证和性能基线报告.md +0 -151
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.0.4.dist-info}/top_level.txt +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
/msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
/msprobe/{config → docs}/img/free_benchmark.png +0 -0
/msprobe/{doc/grad_probe/img/image-1.png → docs/img/grad_probe_image-1.png} +0 -0
/msprobe/{doc/grad_probe/img/image-2.png → docs/img/grad_probe_image-2.png} +0 -0
/msprobe/{doc/grad_probe/img/image-3.png → docs/img/grad_probe_image-3.png} +0 -0
/msprobe/{doc/grad_probe/img/image-4.png → docs/img/grad_probe_image-4.png} +0 -0
/msprobe/{doc/grad_probe/img/image.png → docs/img/grad_probe_image.png} +0 -0
/msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0

msprobe/pytorch/free_benchmark/common/constant.py CHANGED Viewed

@@ -1,70 +1,70 @@
-from typing import Dict
-import numpy as np
-import torch
-from msprobe.pytorch.free_benchmark.common.enums import FuzzThreshold
-from msprobe.pytorch.free_benchmark.common.params import BenchmarkThd
-class CommonField:
-    DEVICE = "device"
-    META = "meta"
-    FUZZ_TENSOR = "fuzz_tensor"
-    REQUIRES_GRAD = "requires_grad"
-    HOLD_PLACE = "hold_place"
-    DISTRIBUTED_OP = "torch.distributed"
-    GRADSAVER = "grad_saver"
-class ThresholdConfig:
-    PERTURBATION_VALUE_DICT: Dict = {
-        torch.bfloat16: FuzzThreshold.BF16_THD,
-        torch.float16: FuzzThreshold.F16_THD,
-        torch.float32: FuzzThreshold.F32_THD,
-        torch.float64: FuzzThreshold.F64_THD,
-    }
-    ABS_TOL_VALUE_DICT: Dict = {
-        torch.bfloat16: FuzzThreshold.BF16_THD,
-        torch.float16: FuzzThreshold.F16_THD,
-        torch.float32: FuzzThreshold.F32_THD,
-        torch.float64: FuzzThreshold.F64_THD,
-    }
-    # bit翻转需要匹配到等长或更长的整型
-    PERTURBATION_BIT_DICT = {
-        torch.bfloat16: torch.int16,
-        torch.float16: torch.int16,
-        torch.float32: torch.int32,
-        torch.float64: torch.int64,
-    }
-    # 输入噪声下界
-    NOISE_INPUT_LOWER_BOUND = 1e-8
-    COMP_CONSISTENT = 1.0
-    COMP_NAN = np.nan
-    SYMBOL_FLIPPING = "symbol_flipping"
-    BACKWARD_OUTPUT_LOWER_BOUND = 1e-3
-    SMALL_VALUE = 1.0
-    # 预热初始阈值
-    PREHEAT_INITIAL_THD = 2.05
-    API_THD_STEP = 2.0
-    DTYPE_PER_THD = {
-        torch.float16: 1.002,
-        torch.bfloat16: 1.004,
-        torch.float32: 1.0002,
-    }
-    BENCHMARK_THD_DICT = {
-        torch.float32: BenchmarkThd(2**-14, 1.0, 2**-14, 1e-4),
-        torch.float16: BenchmarkThd(2**-11, 1.0, 2**-11, 1e-4),
-        torch.bfloat16: BenchmarkThd(2**-8, 1.0, 2**-8, 1e-4),
-    }
-    TENSOR_SPLIT_MAX_CHUNK = 128
-class PreheatConfig:
-    IF_PREHEAT = "if_preheat"
-    PREHEAT_STEP = "preheat_step"
-    MAX_SAMPLE = "max_sample"
+from typing import Dict
+import numpy as np
+import torch
+from msprobe.pytorch.free_benchmark.common.enums import FuzzThreshold
+from msprobe.pytorch.free_benchmark.common.params import BenchmarkThd
+class CommonField:
+    DEVICE = "device"
+    META = "meta"
+    FUZZ_TENSOR = "fuzz_tensor"
+    REQUIRES_GRAD = "requires_grad"
+    HOLD_PLACE = "hold_place"
+    DISTRIBUTED_OP = "torch.distributed"
+    GRADSAVER = "grad_saver"
+class ThresholdConfig:
+    PERTURBATION_VALUE_DICT: Dict = {
+        torch.bfloat16: FuzzThreshold.BF16_THD,
+        torch.float16: FuzzThreshold.F16_THD,
+        torch.float32: FuzzThreshold.F32_THD,
+        torch.float64: FuzzThreshold.F64_THD,
+    }
+    ABS_TOL_VALUE_DICT: Dict = {
+        torch.bfloat16: FuzzThreshold.BF16_THD,
+        torch.float16: FuzzThreshold.F16_THD,
+        torch.float32: FuzzThreshold.F32_THD,
+        torch.float64: FuzzThreshold.F64_THD,
+    }
+    # bit翻转需要匹配到等长或更长的整型
+    PERTURBATION_BIT_DICT = {
+        torch.bfloat16: torch.int16,
+        torch.float16: torch.int16,
+        torch.float32: torch.int32,
+        torch.float64: torch.int64,
+    }
+    # 输入噪声下界
+    NOISE_INPUT_LOWER_BOUND = 1e-8
+    COMP_CONSISTENT = 1.0
+    COMP_NAN = np.nan
+    SYMBOL_FLIPPING = "symbol_flipping"
+    BACKWARD_OUTPUT_LOWER_BOUND = 1e-3
+    SMALL_VALUE = 1.0
+    # 预热初始阈值
+    PREHEAT_INITIAL_THD = 2.05
+    API_THD_STEP = 2.0
+    DTYPE_PER_THD = {
+        torch.float16: 1.002,
+        torch.bfloat16: 1.004,
+        torch.float32: 1.0002,
+    }
+    BENCHMARK_THD_DICT = {
+        torch.float32: BenchmarkThd(2**-14, 1.0, 2**-14, 1e-4),
+        torch.float16: BenchmarkThd(2**-11, 1.0, 2**-11, 1e-4),
+        torch.bfloat16: BenchmarkThd(2**-8, 1.0, 2**-8, 1e-4),
+    }
+    TENSOR_SPLIT_MAX_CHUNK = 128
+class PreheatConfig:
+    IF_PREHEAT = "if_preheat"
+    PREHEAT_STEP = "preheat_step"
+    MAX_SAMPLE = "max_sample"

msprobe/pytorch/free_benchmark/common/counter.py CHANGED Viewed

@@ -1,72 +1,72 @@
-from collections import defaultdict
-from msprobe.pytorch.free_benchmark.common.constant import ThresholdConfig
-class PreheatCounter:
-    def __init__(self) -> None:
-        self.api_called_time: dict = defaultdict(int)
-        self.api_sample_time: dict = defaultdict(int)
-        self.one_step_used_api: dict = defaultdict(int)
-        self.api_thd: dict = defaultdict(dict)
-        self.preheat_record: dict = defaultdict(dict)
-        self.dtype_map: dict = {}
-        self.if_preheat: dict = defaultdict(dict)
-        self.step = 0
-    def clear_step(self):
-        self.preheat_record.clear()
-        self.api_called_time.clear()
-        self.api_sample_time.clear()
-    def check_step(self, current_step):
-        if current_step != self.step:
-            self.clear_step()
-            self.step = current_step
-    def add_api_called_time(self, api_name: str):
-        self.api_called_time[api_name] += 1
-    def get_api_called_time(self, api_name: str) -> int:
-        return self.api_called_time[api_name]
-    def add_api_sample_time(self, api_name: str):
-        self.api_sample_time[api_name] += 1
-    def get_api_sample_time(self, api_name: str) -> int:
-        return self.api_sample_time[api_name]
-    def add_one_step_used_api(self, api_name: str):
-        self.one_step_used_api[api_name] += 1
-    def get_one_step_used_api(self, api_name: str):
-        return self.one_step_used_api[api_name]
-    def update_preheat_record(self, api_name, dtype, cmp_result):
-        # 记录预热阶段CPU标杆比对的结果
-        if str(dtype) not in self.preheat_record[api_name].keys():
-            self.preheat_record[api_name][str(dtype)] = list()
-        self.preheat_record[api_name][str(dtype)].append(cmp_result)
-        self.dtype_map[str(dtype)] = dtype
-    def update_api_thd(self, api_name, dtype, threshold, dthreshold):
-        self.api_thd[api_name][str(dtype)] = (
-            threshold if threshold > dthreshold else dthreshold
-        )
-    def get_api_thd(self, api_name, dtype):
-        if not str(dtype) in self.api_thd[api_name]:
-            self.api_thd[api_name][str(dtype)] = ThresholdConfig.PREHEAT_INITIAL_THD
-            self.dtype_map[str(dtype)] = dtype
-        return self.api_thd[api_name][str(dtype)]
-    def set_api_preheat(self, api_name, dtype_str, is_preheat=True):
-        # 标记cpu不一致的dtype 不再进行预热
-        self.if_preheat[api_name][dtype_str] = is_preheat
-    def get_api_preheat(self, api_name, dtype):
-        # 标记cpu不一致的dtype 不再进行预热
-        if str(dtype) not in self.if_preheat[api_name]:
-            return True
-        return self.if_preheat[api_name][str(dtype)]
+from collections import defaultdict
+from msprobe.pytorch.free_benchmark.common.constant import ThresholdConfig
+class PreheatCounter:
+    def __init__(self) -> None:
+        self.api_called_time: dict = defaultdict(int)
+        self.api_sample_time: dict = defaultdict(int)
+        self.one_step_used_api: dict = defaultdict(int)
+        self.api_thd: dict = defaultdict(dict)
+        self.preheat_record: dict = defaultdict(dict)
+        self.dtype_map: dict = {}
+        self.if_preheat: dict = defaultdict(dict)
+        self.step = 0
+    def clear_step(self):
+        self.preheat_record.clear()
+        self.api_called_time.clear()
+        self.api_sample_time.clear()
+    def check_step(self, current_step):
+        if current_step != self.step:
+            self.clear_step()
+            self.step = current_step
+    def add_api_called_time(self, api_name: str):
+        self.api_called_time[api_name] += 1
+    def get_api_called_time(self, api_name: str) -> int:
+        return self.api_called_time[api_name]
+    def add_api_sample_time(self, api_name: str):
+        self.api_sample_time[api_name] += 1
+    def get_api_sample_time(self, api_name: str) -> int:
+        return self.api_sample_time[api_name]
+    def add_one_step_used_api(self, api_name: str):
+        self.one_step_used_api[api_name] += 1
+    def get_one_step_used_api(self, api_name: str):
+        return self.one_step_used_api[api_name]
+    def update_preheat_record(self, api_name, dtype, cmp_result):
+        # 记录预热阶段CPU标杆比对的结果
+        if str(dtype) not in self.preheat_record[api_name].keys():
+            self.preheat_record[api_name][str(dtype)] = list()
+        self.preheat_record[api_name][str(dtype)].append(cmp_result)
+        self.dtype_map[str(dtype)] = dtype
+    def update_api_thd(self, api_name, dtype, threshold, dthreshold):
+        self.api_thd[api_name][str(dtype)] = (
+            threshold if threshold > dthreshold else dthreshold
+        )
+    def get_api_thd(self, api_name, dtype):
+        if not str(dtype) in self.api_thd[api_name]:
+            self.api_thd[api_name][str(dtype)] = ThresholdConfig.PREHEAT_INITIAL_THD
+            self.dtype_map[str(dtype)] = dtype
+        return self.api_thd[api_name][str(dtype)]
+    def set_api_preheat(self, api_name, dtype_str, is_preheat=True):
+        # 标记cpu不一致的dtype 不再进行预热
+        self.if_preheat[api_name][dtype_str] = is_preheat
+    def get_api_preheat(self, api_name, dtype):
+        # 标记cpu不一致的dtype 不再进行预热
+        if str(dtype) not in self.if_preheat[api_name]:
+            return True
+        return self.if_preheat[api_name][str(dtype)]
 preheat_counter = PreheatCounter()

msprobe/pytorch/free_benchmark/common/enums.py CHANGED Viewed

@@ -1,37 +1,37 @@
-class PerturbationMode:
-    ADD_NOISE = "add_noise"
-    CHANGE_VALUE = "change_value"
-    IMPROVE_PRECISION = "improve_precision"
-    NO_CHANGE = "no_change"
-    BIT_NOISE = "bit_noise"
-    TO_CPU = "to_cpu"
-class DeviceType:
-    NPU = "npu"
-    CPU = "cpu"
-class FuzzThreshold:
-    BF16_THD = 1e-4
-    F16_THD = 1e-6
-    F32_THD = 1e-8
-    F64_THD = 1e-16
-class NormType:
-    ONE_NORM = (1, "one_norm")
-    TWO_NORM = (2, "two_norm")
-    ENDLESS_NORM = (3, "endless_norm")
-class HandlerType:
-    CHECK = "check"
-    PREHEAT = "preheat"
-    FIX = "fix"
-class FuzzLevel:
-    BASE_LEVEL = "L1"
-    ADV_LEVEL = "L2"
-    REAL_LEVEL = "L3"
+class PerturbationMode:
+    ADD_NOISE = "add_noise"
+    CHANGE_VALUE = "change_value"
+    IMPROVE_PRECISION = "improve_precision"
+    NO_CHANGE = "no_change"
+    BIT_NOISE = "bit_noise"
+    TO_CPU = "to_cpu"
+class DeviceType:
+    NPU = "npu"
+    CPU = "cpu"
+class FuzzThreshold:
+    BF16_THD = 1e-4
+    F16_THD = 1e-6
+    F32_THD = 1e-8
+    F64_THD = 1e-16
+class NormType:
+    ONE_NORM = (1, "one_norm")
+    TWO_NORM = (2, "two_norm")
+    ENDLESS_NORM = (3, "endless_norm")
+class HandlerType:
+    CHECK = "check"
+    PREHEAT = "preheat"
+    FIX = "fix"
+class FuzzLevel:
+    BASE_LEVEL = "L1"
+    ADV_LEVEL = "L2"
+    REAL_LEVEL = "L3"

msprobe/pytorch/free_benchmark/common/params.py CHANGED Viewed

@@ -1,129 +1,129 @@
-from dataclasses import dataclass
-from typing import Any, Callable, Dict, List, Optional, Tuple
-import torch
-from msprobe.pytorch.free_benchmark import logger
-from msprobe.pytorch.free_benchmark.common.enums import (
-    DeviceType,
-    FuzzLevel,
-    PerturbationMode,
-)
-from msprobe.pytorch.free_benchmark.common.utils import Tools
-@dataclass
-class DataParams:
-    args: Optional[Tuple] = None
-    kwargs: Optional[Dict] = None
-    valid_input_index: Optional[int] = None
-    original_result: Optional[Any] = None
-    perturbed_result: Optional[Any] = None
-    is_consistent: Optional[bool] = True
-    perturbed_value: Optional[Any] = None
-    origin_func: Optional[Callable] = None
-    api_type: Optional[str] = None
-    fuzz_stage: Optional[str] = None
-    grad_unequal_flag: Optional[bool] = True
-@dataclass
-class HandlerParams:
-    handler_type: Optional[str] = None
-    api_name: Optional[str] = None
-    pert_mode: Optional[PerturbationMode] = None
-    step: Optional[int] = None
-    fuzz_stage: Optional[str] = None
-    fuzz_device: Optional[DeviceType] = None
-    preheat_config: Optional[Dict] = None
-    fuzz_level: Optional[str] = None
-@dataclass
-class UnequalRow:
-    rank: Optional[int] = None
-    pert_mode: Optional[PerturbationMode] = None
-    stage: Optional[str] = None
-    step: Optional[int] = None
-    api_name: Optional[str] = None
-    max_rel: Optional[float] = None
-    dtype: Optional[str] = None
-    shape: Optional[str] = None
-    output_index: Optional[int] = None
-@dataclass
-class BenchmarkThd:
-    rtol: Optional[float] = None  # 相对误差阈值
-    small_value: Optional[float] = None  # 小值域
-    small_value_atol: Optional[float] = None  # 小值域绝对阈值
-    err_balance: Optional[float] = None  # 误差均衡性
-def check_args_type(args: Tuple) -> int:
-    for i, arg in enumerate(args):
-        if torch.is_tensor(arg):
-            if arg.is_meta:
-                continue
-            if not torch.is_floating_point(arg):
-                continue
-            return i
-        if isinstance(arg, (List, Tuple, Dict)):
-            return i
-    return -1
-def data_pre_deal(name, func, args, kwargs):
-    data_params = DataParams(args=args, kwargs=kwargs, origin_func=func)
-    index = check_args_type(args)
-    data_params.valid_input_index = index
-    if index == -1:
-        logger.warning_on_rank_0(
-            f"[msprobe] Free benchmark: 无标杆工具不支持当前算子的输入类型 {name}."
-        )
-    return data_params
-def make_handler_params(name, config, step):
-    handler_params = HandlerParams()
-    handler_params.api_name = name
-    handler_params.step = step
-    handler_params.handler_type = config.handler_type
-    handler_params.fuzz_stage = config.fuzz_stage
-    handler_params.fuzz_device = config.fuzz_device
-    handler_params.preheat_config = config.preheat_config
-    handler_params.fuzz_level = config.fuzz_level
-    handler_params.pert_mode = config.pert_mode
-    return handler_params
-def make_unequal_row(
-    data_params: DataParams,
-    handle_params: HandlerParams,
-    ratio: float = None,
-    index: int = None,
-):
-    row = UnequalRow(
-        api_name=handle_params.api_name,
-        pert_mode=handle_params.pert_mode,
-        output_index=index,
-        stage=handle_params.fuzz_stage,
-        step=handle_params.step,
-    )
-    if isinstance(ratio, float):
-        row.max_rel = ratio - 1
-    origin_tensor = data_params.original_result
-    perturbed_tensor = data_params.perturbed_result
-    if index:
-        origin_tensor = origin_tensor[index]
-        perturbed_tensor = perturbed_tensor[index]
-        row.output_index = index
-    if isinstance(origin_tensor, torch.Tensor):
-        row.dtype = origin_tensor.dtype
-        row.shape = origin_tensor.shape
-    row.rank = Tools.get_dist_rank()
-    # 以下暂不支持
-    if handle_params.fuzz_level == FuzzLevel.ADV_LEVEL:
-        pass
-    if handle_params.fuzz_level == FuzzLevel.REAL_LEVEL:
-        pass
-    return row
+from dataclasses import dataclass
+from typing import Any, Callable, Dict, List, Optional, Tuple
+import torch
+from msprobe.pytorch.free_benchmark import logger
+from msprobe.pytorch.free_benchmark.common.enums import (
+    DeviceType,
+    FuzzLevel,
+    PerturbationMode,
+)
+from msprobe.pytorch.free_benchmark.common.utils import Tools
+@dataclass
+class DataParams:
+    args: Optional[Tuple] = None
+    kwargs: Optional[Dict] = None
+    valid_input_index: Optional[int] = None
+    original_result: Optional[Any] = None
+    perturbed_result: Optional[Any] = None
+    is_consistent: Optional[bool] = True
+    perturbed_value: Optional[Any] = None
+    origin_func: Optional[Callable] = None
+    api_type: Optional[str] = None
+    fuzz_stage: Optional[str] = None
+    grad_unequal_flag: Optional[bool] = True
+@dataclass
+class HandlerParams:
+    handler_type: Optional[str] = None
+    api_name: Optional[str] = None
+    pert_mode: Optional[PerturbationMode] = None
+    step: Optional[int] = None
+    fuzz_stage: Optional[str] = None
+    fuzz_device: Optional[DeviceType] = None
+    preheat_config: Optional[Dict] = None
+    fuzz_level: Optional[str] = None
+@dataclass
+class UnequalRow:
+    rank: Optional[int] = None
+    pert_mode: Optional[PerturbationMode] = None
+    stage: Optional[str] = None
+    step: Optional[int] = None
+    api_name: Optional[str] = None
+    max_rel: Optional[float] = None
+    dtype: Optional[str] = None
+    shape: Optional[str] = None
+    output_index: Optional[int] = None
+@dataclass
+class BenchmarkThd:
+    rtol: Optional[float] = None  # 相对误差阈值
+    small_value: Optional[float] = None  # 小值域
+    small_value_atol: Optional[float] = None  # 小值域绝对阈值
+    err_balance: Optional[float] = None  # 误差均衡性
+def check_args_type(args: Tuple) -> int:
+    for i, arg in enumerate(args):
+        if torch.is_tensor(arg):
+            if arg.is_meta:
+                continue
+            if not torch.is_floating_point(arg):
+                continue
+            return i
+        if isinstance(arg, (List, Tuple, Dict)):
+            return i
+    return -1
+def data_pre_deal(name, func, args, kwargs):
+    data_params = DataParams(args=args, kwargs=kwargs, origin_func=func)
+    index = check_args_type(args)
+    data_params.valid_input_index = index
+    if index == -1:
+        logger.warning_on_rank_0(
+            f"[msprobe] Free benchmark: 无标杆工具不支持当前算子的输入类型 {name}."
+        )
+    return data_params
+def make_handler_params(name, config, step):
+    handler_params = HandlerParams()
+    handler_params.api_name = name
+    handler_params.step = step
+    handler_params.handler_type = config.handler_type
+    handler_params.fuzz_stage = config.fuzz_stage
+    handler_params.fuzz_device = config.fuzz_device
+    handler_params.preheat_config = config.preheat_config
+    handler_params.fuzz_level = config.fuzz_level
+    handler_params.pert_mode = config.pert_mode
+    return handler_params
+def make_unequal_row(
+    data_params: DataParams,
+    handle_params: HandlerParams,
+    ratio: float = None,
+    index: int = None,
+):
+    row = UnequalRow(
+        api_name=handle_params.api_name,
+        pert_mode=handle_params.pert_mode,
+        output_index=index,
+        stage=handle_params.fuzz_stage,
+        step=handle_params.step,
+    )
+    if isinstance(ratio, float):
+        row.max_rel = ratio - 1
+    origin_tensor = data_params.original_result
+    perturbed_tensor = data_params.perturbed_result
+    if index:
+        origin_tensor = origin_tensor[index]
+        perturbed_tensor = perturbed_tensor[index]
+        row.output_index = index
+    if isinstance(origin_tensor, torch.Tensor):
+        row.dtype = origin_tensor.dtype
+        row.shape = origin_tensor.shape
+    row.rank = Tools.get_dist_rank()
+    # 以下暂不支持
+    if handle_params.fuzz_level == FuzzLevel.ADV_LEVEL:
+        pass
+    if handle_params.fuzz_level == FuzzLevel.REAL_LEVEL:
+        pass
+    return row

mindstudio-probe 1.0.3__py3-none-any.whl → 1.0.4__py3-none-any.whl

mindstudio-probe 1.0.3__py3-none-any.whl → 1.0.4__py3-none-any.whl