PyPI - mindstudio-probe - Versions diffs - 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl - Mend

mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (278) hide show

{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/LICENSE +201 -201
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/METADATA +36 -34
mindstudio_probe-1.1.0.dist-info/RECORD +287 -0
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/entry_points.txt +1 -0
msprobe/README.md +131 -237
msprobe/__init__.py +16 -1
msprobe/{config/config.json → config.json} +47 -49
msprobe/core/advisor/advisor.py +124 -124
msprobe/core/advisor/advisor_const.py +58 -59
msprobe/core/advisor/advisor_result.py +58 -58
msprobe/core/common/const.py +402 -318
msprobe/core/common/exceptions.py +99 -99
msprobe/core/common/{file_check.py → file_utils.py} +523 -283
msprobe/core/common/inplace_op_checker.py +38 -0
msprobe/core/common/inplace_ops.yaml +251 -0
msprobe/core/common/log.py +86 -69
msprobe/core/common/utils.py +371 -616
msprobe/core/common_config.py +78 -71
msprobe/core/compare/acc_compare.py +472 -298
msprobe/core/compare/check.py +180 -95
msprobe/core/compare/compare_cli.py +69 -49
msprobe/core/compare/highlight.py +259 -222
msprobe/core/compare/multiprocessing_compute.py +174 -149
msprobe/core/compare/npy_compare.py +310 -295
msprobe/core/compare/utils.py +464 -429
msprobe/core/data_dump/data_collector.py +153 -144
msprobe/core/data_dump/data_processor/base.py +337 -293
msprobe/core/data_dump/data_processor/factory.py +76 -59
msprobe/core/data_dump/data_processor/mindspore_processor.py +192 -198
msprobe/core/data_dump/data_processor/pytorch_processor.py +383 -389
msprobe/core/data_dump/json_writer.py +117 -116
msprobe/core/data_dump/scope.py +194 -178
msprobe/core/grad_probe/constant.py +74 -70
msprobe/core/grad_probe/grad_compare.py +170 -175
msprobe/core/grad_probe/utils.py +77 -52
msprobe/docs/01.installation.md +99 -0
msprobe/docs/02.config_introduction.md +137 -0
msprobe/docs/03.config_examples.md +237 -0
msprobe/docs/04.acl_config_examples.md +78 -0
msprobe/docs/05.data_dump_PyTorch.md +326 -0
msprobe/docs/06.data_dump_MindSpore.md +285 -0
msprobe/docs/07.accuracy_checker_PyTorch.md +297 -0
msprobe/docs/08.accuracy_checker_online_PyTorch.md +238 -0
msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
msprobe/docs/10.accuracy_compare_PyTorch.md +327 -0
msprobe/docs/11.accuracy_compare_MindSpore.md +333 -0
msprobe/docs/12.overflow_check_PyTorch.md +79 -0
msprobe/docs/13.overflow_check_MindSpore.md +31 -0
msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
msprobe/docs/15.free_benchmarking_PyTorch.md +170 -0
msprobe/docs/16.free_benchmarking_MindSpore.md +140 -0
msprobe/{doc/grad_probe/grad_probe.md → docs/17.grad_probe.md} +205 -207
msprobe/{pytorch/doc/在线精度比对.md → docs/18.online_dispatch.md} +89 -90
msprobe/docs/FAQ.md +189 -0
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/mindspore/__init__.py +2 -1
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +278 -245
msprobe/mindspore/api_accuracy_checker/api_info.py +76 -69
msprobe/mindspore/api_accuracy_checker/api_runner.py +155 -151
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +196 -196
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
msprobe/mindspore/api_accuracy_checker/compute_element.py +238 -223
msprobe/mindspore/api_accuracy_checker/main.py +8 -15
msprobe/mindspore/api_accuracy_checker/type_mapping.py +113 -113
msprobe/mindspore/api_accuracy_checker/utils.py +79 -62
msprobe/mindspore/cell_processor.py +58 -34
msprobe/mindspore/common/const.py +108 -87
msprobe/mindspore/common/log.py +37 -37
msprobe/mindspore/common/utils.py +97 -57
msprobe/mindspore/compare/distributed_compare.py +62 -75
msprobe/mindspore/compare/layer_mapping.py +146 -0
msprobe/mindspore/compare/modify_mapping.py +107 -0
msprobe/mindspore/compare/ms_compare.py +357 -117
msprobe/mindspore/compare/ms_graph_compare.py +364 -317
msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -399
msprobe/mindspore/debugger/debugger_config.py +69 -74
msprobe/mindspore/debugger/precision_debugger.py +150 -107
msprobe/mindspore/dump/dump_tool_factory.py +50 -35
msprobe/mindspore/dump/hook_cell/api_registry.py +128 -104
msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -53
msprobe/mindspore/dump/hook_cell/primitive_hooks.py +206 -0
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +994 -925
msprobe/mindspore/dump/hook_cell/wrap_api.py +121 -0
msprobe/mindspore/dump/jit_dump.py +96 -56
msprobe/mindspore/dump/kernel_graph_dump.py +75 -60
msprobe/mindspore/dump/kernel_kbyk_dump.py +79 -65
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +131 -116
msprobe/mindspore/free_benchmark/common/config.py +27 -12
msprobe/mindspore/free_benchmark/common/handler_params.py +32 -17
msprobe/mindspore/free_benchmark/common/utils.py +85 -71
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -842
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +57 -42
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +122 -107
msprobe/mindspore/free_benchmark/handler/base_handler.py +105 -90
msprobe/mindspore/free_benchmark/handler/check_handler.py +56 -41
msprobe/mindspore/free_benchmark/handler/fix_handler.py +51 -36
msprobe/mindspore/free_benchmark/handler/handler_factory.py +36 -21
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +82 -67
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +36 -21
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +78 -63
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +77 -0
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +49 -34
msprobe/mindspore/free_benchmark/perturbation/no_change.py +27 -12
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +44 -27
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +48 -33
msprobe/mindspore/grad_probe/global_context.py +100 -91
msprobe/mindspore/grad_probe/grad_analyzer.py +231 -231
msprobe/mindspore/grad_probe/grad_monitor.py +27 -27
msprobe/mindspore/grad_probe/grad_stat_csv.py +131 -131
msprobe/mindspore/grad_probe/hook.py +94 -92
msprobe/mindspore/grad_probe/utils.py +29 -28
msprobe/mindspore/ms_config.py +128 -126
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +60 -45
msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +49 -34
msprobe/mindspore/runtime.py +4 -4
msprobe/mindspore/service.py +297 -354
msprobe/mindspore/task_handler_factory.py +24 -24
msprobe/msprobe.py +105 -107
msprobe/pytorch/__init__.py +23 -4
msprobe/pytorch/api_accuracy_checker/common/config.py +70 -55
msprobe/pytorch/api_accuracy_checker/common/utils.py +246 -165
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +230 -213
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +632 -581
msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
msprobe/pytorch/api_accuracy_checker/compare/compare.py +416 -381
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +90 -73
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +265 -244
msprobe/pytorch/api_accuracy_checker/config.yaml +10 -10
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +370 -332
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +221 -199
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +150 -134
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +518 -581
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +213 -74
msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +218 -202
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +370 -324
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +227 -204
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +110 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +244 -218
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/torch_ops_config.yaml +63 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +44 -0
msprobe/pytorch/bench_functions/__init__.py +30 -15
msprobe/pytorch/bench_functions/apply_adam_w.py +43 -28
msprobe/pytorch/bench_functions/confusion_transpose.py +34 -19
msprobe/pytorch/bench_functions/fast_gelu.py +70 -55
msprobe/pytorch/bench_functions/layer_norm_eval.py +21 -6
msprobe/pytorch/bench_functions/linear.py +27 -12
msprobe/pytorch/bench_functions/matmul_backward.py +63 -48
msprobe/pytorch/bench_functions/npu_fusion_attention.py +538 -421
msprobe/pytorch/bench_functions/rms_norm.py +30 -15
msprobe/pytorch/bench_functions/rotary_mul.py +71 -52
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +41 -26
msprobe/pytorch/bench_functions/swiglu.py +70 -55
msprobe/pytorch/common/__init__.py +17 -2
msprobe/pytorch/common/compare_script.template +14 -14
msprobe/pytorch/common/log.py +33 -32
msprobe/pytorch/common/parse_json.py +54 -39
msprobe/pytorch/common/utils.py +310 -300
msprobe/pytorch/compare/distributed_compare.py +66 -66
msprobe/pytorch/compare/mapping.yaml +607 -607
msprobe/pytorch/compare/match.py +49 -33
msprobe/pytorch/compare/pt_compare.py +82 -40
msprobe/pytorch/debugger/debugger_config.py +108 -95
msprobe/pytorch/debugger/precision_debugger.py +173 -125
msprobe/pytorch/free_benchmark/__init__.py +23 -8
msprobe/pytorch/free_benchmark/common/constant.py +70 -70
msprobe/pytorch/free_benchmark/common/counter.py +71 -71
msprobe/pytorch/free_benchmark/common/enums.py +65 -37
msprobe/pytorch/free_benchmark/common/params.py +144 -129
msprobe/pytorch/free_benchmark/common/utils.py +118 -102
msprobe/pytorch/free_benchmark/compare/grad_saver.py +200 -179
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +119 -104
msprobe/pytorch/free_benchmark/main.py +120 -105
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +28 -13
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +56 -41
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +105 -90
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +119 -104
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +87 -63
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +83 -68
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +43 -28
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +60 -45
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +34 -19
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +256 -217
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +54 -39
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +38 -23
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +45 -30
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +185 -170
msprobe/pytorch/function_factory.py +91 -75
msprobe/pytorch/functional/module_dump.py +84 -0
msprobe/pytorch/grad_probe/grad_monitor.py +91 -90
msprobe/pytorch/grad_probe/grad_stat_csv.py +128 -128
msprobe/pytorch/hook_module/__init__.py +16 -1
msprobe/pytorch/hook_module/api_registry.py +166 -161
msprobe/pytorch/hook_module/hook_module.py +118 -120
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1877
msprobe/pytorch/hook_module/utils.py +28 -29
msprobe/pytorch/hook_module/wrap_aten.py +111 -110
msprobe/pytorch/hook_module/wrap_distributed.py +77 -78
msprobe/pytorch/hook_module/wrap_functional.py +104 -105
msprobe/pytorch/hook_module/wrap_npu_custom.py +85 -84
msprobe/pytorch/hook_module/wrap_tensor.py +69 -71
msprobe/pytorch/hook_module/wrap_torch.py +84 -86
msprobe/pytorch/hook_module/wrap_vf.py +60 -62
msprobe/pytorch/module_processer.py +153 -138
msprobe/pytorch/online_dispatch/__init__.py +20 -20
msprobe/pytorch/online_dispatch/compare.py +235 -236
msprobe/pytorch/online_dispatch/dispatch.py +271 -271
msprobe/pytorch/online_dispatch/dump_compare.py +155 -156
msprobe/pytorch/online_dispatch/single_compare.py +391 -391
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +57 -49
msprobe/pytorch/online_dispatch/utils.py +127 -146
msprobe/pytorch/parse.py +19 -4
msprobe/pytorch/parse_tool/cli.py +31 -32
msprobe/pytorch/parse_tool/lib/compare.py +259 -271
msprobe/pytorch/parse_tool/lib/config.py +52 -52
msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +161 -158
msprobe/pytorch/parse_tool/lib/utils.py +320 -321
msprobe/pytorch/parse_tool/lib/visualization.py +85 -91
msprobe/pytorch/pt_config.py +317 -187
msprobe/pytorch/service.py +311 -252
mindstudio_probe-1.0.3.dist-info/RECORD +0 -272
msprobe/config/README.md +0 -539
msprobe/mindspore/doc/compare.md +0 -58
msprobe/mindspore/doc/dump.md +0 -217
msprobe/mindspore/dump/hook_cell/wrap_functional.py +0 -91
msprobe/mindspore/dump/hook_cell/wrap_tensor.py +0 -63
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +0 -10
msprobe/pytorch/doc/FAQ.md +0 -193
msprobe/pytorch/doc/api_accuracy_checker.md +0 -313
msprobe/pytorch/doc/api_accuracy_checker_online.md +0 -187
msprobe/pytorch/doc/dump.md +0 -260
msprobe/pytorch/doc/msprobe/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -182
msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -240
msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
msprobe/pytorch/doc/run_overflow_check.md +0 -25
msprobe/pytorch/doc/无标杆工具场景验证和性能基线报告.md +0 -151
msprobe/pytorch/functional/data_processor.py +0 -0
msprobe/pytorch/functional/dump_module.py +0 -39
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/top_level.txt +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
/msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
/msprobe/{config → docs}/img/free_benchmark.png +0 -0
/msprobe/{doc/grad_probe/img/image-1.png → docs/img/grad_probe_image-1.png} +0 -0
/msprobe/{doc/grad_probe/img/image-2.png → docs/img/grad_probe_image-2.png} +0 -0
/msprobe/{doc/grad_probe/img/image-3.png → docs/img/grad_probe_image-3.png} +0 -0
/msprobe/{doc/grad_probe/img/image-4.png → docs/img/grad_probe_image-4.png} +0 -0
/msprobe/{doc/grad_probe/img/image.png → docs/img/grad_probe_image.png} +0 -0
/msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0

msprobe/mindspore/compare/ms_compare.py CHANGED Viewed

@@ -1,117 +1,357 @@
-import os.path
-from msprobe.core.common.utils import check_compare_param, CompareException, check_configuration_param, \
-    task_dumppath_get, load_yaml, load_npy
-from msprobe.core.common.file_check import create_directory
-from msprobe.core.common.const import Const
-from msprobe.core.common.log import logger
-from msprobe.core.common.exceptions import FileCheckException
-from msprobe.core.compare.acc_compare import Comparator
-from msprobe.core.compare.check import check_struct_match, fuzzy_check_op
-class MSComparator(Comparator):
-    def __init__(self, cell_mapping=None, api_mapping=None):
-        self.frame_name = MSComparator.__name__
-        self.cell_mapping = cell_mapping
-        self.api_mapping = api_mapping
-        self.cross_frame = cell_mapping is not None or api_mapping is not None
-        self.cell_mapping_dict = self.load_mapping_file(self.cell_mapping)
-        self.api_mapping_dict = {}
-        if api_mapping is not None:
-            self.ms_to_pt_mapping = self.load_internal_api()
-    def load_internal_api(self):
-        cur_path = os.path.dirname(os.path.realpath(__file__))
-        yaml_path = os.path.join(cur_path,"ms_to_pt_api.yaml")
-        return load_yaml(yaml_path)
-    def load_mapping_file(self, mapping_file):
-        if isinstance(mapping_file, str):
-            mapping_dict = load_yaml(mapping_file)
-        else:
-            mapping_dict = {}
-        return mapping_dict
-    def process_cell_mapping(self, npu_op_name):
-        npu_op_name = [op_name.replace("Cell", "Module", 1) for op_name in npu_op_name]
-        if self.cell_mapping_dict:
-            for index, op_name in enumerate(npu_op_name):
-                # get cell name & class name from op_name
-                # Cell.fc1.Dense.forward.0.input.0
-                cell_name = op_name.split(Const.SEP, 1)[-1].rsplit(Const.SEP, 4)[0]
-                if cell_name in self.cell_mapping_dict:
-                    npu_op_name[index] = op_name.replace(cell_name, self.cell_mapping_dict[cell_name], 1)
-        return npu_op_name
-    def check_op(self, npu_dict, bench_dict, fuzzy_match):
-        npu_op_name = npu_dict["op_name"].copy()
-        bench_op_name = bench_dict["op_name"].copy()
-        if self.api_mapping is not None:
-            npu_op_name = self.process_api_mapping(npu_op_name, bench_op_name)
-        if self.cell_mapping is not None:
-            npu_op_name = self.process_cell_mapping(npu_op_name)
-        struct_match = check_struct_match(npu_dict, bench_dict, cross_frame=self.cross_frame)
-        if not fuzzy_match:
-            return npu_op_name == bench_op_name and struct_match
-        is_match = True
-        try:
-            is_match = fuzzy_check_op(npu_op_name, bench_op_name)
-        except Exception as err:
-            logger.warning("%s and %s can not fuzzy match." % (npu_op_name, bench_op_name))
-            is_match = False
-        return is_match and struct_match
-    def read_npy_data(self, dir_path, file_name, load_pt_file=False):
-        data_path = os.path.join(dir_path, file_name)
-        if load_pt_file:
-            import torch
-            from msprobe.pytorch.common.utils import load_pt
-            data_value = load_pt(data_path).detach()
-            if data_value.dtype == torch.bfloat16:
-                data_value = data_value.to(torch.float32)
-            data_value = data_value.numpy()
-        else:
-            data_value = load_npy(data_path)
-        return data_value
-    def api_replace(self, npu_op_name, target, para):
-        for idx, _ in enumerate(npu_op_name):
-            npu_op_name[idx] = npu_op_name[idx].replace(target, para)
-        return npu_op_name
-    def process_api_mapping(self, npu_op_name, bench_op_name):
-        # get api name & class name from op_name
-        # Functional.addcmul.0.forward.input.0
-        ms_api_name = npu_op_name[0].rsplit(Const.SEP, 4)[0]
-        pt_api_name = bench_op_name[0].rsplit(Const.SEP, 4)[0]
-        class_name = ms_api_name.split(Const.SEP)[0]
-        if class_name == "Mint":
-            return self.api_replace(npu_op_name, "Mint", "Torch")
-        elif class_name == "MintFunctional":
-            return self.api_replace(npu_op_name, "MintFunctional", "Functional")
-        elif self.ms_to_pt_mapping.get(ms_api_name) == pt_api_name:
-            return self.api_replace(npu_op_name, ms_api_name, pt_api_name)
-        else:
-            return npu_op_name
-def ms_compare(input_param, output_path, **kwargs):
-    try:
-        stack_mode = kwargs.get('stack_mode', False)
-        auto_analyze = kwargs.get('auto_analyze', True)
-        fuzzy_match = kwargs.get('fuzzy_match', False)
-        cell_mapping = kwargs.get('cell_mapping', None)
-        api_mapping = kwargs.get('api_mapping', None)
-        summary_compare, md5_compare = task_dumppath_get(input_param)
-        check_configuration_param(stack_mode, auto_analyze, fuzzy_match)
-        create_directory(output_path)
-        check_compare_param(input_param, output_path, summary_compare, md5_compare)
-    except (CompareException, FileCheckException) as error:
-        logger.error('Compare failed. Please check the arguments and do it again!')
-        raise CompareException(error.code) from error
-    ms_comparator = MSComparator(cell_mapping, api_mapping)
-    ms_comparator.compare_core(input_param, output_path, stack_mode=stack_mode,
-                 auto_analyze=auto_analyze, fuzzy_match=fuzzy_match, summary_compare=summary_compare,
-                 md5_compare=md5_compare)
+import os
+import re
+import copy
+import sys
+from itertools import zip_longest
+from msprobe.core.common.utils import check_compare_param, CompareException, check_configuration_param, \
+    task_dumppath_get, struct_json_get, add_time_with_yaml
+from msprobe.core.common.file_utils import create_directory, load_yaml, load_npy, load_json, save_yaml, FileOpen
+from msprobe.core.common.const import Const, CompareConst
+from msprobe.core.common.log import logger
+from msprobe.core.common.exceptions import FileCheckException
+from msprobe.core.compare.acc_compare import Comparator
+from msprobe.core.compare.check import check_struct_match, fuzzy_check_op
+from msprobe.mindspore.compare.modify_mapping import modify_mapping_with_stack
+from msprobe.mindspore.compare.layer_mapping import get_layer_mapping
+class MSComparator(Comparator):
+    def __init__(self, cell_mapping=None, api_mapping=None, data_mapping=None, is_cross_framework=False):
+        self.frame_name = MSComparator.__name__
+        self.cell_mapping = cell_mapping
+        self.api_mapping = api_mapping
+        self.data_mapping = data_mapping
+        if data_mapping:
+            self.cross_frame = is_cross_framework
+        else:
+            self.cross_frame = cell_mapping is not None or api_mapping is not None
+        self.cell_mapping_dict = self.load_mapping_file(self.cell_mapping)
+        self.api_mapping_dict = self.load_mapping_file(self.api_mapping)
+        if api_mapping is not None:
+            self.ms_to_pt_mapping = self.load_internal_api()
+        if isinstance(self.data_mapping, str) or self.data_mapping is None:
+            self.data_mapping_dict = self.load_mapping_file(self.data_mapping)
+        elif isinstance(self.data_mapping, dict):
+            self.data_mapping_dict = self.data_mapping
+        else:
+            raise TypeError(f"The type of parameter `data_mapping` must be dict, str or None, but got "
+                            f"{type(self.data_mapping)}")
+    def load_internal_api(self):
+        cur_path = os.path.dirname(os.path.realpath(__file__))
+        yaml_path = os.path.join(cur_path, "ms_to_pt_api.yaml")
+        return load_yaml(yaml_path)
+    def load_mapping_file(self, mapping_file):
+        if isinstance(mapping_file, str):
+            mapping_dict = load_yaml(mapping_file)
+        else:
+            mapping_dict = {}
+        return mapping_dict
+    def process_cell_mapping(self, npu_op_name):
+        npu_op_name = [op_name.replace("Cell", "Module", 1) for op_name in npu_op_name]
+        if self.cell_mapping_dict:
+            for index, op_name in enumerate(npu_op_name):
+                # get cell name & class name from op_name
+                # Cell.fc1.Dense.forward.0.input.0
+                cell_name = op_name.split(Const.SEP, 1)[-1].rsplit(Const.SEP, 4)[0]
+                if cell_name in self.cell_mapping_dict:
+                    npu_op_name[index] = op_name.replace(cell_name, self.cell_mapping_dict[cell_name], 1)
+        return npu_op_name
+    def check_op(self, npu_dict, bench_dict, fuzzy_match):
+        npu_dict_new, bench_dict_new = copy.deepcopy(npu_dict), copy.deepcopy(bench_dict)
+        npu_op_name, bench_op_name = npu_dict_new.get(CompareConst.OP_NAME), bench_dict_new.get(CompareConst.OP_NAME)
+        if self.cell_mapping is not None:
+            npu_op_name = self.process_cell_mapping(npu_op_name)
+        if self.api_mapping is not None:
+            npu_op_name = self.process_internal_api_mapping(npu_op_name, bench_op_name)
+            if isinstance(self.api_mapping, str):
+                npu_dict_new, bench_dict_new, target_dict = self.transform_user_mapping_api(npu_dict_new,
+                                                                                            bench_dict_new)
+                if target_dict:
+                    bench_dict = self.reconstitution_bench_dict(npu_dict, copy.deepcopy(bench_dict_new), target_dict)
+                    npu_op_name = npu_dict_new.get(CompareConst.OP_NAME)
+                    bench_op_name = bench_dict_new.get(CompareConst.OP_NAME)
+        struct_match = check_struct_match(npu_dict_new, bench_dict_new, cross_frame=self.cross_frame)
+        if not fuzzy_match:
+            return npu_op_name == bench_op_name and struct_match
+        is_match = True
+        try:
+            is_match = fuzzy_check_op(npu_op_name, bench_op_name)
+        except Exception as err:
+            logger.warning("%s and %s can not fuzzy match." % (npu_op_name, bench_op_name))
+            is_match = False
+        return is_match and struct_match
+    def read_npy_data(self, dir_path, file_name, load_pt_file=False):
+        data_path = os.path.join(dir_path, file_name)
+        if load_pt_file:
+            import torch
+            from msprobe.pytorch.common.utils import load_pt
+            data_value = load_pt(data_path, True).detach()
+            if data_value.dtype == torch.bfloat16:
+                data_value = data_value.to(torch.float32)
+            data_value = data_value.numpy()
+        else:
+            data_value = load_npy(data_path)
+        return data_value
+    def api_replace(self, npu_op_name, target, para):
+        for idx, _ in enumerate(npu_op_name):
+            npu_op_name[idx] = npu_op_name[idx].replace(target, para)
+        return npu_op_name
+    def process_internal_api_mapping(self, npu_op_name, bench_op_name):
+        # get api name & class name from op_name
+        # Functional.addcmul.0.forward.input.0
+        npu_op_name, bench_op_name = npu_op_name.copy(), bench_op_name.copy()
+        ms_api_name = self.get_api_name(npu_op_name[0].split(Const.SEP))
+        pt_api_name = self.get_api_name(bench_op_name[0].split(Const.SEP))
+        class_name = ms_api_name.split(Const.SEP)[0]
+        if class_name == "Mint":
+            return self.api_replace(npu_op_name, "Mint", "Torch")
+        elif class_name == "MintFunctional":
+            return self.api_replace(npu_op_name, "MintFunctional", "Functional")
+        elif self.ms_to_pt_mapping.get(ms_api_name) == pt_api_name:
+            return self.api_replace(npu_op_name, ms_api_name, pt_api_name)
+        else:
+            return npu_op_name
+    def remove_element(self, op_name, struct, summary, idx):
+        del op_name[idx]
+        del struct[idx]
+        del summary[idx]
+    def get_api_name(self, api_list):
+        try:
+            api_name = api_list[0] + Const.SEP + api_list[1]
+        except IndexError as error:
+            logger.error(f'Failed to retrieve API name, please check if the dump data is reasonable')
+            raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR) from error
+        return api_name
+    def transform_user_mapping_api(self, new_npu_dict, new_bench_dict):
+        """
+        Transform user mapping API based on new NPU and benchmark dictionaries.
+        Parameters:
+            new_npu_dict (dict): New NPU operation dictionary.
+            new_bench_dict (dict): New benchmark operation dictionary.
+        Returns:
+            tuple: Updated NPU and benchmark dictionaries, along with the target dictionary.
+        """
+        npu_op_name, bench_op_name = new_npu_dict.get(CompareConst.OP_NAME), new_bench_dict.get(CompareConst.OP_NAME)
+        npu_struct_in = new_npu_dict.get(CompareConst.INPUT_STRUCT)
+        bench_struct_in = new_bench_dict.get(CompareConst.INPUT_STRUCT)
+        npu_struct_out = new_npu_dict.get(CompareConst.OUTPUT_STRUCT)
+        bench_struct_out =  new_bench_dict.get(CompareConst.OUTPUT_STRUCT)
+        npu_summary, bench_summary = new_npu_dict.get(CompareConst.SUMMARY), new_bench_dict.get(CompareConst.SUMMARY)
+        npu_in_len, bench_in_len = len(npu_struct_in), len(bench_struct_in)
+        npu_out_len, bench_out_len = len(npu_struct_out), len(bench_struct_out)
+        ms_api_list, pt_api_list = npu_op_name[0].split(Const.SEP), bench_op_name[0].split(Const.SEP)
+        ms_api_name = self.get_api_name(ms_api_list)
+        pt_api_name = self.get_api_name(pt_api_list)
+        target_dict = {}
+        for api_dict in self.api_mapping_dict:
+            if api_dict.get("pt_api") == pt_api_name and api_dict.get("ms_api") == ms_api_name:
+                ms_user_args_len, pt_user_args_len = len(api_dict.get("ms_args")), len(api_dict.get("pt_args"))
+                ms_user_output_len, pt_user_output_len = len(api_dict.get("ms_output")), len(api_dict.get("pt_output"))
+                if ms_user_args_len != pt_user_args_len or ms_user_output_len != pt_user_output_len:
+                    logger.warning("The user-defined mapping table is incorrect,\
+                        make sure that the number of parameters is equal")
+                    break
+                ms_out_list = api_dict.get("ms_output", [])
+                for idx in reversed(range(npu_out_len)):
+                    if idx not in ms_out_list:
+                        del npu_struct_out[idx]
+                        if idx + npu_in_len < len(npu_summary) and idx + npu_in_len < len(npu_op_name):
+                            del npu_summary[idx + npu_in_len]
+                            del npu_op_name[idx + npu_in_len]
+                pt_out_list = api_dict.get("pt_output", [])
+                for idx in reversed(range(bench_out_len)):
+                    if idx not in pt_out_list:
+                        del bench_struct_out[idx]
+                        if idx + bench_in_len < len(bench_summary) and idx + bench_in_len < len(bench_op_name):
+                            del bench_summary[idx + bench_in_len]
+                            del bench_op_name[idx + bench_in_len]
+                ms_para_list = api_dict.get("ms_args", [])
+                for idx in reversed(range(npu_in_len)):
+                    if idx not in ms_para_list:
+                        self.remove_element(npu_op_name, npu_struct_in, npu_summary, idx)
+                pt_para_list = api_dict.get("pt_args", [])
+                for idx in reversed(range(bench_in_len)):
+                    if idx not in pt_para_list:
+                        self.remove_element(bench_op_name, bench_struct_in, bench_summary, idx)
+                npu_op_name = self.api_replace(npu_op_name, ms_api_name, pt_api_name)
+                npu_op_name = self.para_sequence_update(npu_op_name, bench_op_name)
+                target_dict = api_dict
+                break
+        if target_dict:
+            new_npu_dict.update({CompareConst.OP_NAME: npu_op_name, CompareConst.INPUT_STRUCT: npu_struct_in,
+                                 CompareConst.OUTPUT_STRUCT: npu_struct_out, CompareConst.SUMMARY: npu_summary})
+            new_bench_dict.update({CompareConst.OP_NAME: bench_op_name, CompareConst.INPUT_STRUCT: bench_struct_in,
+                                   CompareConst.OUTPUT_STRUCT: bench_struct_out, CompareConst.SUMMARY: bench_summary})
+        return new_npu_dict, new_bench_dict, target_dict
+    def para_sequence_update(self, npu_op_name, bench_op_name):
+        for idx, _ in enumerate(npu_op_name):
+            bench_op_name_list = bench_op_name[idx].rsplit(Const.SEP, 1)
+            if len(bench_op_name_list) != 0:
+                npu_op_name[idx] = npu_op_name[idx][:-1] + bench_op_name_list[-1]
+        return npu_op_name
+    def reconstitution_bench_dict(self, npu_dict, del_bench_dict, api_dict):
+        ms_user_args_list = api_dict.get("ms_args", [])
+        ms_user_output_list = api_dict.get("ms_output", [])
+        npu_struct_in = npu_dict.get(CompareConst.INPUT_STRUCT)
+        npu_struct_out = npu_dict.get(CompareConst.OUTPUT_STRUCT)
+        npu_in_len = len(npu_struct_in)
+        npu_out_len = len(npu_struct_out)
+        if npu_in_len == len(ms_user_args_list) and npu_out_len == len(ms_user_output_list):
+            return del_bench_dict
+        ms_input_args_list = [i for i in range(npu_in_len)]
+        input_sub_list = list(set(ms_input_args_list) - set(ms_user_args_list))
+        ms_output_args_list = [i for i in range(npu_out_len)]
+        output_sub_list = list(set(ms_output_args_list) - set(ms_user_output_list))
+        bench_op_name = del_bench_dict.get(CompareConst.OP_NAME, [])
+        bench_struct_in = del_bench_dict.get(CompareConst.INPUT_STRUCT, [])
+        bench_struct_out = del_bench_dict.get(CompareConst.OUTPUT_STRUCT, [])
+        bench_summary = del_bench_dict.get(CompareConst.SUMMARY, [])
+        for idx in input_sub_list:  # Fill in the blank value field in the pt dictionary
+            bench_op_name.insert(idx, CompareConst.N_A)
+            bench_struct_in.insert(idx, CompareConst.N_A)
+            bench_summary.insert(idx, CompareConst.N_A)
+        for idx in output_sub_list:  # Fill in the blank value field in the pt dictionary
+            bench_op_name.insert(npu_in_len + idx, CompareConst.N_A)
+            bench_struct_out.insert(idx, CompareConst.N_A)
+            bench_summary.insert(npu_in_len + idx, CompareConst.N_A)
+        del_bench_dict.update({CompareConst.OP_NAME: bench_op_name, CompareConst.INPUT_STRUCT: bench_struct_in,
+                               CompareConst.OUTPUT_STRUCT: bench_struct_out, CompareConst.SUMMARY: bench_summary})
+        return del_bench_dict
+def sort_by_execution_sequence(npu_data, bench_data, mapping_list, flag):
+    def generate_execution_sequence(data):
+        sequence_map = {}
+        for index, item in enumerate(data.keys()):
+            if flag in item:
+                item_split = item.split(Const.SEP)
+                item_name = Const.SEP.join(item_split[0:-2])
+                item_index = item_split[-1]
+                if item_index == 'forward' or item_index == 'backward':
+                    item_index = item_split[-2]
+                item_key = f"{item_name}.{item_index}"
+                sequence_map[item_key] = index
+        return sequence_map
+    npu_map = generate_execution_sequence(npu_data)
+    bench_map = generate_execution_sequence(bench_data)
+    def sort_by_map(item):
+        first_key = npu_map.get(item[0], sys.maxsize)
+        second_key = bench_map.get(item[1], sys.maxsize)
+        return first_key, second_key
+    return sorted(mapping_list, key=sort_by_map)
+def generate_kernel_data(map_value, data, flag):
+    if not map_value:
+        return [], []
+    inputs_name = []
+    outputs_name = []
+    map_split = map_value.split(Const.SEP)
+    map_name = Const.SEP.join(map_split[0:-1])
+    map_index = map_split[-1]
+    for key, value in data.items():
+        if key.find(flag) != -1 and key.find(map_name) != -1:
+            if key.split(Const.SEP)[-1] != map_index and key.split(Const.SEP)[-2] != map_index :
+                continue
+            if flag == 'forward':
+                input_args = value.get('input_args', {})
+            else:
+                input_args = value.get('input', {})
+            output_args = value.get('output', {})
+            for i in range(len(input_args)):
+                inputs_name.append(f"{key}.input.{i}")
+            for i in range(len(output_args)):
+                outputs_name.append(f"{key}.output.{i}")
+    return inputs_name, outputs_name
+def generate_file_mapping(npu_json_path, bench_json_path, mapping_list):
+    npu_data = load_json(npu_json_path).get("data", {})
+    bench_data = load_json(bench_json_path).get("data", {})
+    forward_data = []
+    mapping_list = sort_by_execution_sequence(npu_data, bench_data, mapping_list, Const.FORWARD)
+    for map_value in mapping_list:
+        npu_forward_inputs, npu_backward_outputs = generate_kernel_data(map_value[0], npu_data, "forward")
+        bench_forward_inputs, bench_backward_outputs = generate_kernel_data(map_value[1], bench_data, "forward")
+        inputs_zip = list(zip_longest(npu_forward_inputs, bench_forward_inputs))
+        outputs_zip = list(zip_longest(npu_backward_outputs, bench_backward_outputs))
+        forward_data.extend(inputs_zip)
+        forward_data.extend(outputs_zip)
+    backward_data = []
+    mapping_list = sort_by_execution_sequence(npu_data, bench_data, mapping_list, Const.BACKWARD)
+    for map_value in mapping_list:
+        npu_forward_inputs, npu_backward_outputs = generate_kernel_data(map_value[0], npu_data, "backward")
+        bench_forward_inputs, bench_backward_outputs = generate_kernel_data(map_value[1], bench_data, "backward")
+        inputs_zip = list(zip_longest(npu_forward_inputs, bench_forward_inputs))
+        outputs_zip = list(zip_longest(npu_backward_outputs, bench_backward_outputs))
+        backward_data.extend(inputs_zip)
+        backward_data.extend(outputs_zip)
+    kernel_data = forward_data + backward_data
+    result = {key: value for key, value in kernel_data if key is not None}
+    return result
+def check_cross_framework(bench_json_path):
+    pattern = r'"data_name":\s*"[^"]+\.pt"'
+    with FileOpen(bench_json_path, 'r') as file:
+        for line in file:
+            if re.search(pattern, line):
+                return True
+    return False
+def ms_compare(input_param, output_path, **kwargs):
+    try:
+        stack_mode = kwargs.get('stack_mode', False)
+        auto_analyze = kwargs.get('auto_analyze', True)
+        fuzzy_match = kwargs.get('fuzzy_match', False)
+        cell_mapping = kwargs.get('cell_mapping', None)
+        api_mapping = kwargs.get('api_mapping', None)
+        data_mapping = kwargs.get('data_mapping', None)
+        layer_mapping = kwargs.get('layer_mapping', None)
+        summary_compare, md5_compare = task_dumppath_get(input_param)
+        check_configuration_param(stack_mode, auto_analyze, fuzzy_match, input_param.get('is_print_compare_log', True))
+        create_directory(output_path)
+        check_compare_param(input_param, output_path, summary_compare, md5_compare)
+    except (CompareException, FileCheckException) as error:
+        logger.error('Compare failed. Please check the arguments and do it again!')
+        raise CompareException(error.code) from error
+    if layer_mapping:
+        pt_stack, pt_construct = struct_json_get(input_param, Const.PT_FRAMEWORK)
+        ms_stack, ms_construct = struct_json_get(input_param, Const.MS_FRAMEWORK)
+        mapping = load_yaml(layer_mapping)
+        ms_mapping_result = modify_mapping_with_stack(ms_stack, ms_construct)
+        pt_mapping_result = modify_mapping_with_stack(pt_stack, pt_construct)
+        layer_mapping = get_layer_mapping(ms_mapping_result, pt_mapping_result, mapping)
+        data_mapping = generate_file_mapping(input_param.get("npu_json_path"), input_param.get("bench_json_path"), layer_mapping)
+        data_mapping_name = add_time_with_yaml(f"data_mapping")
+        data_mapping_path = os.path.join(os.path.realpath(output_path), f"{data_mapping_name}")
+        save_yaml(data_mapping_path, data_mapping)
+    is_cross_framework = check_cross_framework(input_param.get("bench_json_path"))
+    ms_comparator = MSComparator(cell_mapping, api_mapping, data_mapping, is_cross_framework)
+    ms_comparator.compare_core(input_param, output_path, stack_mode=stack_mode,
+                 auto_analyze=auto_analyze, fuzzy_match=fuzzy_match, summary_compare=summary_compare,
+                 md5_compare=md5_compare)

mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl

mindstudio-probe 1.0.3py3-none-any.whl → 1.1.0py3-none-any.whl