PyPI - mindstudio-probe - Versions diffs - 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl - Mend

mindstudio-probe 1.0.3py3-none-any.whl → 1.1.0py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (278) hide show

{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/LICENSE +201 -201
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/METADATA +36 -34
mindstudio_probe-1.1.0.dist-info/RECORD +287 -0
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/entry_points.txt +1 -0
msprobe/README.md +131 -237
msprobe/__init__.py +16 -1
msprobe/{config/config.json → config.json} +47 -49
msprobe/core/advisor/advisor.py +124 -124
msprobe/core/advisor/advisor_const.py +58 -59
msprobe/core/advisor/advisor_result.py +58 -58
msprobe/core/common/const.py +402 -318
msprobe/core/common/exceptions.py +99 -99
msprobe/core/common/{file_check.py → file_utils.py} +523 -283
msprobe/core/common/inplace_op_checker.py +38 -0
msprobe/core/common/inplace_ops.yaml +251 -0
msprobe/core/common/log.py +86 -69
msprobe/core/common/utils.py +371 -616
msprobe/core/common_config.py +78 -71
msprobe/core/compare/acc_compare.py +472 -298
msprobe/core/compare/check.py +180 -95
msprobe/core/compare/compare_cli.py +69 -49
msprobe/core/compare/highlight.py +259 -222
msprobe/core/compare/multiprocessing_compute.py +174 -149
msprobe/core/compare/npy_compare.py +310 -295
msprobe/core/compare/utils.py +464 -429
msprobe/core/data_dump/data_collector.py +153 -144
msprobe/core/data_dump/data_processor/base.py +337 -293
msprobe/core/data_dump/data_processor/factory.py +76 -59
msprobe/core/data_dump/data_processor/mindspore_processor.py +192 -198
msprobe/core/data_dump/data_processor/pytorch_processor.py +383 -389
msprobe/core/data_dump/json_writer.py +117 -116
msprobe/core/data_dump/scope.py +194 -178
msprobe/core/grad_probe/constant.py +74 -70
msprobe/core/grad_probe/grad_compare.py +170 -175
msprobe/core/grad_probe/utils.py +77 -52
msprobe/docs/01.installation.md +99 -0
msprobe/docs/02.config_introduction.md +137 -0
msprobe/docs/03.config_examples.md +237 -0
msprobe/docs/04.acl_config_examples.md +78 -0
msprobe/docs/05.data_dump_PyTorch.md +326 -0
msprobe/docs/06.data_dump_MindSpore.md +285 -0
msprobe/docs/07.accuracy_checker_PyTorch.md +297 -0
msprobe/docs/08.accuracy_checker_online_PyTorch.md +238 -0
msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
msprobe/docs/10.accuracy_compare_PyTorch.md +327 -0
msprobe/docs/11.accuracy_compare_MindSpore.md +333 -0
msprobe/docs/12.overflow_check_PyTorch.md +79 -0
msprobe/docs/13.overflow_check_MindSpore.md +31 -0
msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
msprobe/docs/15.free_benchmarking_PyTorch.md +170 -0
msprobe/docs/16.free_benchmarking_MindSpore.md +140 -0
msprobe/{doc/grad_probe/grad_probe.md → docs/17.grad_probe.md} +205 -207
msprobe/{pytorch/doc//321/205/320/254/320/270/321/207/342/225/221/342/224/220/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/206/320/277/320/244/321/205/320/277/342/225/243.md → docs/18.online_dispatch.md} +89 -90
msprobe/docs/FAQ.md +189 -0
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/mindspore/__init__.py +2 -1
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +278 -245
msprobe/mindspore/api_accuracy_checker/api_info.py +76 -69
msprobe/mindspore/api_accuracy_checker/api_runner.py +155 -151
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +196 -196
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
msprobe/mindspore/api_accuracy_checker/compute_element.py +238 -223
msprobe/mindspore/api_accuracy_checker/main.py +8 -15
msprobe/mindspore/api_accuracy_checker/type_mapping.py +113 -113
msprobe/mindspore/api_accuracy_checker/utils.py +79 -62
msprobe/mindspore/cell_processor.py +58 -34
msprobe/mindspore/common/const.py +108 -87
msprobe/mindspore/common/log.py +37 -37
msprobe/mindspore/common/utils.py +97 -57
msprobe/mindspore/compare/distributed_compare.py +62 -75
msprobe/mindspore/compare/layer_mapping.py +146 -0
msprobe/mindspore/compare/modify_mapping.py +107 -0
msprobe/mindspore/compare/ms_compare.py +357 -117
msprobe/mindspore/compare/ms_graph_compare.py +364 -317
msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -399
msprobe/mindspore/debugger/debugger_config.py +69 -74
msprobe/mindspore/debugger/precision_debugger.py +150 -107
msprobe/mindspore/dump/dump_tool_factory.py +50 -35
msprobe/mindspore/dump/hook_cell/api_registry.py +128 -104
msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -53
msprobe/mindspore/dump/hook_cell/primitive_hooks.py +206 -0
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +994 -925
msprobe/mindspore/dump/hook_cell/wrap_api.py +121 -0
msprobe/mindspore/dump/jit_dump.py +96 -56
msprobe/mindspore/dump/kernel_graph_dump.py +75 -60
msprobe/mindspore/dump/kernel_kbyk_dump.py +79 -65
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +131 -116
msprobe/mindspore/free_benchmark/common/config.py +27 -12
msprobe/mindspore/free_benchmark/common/handler_params.py +32 -17
msprobe/mindspore/free_benchmark/common/utils.py +85 -71
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -842
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +57 -42
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +122 -107
msprobe/mindspore/free_benchmark/handler/base_handler.py +105 -90
msprobe/mindspore/free_benchmark/handler/check_handler.py +56 -41
msprobe/mindspore/free_benchmark/handler/fix_handler.py +51 -36
msprobe/mindspore/free_benchmark/handler/handler_factory.py +36 -21
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +82 -67
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +36 -21
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +78 -63
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +77 -0
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +49 -34
msprobe/mindspore/free_benchmark/perturbation/no_change.py +27 -12
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +44 -27
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +48 -33
msprobe/mindspore/grad_probe/global_context.py +100 -91
msprobe/mindspore/grad_probe/grad_analyzer.py +231 -231
msprobe/mindspore/grad_probe/grad_monitor.py +27 -27
msprobe/mindspore/grad_probe/grad_stat_csv.py +131 -131
msprobe/mindspore/grad_probe/hook.py +94 -92
msprobe/mindspore/grad_probe/utils.py +29 -28
msprobe/mindspore/ms_config.py +128 -126
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +60 -45
msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +49 -34
msprobe/mindspore/runtime.py +4 -4
msprobe/mindspore/service.py +297 -354
msprobe/mindspore/task_handler_factory.py +24 -24
msprobe/msprobe.py +105 -107
msprobe/pytorch/__init__.py +23 -4
msprobe/pytorch/api_accuracy_checker/common/config.py +70 -55
msprobe/pytorch/api_accuracy_checker/common/utils.py +246 -165
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +230 -213
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +632 -581
msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
msprobe/pytorch/api_accuracy_checker/compare/compare.py +416 -381
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +90 -73
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +265 -244
msprobe/pytorch/api_accuracy_checker/config.yaml +10 -10
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +370 -332
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +221 -199
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +150 -134
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +518 -581
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +213 -74
msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +218 -202
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +370 -324
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +227 -204
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +110 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +244 -218
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/torch_ops_config.yaml +63 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +44 -0
msprobe/pytorch/bench_functions/__init__.py +30 -15
msprobe/pytorch/bench_functions/apply_adam_w.py +43 -28
msprobe/pytorch/bench_functions/confusion_transpose.py +34 -19
msprobe/pytorch/bench_functions/fast_gelu.py +70 -55
msprobe/pytorch/bench_functions/layer_norm_eval.py +21 -6
msprobe/pytorch/bench_functions/linear.py +27 -12
msprobe/pytorch/bench_functions/matmul_backward.py +63 -48
msprobe/pytorch/bench_functions/npu_fusion_attention.py +538 -421
msprobe/pytorch/bench_functions/rms_norm.py +30 -15
msprobe/pytorch/bench_functions/rotary_mul.py +71 -52
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +41 -26
msprobe/pytorch/bench_functions/swiglu.py +70 -55
msprobe/pytorch/common/__init__.py +17 -2
msprobe/pytorch/common/compare_script.template +14 -14
msprobe/pytorch/common/log.py +33 -32
msprobe/pytorch/common/parse_json.py +54 -39
msprobe/pytorch/common/utils.py +310 -300
msprobe/pytorch/compare/distributed_compare.py +66 -66
msprobe/pytorch/compare/mapping.yaml +607 -607
msprobe/pytorch/compare/match.py +49 -33
msprobe/pytorch/compare/pt_compare.py +82 -40
msprobe/pytorch/debugger/debugger_config.py +108 -95
msprobe/pytorch/debugger/precision_debugger.py +173 -125
msprobe/pytorch/free_benchmark/__init__.py +23 -8
msprobe/pytorch/free_benchmark/common/constant.py +70 -70
msprobe/pytorch/free_benchmark/common/counter.py +71 -71
msprobe/pytorch/free_benchmark/common/enums.py +65 -37
msprobe/pytorch/free_benchmark/common/params.py +144 -129
msprobe/pytorch/free_benchmark/common/utils.py +118 -102
msprobe/pytorch/free_benchmark/compare/grad_saver.py +200 -179
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +119 -104
msprobe/pytorch/free_benchmark/main.py +120 -105
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +28 -13
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +56 -41
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +105 -90
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +119 -104
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +87 -63
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +83 -68
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +43 -28
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +60 -45
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +34 -19
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +256 -217
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +54 -39
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +38 -23
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +45 -30
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +185 -170
msprobe/pytorch/function_factory.py +91 -75
msprobe/pytorch/functional/module_dump.py +84 -0
msprobe/pytorch/grad_probe/grad_monitor.py +91 -90
msprobe/pytorch/grad_probe/grad_stat_csv.py +128 -128
msprobe/pytorch/hook_module/__init__.py +16 -1
msprobe/pytorch/hook_module/api_registry.py +166 -161
msprobe/pytorch/hook_module/hook_module.py +118 -120
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1877
msprobe/pytorch/hook_module/utils.py +28 -29
msprobe/pytorch/hook_module/wrap_aten.py +111 -110
msprobe/pytorch/hook_module/wrap_distributed.py +77 -78
msprobe/pytorch/hook_module/wrap_functional.py +104 -105
msprobe/pytorch/hook_module/wrap_npu_custom.py +85 -84
msprobe/pytorch/hook_module/wrap_tensor.py +69 -71
msprobe/pytorch/hook_module/wrap_torch.py +84 -86
msprobe/pytorch/hook_module/wrap_vf.py +60 -62
msprobe/pytorch/module_processer.py +153 -138
msprobe/pytorch/online_dispatch/__init__.py +20 -20
msprobe/pytorch/online_dispatch/compare.py +235 -236
msprobe/pytorch/online_dispatch/dispatch.py +271 -271
msprobe/pytorch/online_dispatch/dump_compare.py +155 -156
msprobe/pytorch/online_dispatch/single_compare.py +391 -391
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +57 -49
msprobe/pytorch/online_dispatch/utils.py +127 -146
msprobe/pytorch/parse.py +19 -4
msprobe/pytorch/parse_tool/cli.py +31 -32
msprobe/pytorch/parse_tool/lib/compare.py +259 -271
msprobe/pytorch/parse_tool/lib/config.py +52 -52
msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +161 -158
msprobe/pytorch/parse_tool/lib/utils.py +320 -321
msprobe/pytorch/parse_tool/lib/visualization.py +85 -91
msprobe/pytorch/pt_config.py +317 -187
msprobe/pytorch/service.py +311 -252
mindstudio_probe-1.0.3.dist-info/RECORD +0 -272
msprobe/config/README.md +0 -539
msprobe/mindspore/doc/compare.md +0 -58
msprobe/mindspore/doc/dump.md +0 -217
msprobe/mindspore/dump/hook_cell/wrap_functional.py +0 -91
msprobe/mindspore/dump/hook_cell/wrap_tensor.py +0 -63
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +0 -10
msprobe/pytorch/doc/FAQ.md +0 -193
msprobe/pytorch/doc/api_accuracy_checker.md +0 -313
msprobe/pytorch/doc/api_accuracy_checker_online.md +0 -187
msprobe/pytorch/doc/dump.md +0 -260
msprobe/pytorch/doc/msprobe/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -182
msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -240
msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
msprobe/pytorch/doc/run_overflow_check.md +0 -25
msprobe/pytorch/doc//321/206/320/247/320/260/321/206/320/260/320/227/321/206/320/255/320/226/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/205/320/254/342/225/221/321/206/320/251/320/277/321/211/320/272/320/234/321/210/320/277/320/221/321/205/320/242/320/234/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -151
msprobe/pytorch/functional/data_processor.py +0 -0
msprobe/pytorch/functional/dump_module.py +0 -39
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/top_level.txt +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
/msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
/msprobe/{config → docs}/img/free_benchmark.png +0 -0
/msprobe/{doc/grad_probe/img/image-1.png → docs/img/grad_probe_image-1.png} +0 -0
/msprobe/{doc/grad_probe/img/image-2.png → docs/img/grad_probe_image-2.png} +0 -0
/msprobe/{doc/grad_probe/img/image-3.png → docs/img/grad_probe_image-3.png} +0 -0
/msprobe/{doc/grad_probe/img/image-4.png → docs/img/grad_probe_image-4.png} +0 -0
/msprobe/{doc/grad_probe/img/image.png → docs/img/grad_probe_image.png} +0 -0
/msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0

msprobe/mindspore/compare/ms_graph_compare.py CHANGED Viewed

@@ -1,317 +1,364 @@
-import csv
-import glob
-import os
-import sys
-import copy
-import numpy as np
-import pandas as pd
-from msprobe.core.common.const import CompareConst, GraphMode
-from msprobe.core.common.exceptions import FileCheckException
-from msprobe.core.common.file_check import create_directory
-from msprobe.core.common.log import logger
-from msprobe.core.common.utils import add_time_with_xlsx, CompareException
-from msprobe.core.compare.multiprocessing_compute import _ms_graph_handle_multi_process, check_accuracy
-from msprobe.core.compare.npy_compare import npy_data_check, statistics_data_check, reshape_value, compare_ops_apply
-from msprobe.core.common.file_check import FileOpen
-class row_data:
-    def __init__(self, mode):
-        self.basic_data = copy.deepcopy(CompareConst.MS_GRAPH_BASE)
-        self.npy_data = copy.deepcopy(CompareConst.MS_GRAPH_NPY)
-        self.statistic_data = copy.deepcopy(CompareConst.MS_GRAPH_STATISTIC)
-        if mode == GraphMode.NPY_MODE:
-            self.data = {**self.basic_data, **self.npy_data}
-        else:
-            self.data = {**self.basic_data, **self.statistic_data}
-    def __call__(self):
-        return self.data
-def generate_step(npu_path, rank_id):
-    step_set = set()
-    rank_path = os.path.join(npu_path, f"rank_{rank_id}")
-    if not os.path.exists(rank_path):
-        return []
-    for path in os.listdir(rank_path):
-        if path not in ["execution_order", "graphs"]:
-            data_path = os.path.join(rank_path, path)
-            for graph_path in os.listdir(data_path):
-                step_set.update([int(i) for i in os.listdir(os.path.join(data_path, graph_path))])
-    return sorted(step_set)
-def generate_path_by_rank_step(base_path, rank_id, step_id):
-    path_with_rank_id = os.path.join(base_path, f"rank_{rank_id}")
-    if not os.path.exists(path_with_rank_id):
-        return ''
-    for path in os.listdir(path_with_rank_id):
-        if path not in ["execution_order", "graphs"]:
-            return os.path.join(path_with_rank_id, path, "*", str(step_id))
-    logger.error(f"Data_path {path_with_rank_id} is not exist.")
-    return ''
-def statistic_data_read(statistic_file_list, statistic_file_path):
-    data_list = []
-    statistic_data_list = []
-    for statistic_file in statistic_file_list:
-        with open(statistic_file, "r") as f:
-            csv_reader = csv.reader(f, delimiter=",")
-            header = next(csv_reader)
-            header_index = {'Data Type': None, 'Shape': None, 'Max Value': None, 'Min Value': None,
-                            'Avg Value': None, 'L2Norm Value': None}
-            for key in header_index.keys():
-                for index, value in enumerate(header):
-                    if key == value:
-                        header_index[key] = index
-            for key in header_index.keys():
-                if header_index[key] is None:
-                    logger.error(f"Data_path {statistic_file_path} has no key {key}")
-                    raise FileCheckException(f"Data_path {statistic_file_path} has no key {key}")
-            statistic_data_list.extend([row for row in csv_reader])
-    for data in statistic_data_list:
-        compare_key = f"{data[1]}.{data[2]}.{data[3]}.{data[5]}"
-        timestamp = int(data[4])
-        data_list.append(
-            [statistic_file_path, compare_key, timestamp, data[header_index['Data Type']],
-             data[header_index['Shape']], data[header_index['Max Value']], data[header_index['Min Value']],
-             data[header_index['Avg Value']], data[header_index['L2Norm Value']]])
-    return data_list
-def generate_data_name(data_path):
-    data_list = []
-    mapping_path = os.path.join(data_path, "mapping.csv")
-    statistic_path = os.path.join(data_path, "statistic.csv")
-    npy_path = os.path.join(data_path, "*.npy")
-    mapping_file_list = glob.glob(mapping_path)
-    statistic_file_list = glob.glob(statistic_path)
-    npy_file_list = glob.glob(npy_path)
-    mapping_exist = bool(mapping_file_list)
-    statistic_exist = bool(statistic_file_list)
-    npy_exist = bool(npy_file_list)
-    mapping_dict = []
-    if mapping_exist:
-        for mapping_file in mapping_file_list:
-            with FileOpen(mapping_file, "r") as f:
-                csv_reader = csv.reader(f, delimiter=",")
-                header = next(csv_reader)
-                for row in csv_reader:
-                    mapping_dict[row[0]] = row[1]
-    if npy_exist:
-        for data in npy_file_list:
-            if data in mapping_dict:
-                split_list = mapping_dict[data].split(".")
-            else:
-                split_list = data.split(".")
-            compare_key = f"{split_list[1]}.{split_list[2]}.{split_list[3]}.{split_list[5]}.{split_list[6]}"
-            timestamp = int(split_list[4])
-            data_list.append([os.path.join(data_path, data), compare_key, timestamp])
-    elif statistic_exist:
-        data_list = statistic_data_read(statistic_file_list, os.path.join(data_path, statistic_path))
-    if npy_exist:
-        mode = GraphMode.NPY_MODE
-    elif statistic_exist:
-        mode = GraphMode.STATISTIC_MODE
-    else:
-        mode = GraphMode.ERROR_MODE
-        logger.error(f"Error mode.")
-    return mode, data_list
-def read_npy_data(data_path):
-    try:
-        data_value = np.load(data_path)
-        if data_value.dtype == np.float16:
-            data_value = data_value.astype(np.float32)
-    except FileNotFoundError as e:
-        data_value = None
-    except EOFError:
-        data_value = None
-    return data_value
-class GraphMSComparator:
-    def __init__(self, input_param, output_path):
-        self.output_path = output_path
-        self.base_npu_path = input_param.get('npu_path', None)
-        self.base_bench_path = input_param.get('bench_path', None)
-        self.rank_list = input_param.get('rank_id', [])
-        self.step_list = input_param.get('step_id', [])
-    @staticmethod
-    def compare_ops(compare_result_db, mode):
-        def npy_mode_compute(row):
-            result_dict = row_data(GraphMode.NPY_MODE)()
-            def process_npy_file(file_path, name_prefix, result):
-                if os.path.exists(file_path):
-                    data = read_npy_data(file_path)
-                    result[f'{name_prefix} Name'] = file_path
-                    result[f'{name_prefix} Dtype'] = data.dtype
-                    result[f'{name_prefix} Tensor Shape'] = data.shape
-                    result[f'{name_prefix} max'] = np.max(data)
-                    result[f'{name_prefix} min'] = np.min(data)
-                    result[f'{name_prefix} mean'] = np.mean(data)
-                    result[f'{name_prefix} l2norm'] = np.linalg.norm(data)
-                    return data
-                return ""
-            n_value = process_npy_file(row[CompareConst.NPU_NAME], 'NPU', result_dict)
-            b_value = process_npy_file(row[CompareConst.BENCH_NAME], 'Bench', result_dict)
-            error_flag, error_message = npy_data_check(n_value, b_value)
-            result_dict[CompareConst.ERROR_MESSAGE] = error_message
-            if not error_flag:
-                n_value, b_value = reshape_value(n_value, b_value)
-                result_list, err_msg = compare_ops_apply(n_value, b_value, False, "")
-                result_dict[CompareConst.COSINE] = result_list[0]
-                result_dict[CompareConst.MAX_ABS_ERR] = result_list[1]
-                result_dict[CompareConst.MAX_RELATIVE_ERR] = result_list[2]
-                result_dict[CompareConst.ONE_THOUSANDTH_ERR_RATIO] = result_list[3]
-                result_dict[CompareConst.FIVE_THOUSANDTHS_ERR_RATIO] = result_list[4]
-                result_dict[CompareConst.ACCURACY] = check_accuracy(result_list[0], result_list[1])
-                result_dict[CompareConst.ERROR_MESSAGE] = err_msg
-            return pd.Series(result_dict)
-        def statistic_mode_compute(row):
-            result_dict = row_data('STATISTIC')()
-            def update_result_dict(result, rows, prefix):
-                result[f'{prefix} Name'] = rows[f'{prefix} Name']
-                result[f'{prefix} Dtype'] = rows[f'{prefix} Dtype']
-                result[f'{prefix} Tensor Shape'] = rows[f'{prefix} Tensor Shape']
-                result[f'{prefix} max'] = np.float32(rows[f'{prefix} max'])
-                result[f'{prefix} min'] = np.float32(rows[f'{prefix} min'])
-                result[f'{prefix} mean'] = np.float32(rows[f'{prefix} mean'])
-                result[f'{prefix} l2norm'] = np.float32(rows[f'{prefix} l2norm'])
-            # 使用示例
-            update_result_dict(result_dict, row, 'NPU')
-            update_result_dict(result_dict, row, 'Bench')
-            error_flag, error_message = statistics_data_check(result_dict)
-            result_dict[CompareConst.ERROR_MESSAGE] += error_message
-            if not error_flag:
-                result_dict[CompareConst.MAX_DIFF] = np.abs(
-                    result_dict[CompareConst.NPU_MAX] - result_dict[CompareConst.BENCH_MAX])
-                result_dict[CompareConst.MIN_DIFF] = np.abs(
-                    result_dict[CompareConst.NPU_MIN] - result_dict[CompareConst.BENCH_MIN])
-                result_dict[CompareConst.MEAN_DIFF] = np.abs(
-                    result_dict[CompareConst.NPU_MEAN] - result_dict[CompareConst.BENCH_MEAN])
-                result_dict[CompareConst.NORM_DIFF] = np.abs(
-                    result_dict[CompareConst.NPU_NORM] - result_dict[CompareConst.BENCH_NORM])
-                result_dict[CompareConst.MAX_RELATIVE_ERR] = result_dict[CompareConst.MAX_DIFF] / result_dict[
-                    CompareConst.BENCH_MAX] if result_dict[CompareConst.BENCH_MAX] > 0 else 0
-                result_dict[CompareConst.MAX_RELATIVE_ERR] = str(result_dict[CompareConst.MAX_RELATIVE_ERR] * 100) + "%"
-                result_dict[CompareConst.MIN_RELATIVE_ERR] = result_dict[CompareConst.MIN_DIFF] / result_dict[
-                    CompareConst.BENCH_MIN] if result_dict[CompareConst.BENCH_MIN] > 0 else 0
-                result_dict[CompareConst.MIN_RELATIVE_ERR] = str(result_dict[CompareConst.MIN_RELATIVE_ERR] * 100) + "%"
-                result_dict[CompareConst.MEAN_RELATIVE_ERR] = result_dict[CompareConst.MEAN_DIFF] / result_dict[
-                    CompareConst.BENCH_MEAN] if result_dict[CompareConst.BENCH_MEAN] > 0 else 0
-                result_dict[CompareConst.MEAN_RELATIVE_ERR] = str(
-                    result_dict[CompareConst.MEAN_RELATIVE_ERR] * 100) + "%"
-                result_dict[CompareConst.NORM_RELATIVE_ERR] = result_dict[CompareConst.NORM_DIFF] / result_dict[
-                    CompareConst.BENCH_NORM] if result_dict[CompareConst.BENCH_NORM] > 0 else 0
-                result_dict[CompareConst.NORM_RELATIVE_ERR] = str(
-                    result_dict[CompareConst.NORM_RELATIVE_ERR] * 100) + "%"
-                magnitude_diff = result_dict[CompareConst.MAX_DIFF] / (
-                            max(result_dict[CompareConst.NPU_MAX], result_dict[CompareConst.BENCH_MAX]) + 1e-10)
-                if magnitude_diff > CompareConst.MAGNITUDE:
-                    result_dict[CompareConst.ACCURACY] = 'No'
-                else:
-                    result_dict[CompareConst.ACCURACY] = 'Yes'
-            return pd.Series(result_dict)
-        if mode == GraphMode.NPY_MODE:
-            compare_result_db = compare_result_db.apply(npy_mode_compute, axis=1)
-        else:
-            compare_result_db = compare_result_db.apply(statistic_mode_compute, axis=1)
-        return compare_result_db
-    def compare_core(self):
-        logger.info("Please check whether the input data belongs to you. If not, there may be security risks.")
-        # split by rank and step
-        if not self.rank_list:
-            self.rank_list = [int(i.split("_")[-1]) for i in os.listdir(self.base_npu_path)]
-        for rank_id in self.rank_list:
-            if not self.step_list:
-                self.step_list = generate_step(self.base_npu_path, rank_id)
-            for step_id in self.step_list:
-                compare_result_df, mode = self.compare_process(rank_id, step_id)
-                if isinstance(compare_result_df, list):
-                    is_empty = not compare_result_df
-                elif isinstance(compare_result_df, pd.DataFrame):
-                    is_empty = compare_result_df.empty
-                else:
-                    is_empty = True
-                if is_empty or not mode:
-                    continue
-                compare_result_df = self._do_multi_process(compare_result_df, mode)
-                compare_result_name = add_time_with_xlsx(f"compare_result_{str(rank_id)}_{str(step_id)}")
-                compare_result_path = os.path.join(os.path.realpath(self.output_path), f"{compare_result_name}")
-                compare_result_df.to_excel(compare_result_path, index=False)
-                logger.info(f"Compare rank: {rank_id} step: {step_id} finish. Compare result: {compare_result_path}.")
-    def compare_process(self, rank_id, step_id):
-        """Build the table that pairs NPU records with bench records for one rank/step.
-
-        Returns ``(DataFrame, mode)``. ``([], '')`` is returned instead when
-        either generated data path is empty, either side reports "ERROR_MODE",
-        or the two sides report different modes.
-        """
-        npu_data_path = generate_path_by_rank_step(self.base_npu_path, rank_id, step_id)
-        bench_data_path = generate_path_by_rank_step(self.base_bench_path, rank_id, step_id)
-        if not (npu_data_path and bench_data_path):
-            return [], ''
-        # Collect the records and the dump mode found on each side.
-        npu_mode, npu_records = generate_data_name(npu_data_path)
-        match_mode, bench_records = generate_data_name(bench_data_path)
-        if npu_mode == "ERROR_MODE" or match_mode == "ERROR_MODE":
-            logger.warning(f"Data_path {npu_data_path} or {bench_data_path} is not exist.")
-            return [], ''
-        if npu_mode != match_mode:
-            logger.error(f"NPU mode {npu_mode} not equal to MATCH mode {match_mode}.")
-            return [], ''
-        # Every record starts with name, key and timestamp; outside NPY mode the
-        # records also carry dtype, shape, max, min, mean and norm columns.
-        npu_columns = [CompareConst.NPU_NAME, 'Compare Key', 'TimeStamp']
-        bench_columns = [CompareConst.BENCH_NAME, 'Compare Key', 'TimeStamp']
-        if npu_mode != 'NPY_MODE':
-            npu_columns += [CompareConst.NPU_DTYPE, CompareConst.NPU_SHAPE,
-                            CompareConst.NPU_MAX, CompareConst.NPU_MIN,
-                            CompareConst.NPU_MEAN, CompareConst.NPU_NORM]
-            bench_columns += [CompareConst.BENCH_DTYPE, CompareConst.BENCH_SHAPE,
-                              CompareConst.BENCH_MAX, CompareConst.BENCH_MIN,
-                              CompareConst.BENCH_MEAN, CompareConst.BENCH_NORM]
-        npu_data_df = pd.DataFrame(npu_records, columns=npu_columns)
-        bench_data_df = pd.DataFrame(bench_records, columns=bench_columns)
-        # Number repeated keys in timestamp order so that the n-th occurrence on
-        # one side is merged with the n-th occurrence on the other side.
-        for frame in (npu_data_df, bench_data_df):
-            frame['Local Index'] = frame.sort_values('TimeStamp').groupby('Compare Key').cumcount()
-        compare_result_df = pd.merge(npu_data_df, bench_data_df, on=['Compare Key', 'Local Index'], how='outer')
-        # The outer merge leaves NaN names for unmatched rows; use '' instead.
-        for name_column in (CompareConst.NPU_NAME, CompareConst.BENCH_NAME):
-            compare_result_df[name_column] = compare_result_df[name_column].fillna('')
-        return compare_result_df, npu_mode
-    def _do_multi_process(self, result_df, mode):
-        """Run ``compare_ops`` over *result_df* through the multi-process helper.
-
-        A ``ValueError`` raised by the helper is logged and re-raised as a
-        ``CompareException`` carrying ``INVALID_DATA_ERROR``.
-        """
-        try:
-            return _ms_graph_handle_multi_process(self.compare_ops, result_df, mode)
-        except ValueError as e:
-            logger.error('result dataframe is not found.')
-            raise CompareException(CompareException.INVALID_DATA_ERROR) from e
+import copy
+import csv
+import glob
+import os
+import numpy as np
+import pandas as pd
+from msprobe.core.common.const import CompareConst, GraphMode, Const, FileCheckConst
+from msprobe.core.common.file_utils import FileOpen, check_path_before_create, change_mode, load_npy
+from msprobe.core.common.log import logger
+from msprobe.core.common.utils import add_time_with_xlsx, CompareException
+from msprobe.core.compare.multiprocessing_compute import _ms_graph_handle_multi_process, check_accuracy
+from msprobe.core.compare.npy_compare import npy_data_check, statistics_data_check, reshape_value, compare_ops_apply
+from msprobe.mindspore.common.utils import convert_to_int, list_lowest_level_directories
+class row_data:
+    """Template for one result row; calling the instance returns the row dict.
+
+    The row always contains a fresh copy of ``CompareConst.MS_GRAPH_BASE``,
+    extended with ``MS_GRAPH_NPY`` when *mode* is ``GraphMode.NPY_MODE`` and
+    with ``MS_GRAPH_STATISTIC`` for any other mode.
+    """
+    def __init__(self, mode):
+        # Deep copies keep the shared constant templates from being mutated.
+        self.basic_data = copy.deepcopy(CompareConst.MS_GRAPH_BASE)
+        self.npy_data = copy.deepcopy(CompareConst.MS_GRAPH_NPY)
+        self.statistic_data = copy.deepcopy(CompareConst.MS_GRAPH_STATISTIC)
+        mode_specific = self.npy_data if mode == GraphMode.NPY_MODE else self.statistic_data
+        merged = dict(self.basic_data)
+        merged.update(mode_specific)
+        self.data = merged
+    def __call__(self):
+        return self.data
+def npy_data_read(data_path, npy_file_list, mapping_dict):
+    """Turn .npy dump files into ``[file path, compare key, timestamp]`` records.
+
+    Args:
+        data_path: directory that holds the .npy files.
+        npy_file_list: bare file names or paths of the .npy files.
+        mapping_dict: optional renaming table; when an entry (exact value or
+            its file name) is a key, the mapped name is parsed instead.
+
+    Returns:
+        One record per file whose name has at least 7 ``Const.SEP``-separated
+        fields. Fields 1, 2, 3, 5 and 6 form the compare key and field 4 is
+        converted to the timestamp; other files are skipped.
+    """
+    data_list = []
+    for data in npy_file_list:
+        # Parse the file name only: directory components may contain the
+        # separator themselves and would shift every field.
+        file_name = os.path.basename(data)
+        if data in mapping_dict:
+            dump_name = mapping_dict[data]
+        else:
+            # assumes mapping.csv may be keyed by bare file name - TODO confirm
+            dump_name = mapping_dict.get(file_name, file_name)
+        split_list = dump_name.split(Const.SEP)
+        if len(split_list) < 7:
+            continue
+        compare_key = f"{split_list[1]}.{split_list[2]}.{split_list[3]}.{split_list[5]}.{split_list[6]}"
+        timestamp = convert_to_int(split_list[4])
+        # Absolute entries are kept as they are; anything else is placed in
+        # data_path without repeating a directory prefix it already carries.
+        file_path = data if os.path.isabs(data) else os.path.join(data_path, file_name)
+        data_list.append([file_path, compare_key, timestamp])
+    return data_list
+def statistic_data_read(statistic_file_list, statistic_file_path):
+    """Read statistic CSV files into one record per data row.
+
+    Args:
+        statistic_file_list: CSV files to read; the first row of each file is
+            treated as its header.
+        statistic_file_path: path used in the generated op names and in
+            warning messages.
+
+    Returns:
+        A list of ``[op name, compare key, timestamp, data type, shape, max,
+        min, avg, l2norm]`` records. The compare key is built from columns
+        1, 2, 3 and 5, the timestamp from column 4, and the op name is the
+        compare key followed by *statistic_file_path*. A statistic column
+        missing from the header (or from a short row) is filled with NaN.
+    """
+    stat_columns = ('Data Type', 'Shape', 'Max Value', 'Min Value', 'Avg Value', 'L2Norm Value')
+    data_list = []
+    for statistic_file in statistic_file_list:
+        with FileOpen(statistic_file, "r") as f:
+            csv_reader = csv.reader(f, delimiter=",")
+            # A default avoids StopIteration on a completely empty file.
+            header = next(csv_reader, None)
+            rows = list(csv_reader)
+        if header is None:
+            logger.warning(f"Data_path {statistic_file_path} is empty.")
+            continue
+        # Resolve the columns per file so that every row is read with the
+        # header of the file it came from (last duplicate name wins).
+        position = {name: index for index, name in enumerate(header)}
+        column_index = [position.get(key) for key in stat_columns]
+        for key, index in zip(stat_columns, column_index):
+            if index is None:
+                logger.warning(f"Data_path {statistic_file_path} has no key {key}.")
+        for data in rows:
+            # Blank or truncated lines cannot provide the key/timestamp fields.
+            if len(data) < 6:
+                continue
+            compare_key = f"{data[1]}.{data[2]}.{data[3]}.{data[5]}"
+            op_name = f"{compare_key} {statistic_file_path}"
+            timestamp = int(data[4])
+            result_data = [op_name, compare_key, timestamp]
+            result_data.extend(
+                data[index] if index is not None and index < len(data) else np.nan
+                for index in column_index)
+            data_list.append(result_data)
+    return data_list
+def generate_data_name(data_path):
+    """Detect the dump mode of *data_path* and read its records.
+
+    The directory is in NPY mode when it contains ``*.npy`` files, otherwise
+    in statistic mode when it contains ``statistic.csv``, otherwise in error
+    mode. An optional ``mapping.csv`` (first column -> second column, header
+    row skipped) is passed to the .npy reader as a renaming table.
+
+    Returns:
+        ``(mode, data_list)`` where *mode* is a ``GraphMode`` constant and
+        *data_list* is empty in error mode.
+    """
+    # Escape the directory so that characters such as '[' in its name are not
+    # interpreted as glob wildcards.
+    pattern_dir = glob.escape(data_path)
+    mapping_file_list = glob.glob(os.path.join(pattern_dir, "mapping.csv"))
+    statistic_file_list = glob.glob(os.path.join(pattern_dir, "statistic.csv"))
+    npy_file_list = glob.glob(os.path.join(pattern_dir, "*.npy"))
+    mapping_dict = {}
+    for mapping_file in mapping_file_list:
+        with FileOpen(mapping_file, "r") as f:
+            csv_reader = csv.reader(f, delimiter=",")
+            next(csv_reader, None)  # skip the header row, tolerate an empty file
+            for row in csv_reader:
+                if len(row) >= 2:
+                    mapping_dict[row[0]] = row[1]
+    if npy_file_list:
+        return GraphMode.NPY_MODE, npy_data_read(data_path, npy_file_list, mapping_dict)
+    if statistic_file_list:
+        # Pass the real file path; joining it with data_path again would
+        # duplicate the directory for relative paths.
+        statistic_path = os.path.join(data_path, "statistic.csv")
+        return GraphMode.STATISTIC_MODE, statistic_data_read(statistic_file_list, statistic_path)
+    logger.error("Error mode.")
+    return GraphMode.ERROR_MODE, []
+class GraphMSComparator:
+    """Compare graph dump data of an NPU run with the data of a benchmark run.
+
+    The lowest-level directories under both base paths are grouped by
+    ``(rank_id, step_id)``; every pair found on both sides is compared and the
+    result is written to an xlsx file under ``output_path``.
+    """
+    def __init__(self, input_param, output_path):
+        """Store the configuration and index the dump directories of both sides.
+
+        Args:
+            input_param: mapping read with ``.get`` for 'npu_path',
+                'bench_path', 'rank_id' and 'step_id'; the last two are
+                iterables of ids used as filters (empty means no filter).
+            output_path: directory that receives the result files.
+        """
+        self.output_path = output_path
+        self.base_npu_path = input_param.get('npu_path', None)
+        self.base_bench_path = input_param.get('bench_path', None)
+        self.rank_list = [convert_to_int(rank_id) for rank_id in input_param.get('rank_id', [])]
+        self.step_list = [convert_to_int(step_id) for step_id in input_param.get('step_id', [])]
+        # split by rank and step, generate rank step path
+        self.npu_rank_step_dict = self.generate_rank_step_path(self.base_npu_path)
+        self.bench_rank_step_dict = self.generate_rank_step_path(self.base_bench_path)
+        # Only (rank, step) pairs that exist on both sides can be compared.
+        self.common_rank_step = sorted(
+            set(self.npu_rank_step_dict.keys()).intersection(self.bench_rank_step_dict.keys()))
+    @staticmethod
+    def compare_ops(compare_result_db, mode):
+        """Compute the comparison columns for every row of *compare_result_db*.
+
+        In ``GraphMode.NPY_MODE`` the .npy files named in each row are loaded
+        and compared element-wise; in any other mode the statistics already
+        present in the row are compared. Returns the frame produced by
+        applying the per-row computation.
+        """
+        def process_npy_file(file_path, name_prefix, result):
+            # Load one .npy file and record its summary values in ``result``;
+            # returns the array, or "" when the file does not exist.
+            if not os.path.exists(file_path):
+                return ""
+            data = load_npy(file_path)
+            result[f'{name_prefix} Name'] = file_path
+            result[f'{name_prefix} Dtype'] = data.dtype
+            result[f'{name_prefix} Tensor Shape'] = data.shape
+            result[f'{name_prefix} max'] = np.max(data)
+            result[f'{name_prefix} min'] = np.min(data)
+            result[f'{name_prefix} mean'] = np.mean(data)
+            result[f'{name_prefix} l2norm'] = np.linalg.norm(data)
+            return data
+        def npy_mode_compute(row):
+            result_dict = row_data(GraphMode.NPY_MODE)()
+            n_value = process_npy_file(row[CompareConst.NPU_NAME], 'NPU', result_dict)
+            b_value = process_npy_file(row[CompareConst.BENCH_NAME], 'Bench', result_dict)
+            error_flag, error_message = npy_data_check(n_value, b_value)
+            result_dict[CompareConst.ERROR_MESSAGE] = error_message
+            if not error_flag:
+                n_value, b_value = reshape_value(n_value, b_value)
+                result_list, err_msg = compare_ops_apply(n_value, b_value, False, "")
+                result_dict[CompareConst.COSINE] = result_list[0]
+                result_dict[CompareConst.MAX_ABS_ERR] = result_list[1]
+                result_dict[CompareConst.MAX_RELATIVE_ERR] = result_list[2]
+                result_dict[CompareConst.ONE_THOUSANDTH_ERR_RATIO] = result_list[3]
+                result_dict[CompareConst.FIVE_THOUSANDTHS_ERR_RATIO] = result_list[4]
+                result_dict[CompareConst.ACCURACY] = check_accuracy(result_list[0], result_list[1])
+                result_dict[CompareConst.ERROR_MESSAGE] = err_msg
+            return pd.Series(result_dict)
+        def update_result_dict(result, rows, prefix):
+            # Copy the name/dtype/shape of one side and its statistics as float32.
+            result[f'{prefix} Name'] = rows[f'{prefix} Name']
+            result[f'{prefix} Dtype'] = rows[f'{prefix} Dtype']
+            result[f'{prefix} Tensor Shape'] = rows[f'{prefix} Tensor Shape']
+            result[f'{prefix} max'] = np.float32(rows[f'{prefix} max'])
+            result[f'{prefix} min'] = np.float32(rows[f'{prefix} min'])
+            result[f'{prefix} mean'] = np.float32(rows[f'{prefix} mean'])
+            result[f'{prefix} l2norm'] = np.float32(rows[f'{prefix} l2norm'])
+        def relative_err_percent(diff, bench_value):
+            # Relative error is taken against |bench| so that negative reference
+            # values are not reported as 0%; a zero or NaN reference yields 0.
+            if bench_value == 0 or np.isnan(bench_value):
+                ratio = 0
+            else:
+                ratio = diff / np.abs(bench_value)
+            return str(ratio * 100) + "%"
+        def statistic_mode_compute(row):
+            result_dict = row_data(GraphMode.STATISTIC_MODE)()
+            # Copy the NPU and bench statistics of this row into the result.
+            update_result_dict(result_dict, row, 'NPU')
+            update_result_dict(result_dict, row, 'Bench')
+            error_flag, error_message = statistics_data_check(result_dict)
+            result_dict[CompareConst.ERROR_MESSAGE] += error_message
+            if not error_flag:
+                stat_pairs = (
+                    (CompareConst.NPU_MAX, CompareConst.BENCH_MAX,
+                     CompareConst.MAX_DIFF, CompareConst.MAX_RELATIVE_ERR),
+                    (CompareConst.NPU_MIN, CompareConst.BENCH_MIN,
+                     CompareConst.MIN_DIFF, CompareConst.MIN_RELATIVE_ERR),
+                    (CompareConst.NPU_MEAN, CompareConst.BENCH_MEAN,
+                     CompareConst.MEAN_DIFF, CompareConst.MEAN_RELATIVE_ERR),
+                    (CompareConst.NPU_NORM, CompareConst.BENCH_NORM,
+                     CompareConst.NORM_DIFF, CompareConst.NORM_RELATIVE_ERR),
+                )
+                # Absolute differences first, then relative errors, in the
+                # same assignment order as before.
+                for npu_key, bench_key, diff_key, _ in stat_pairs:
+                    result_dict[diff_key] = np.abs(result_dict[npu_key] - result_dict[bench_key])
+                for _, bench_key, diff_key, relative_key in stat_pairs:
+                    result_dict[relative_key] = relative_err_percent(
+                        result_dict[diff_key], result_dict[bench_key])
+                # Compare the max difference with the larger magnitude of the
+                # two maxima; abs() keeps the ratio meaningful for negative maxima.
+                magnitude_diff = result_dict[CompareConst.MAX_DIFF] / (
+                        max(np.abs(result_dict[CompareConst.NPU_MAX]),
+                            np.abs(result_dict[CompareConst.BENCH_MAX])) + 1e-10)
+                if magnitude_diff > CompareConst.MAGNITUDE:
+                    result_dict[CompareConst.ACCURACY] = 'No'
+                else:
+                    result_dict[CompareConst.ACCURACY] = 'Yes'
+            return pd.Series(result_dict)
+        if mode == GraphMode.NPY_MODE:
+            compare_result_db = compare_result_db.apply(npy_mode_compute, axis=1)
+        else:
+            compare_result_db = compare_result_db.apply(statistic_mode_compute, axis=1)
+        return compare_result_db
+    def compare_core(self):
+        """Compare every common (rank, step) pair and save each result as xlsx."""
+        logger.info("Please check whether the input data belongs to you. If not, there may be security risks.")
+        for rank_id, step_id in self.common_rank_step:
+            compare_result_df, mode = self.compare_process(rank_id, step_id)
+            # compare_process returns ([], '') when there is nothing to compare.
+            if isinstance(compare_result_df, list):
+                is_empty = not compare_result_df
+            elif isinstance(compare_result_df, pd.DataFrame):
+                is_empty = compare_result_df.empty
+            else:
+                is_empty = True
+            if is_empty or not mode:
+                continue
+            compare_result_df = self._do_multi_process(compare_result_df, mode)
+            compare_result_name = add_time_with_xlsx(f"compare_result_{rank_id}_{step_id}")
+            compare_result_path = os.path.join(os.path.realpath(self.output_path), compare_result_name)
+            check_path_before_create(compare_result_path)
+            self.to_excel(compare_result_df, compare_result_path)
+            logger.info(f"Compare rank: {rank_id} step: {step_id} finish. Compare result: {compare_result_path}.")
+    def to_excel(self, compare_result_df: pd.DataFrame, compare_result_path: str, slice_num=0, need_slice=False) -> int:
+        """Write *compare_result_df* to xlsx, halving it until each part fits a sheet.
+
+        A frame shorter than ``CompareConst.MAX_EXCEL_LENGTH`` is written to
+        *compare_result_path* (with ``_slice_<n>`` inserted before the
+        extension when *need_slice* is true). A longer frame is split in two
+        halves that are written recursively as numbered slices.
+
+        Returns:
+            The next unused slice number.
+        """
+        size = len(compare_result_df)
+        # sheet size cannot be larger than 1048576
+        if size < CompareConst.MAX_EXCEL_LENGTH:
+            if need_slice:
+                # Touch the final extension only; str.replace would also
+                # rewrite any '.xlsx' occurring earlier in the path.
+                root, ext = os.path.splitext(compare_result_path)
+                compare_result_path = f"{root}_slice_{slice_num}{ext}"
+            compare_result_df.to_excel(compare_result_path, index=False)
+            change_mode(compare_result_path, FileCheckConst.DATA_FILE_AUTHORITY)
+            return slice_num + 1
+        half = size // 2
+        slice_num = self.to_excel(compare_result_df.iloc[0: half], compare_result_path, slice_num, True)
+        return self.to_excel(compare_result_df.iloc[half:], compare_result_path, slice_num, True)
+    def compare_process(self, rank_id, step_id):
+        """Build the table that pairs NPU records with bench records for one rank/step.
+
+        Returns ``(DataFrame, mode)``. ``([], '')`` is returned instead when a
+        side has no directory for this rank/step, a side is in error mode, or
+        the two sides are in different modes.
+        """
+        # generate data_path
+        npu_data_path_list = self.npu_rank_step_dict.get((rank_id, step_id))
+        bench_data_path_list = self.bench_rank_step_dict.get((rank_id, step_id))
+        # Both sides must be present (the bench list was previously not checked).
+        if not npu_data_path_list or not bench_data_path_list:
+            return [], ''
+        # generate file name
+        npu_mode = GraphMode.ERROR_MODE
+        bench_mode = GraphMode.ERROR_MODE
+        npu_data_list = []
+        bench_data_list = []
+        # NOTE(review): records of all directories are merged, but only the mode
+        # of the last directory on each side is kept - confirm this is intended.
+        for npu_data_path in npu_data_path_list:
+            npu_mode, data_list = generate_data_name(npu_data_path)
+            npu_data_list.extend(data_list)
+        for bench_data_path in bench_data_path_list:
+            bench_mode, data_list = generate_data_name(bench_data_path)
+            bench_data_list.extend(data_list)
+        if npu_mode == GraphMode.ERROR_MODE or bench_mode == GraphMode.ERROR_MODE:
+            logger.warning(f"Data_path {npu_data_path} or {bench_data_path} is not exist.")
+            return [], ''
+        if npu_mode != bench_mode:
+            logger.error(f"NPU mode {npu_mode} not equal to MATCH mode {bench_mode}.")
+            return [], ''
+        if npu_mode == GraphMode.NPY_MODE:
+            npu_data_df = pd.DataFrame(npu_data_list, columns=[CompareConst.NPU_NAME, 'Compare Key', 'TimeStamp'])
+            bench_data_df = pd.DataFrame(bench_data_list, columns=[CompareConst.BENCH_NAME, 'Compare Key', 'TimeStamp'])
+        else:
+            npu_float_type = [CompareConst.NPU_MAX, CompareConst.NPU_MIN, CompareConst.NPU_MEAN, CompareConst.NPU_NORM]
+            bench_float_type = [
+                CompareConst.BENCH_MAX, CompareConst.BENCH_MIN,
+                CompareConst.BENCH_MEAN, CompareConst.BENCH_NORM
+            ]
+            npu_data_df = pd.DataFrame(npu_data_list,
+                                       columns=[CompareConst.NPU_NAME, 'Compare Key', 'TimeStamp',
+                                                CompareConst.NPU_DTYPE, CompareConst.NPU_SHAPE,
+                                                *npu_float_type])
+            bench_data_df = pd.DataFrame(bench_data_list,
+                                         columns=[CompareConst.BENCH_NAME, 'Compare Key', 'TimeStamp',
+                                                  CompareConst.BENCH_DTYPE, CompareConst.BENCH_SHAPE,
+                                                  *bench_float_type])
+            # The statistics are read from CSV as text; convert them to float.
+            npu_data_df[npu_float_type] = npu_data_df[npu_float_type].astype(float)
+            bench_data_df[bench_float_type] = bench_data_df[bench_float_type].astype(float)
+        # Number repeated keys in timestamp order so that the n-th occurrence on
+        # one side is merged with the n-th occurrence on the other side.
+        npu_data_df['Local Index'] = npu_data_df.sort_values('TimeStamp').groupby('Compare Key').cumcount()
+        bench_data_df['Local Index'] = bench_data_df.sort_values('TimeStamp').groupby('Compare Key').cumcount()
+        compare_result_df = pd.merge(npu_data_df, bench_data_df, on=['Compare Key', 'Local Index'], how='outer')
+        compare_result_df[CompareConst.NPU_NAME] = compare_result_df[CompareConst.NPU_NAME].fillna('')
+        compare_result_df[CompareConst.BENCH_NAME] = compare_result_df[CompareConst.BENCH_NAME].fillna('')
+        return compare_result_df, npu_mode
+    def generate_rank_step_path(self, base_path):
+        """Group the lowest-level directories under *base_path* by (rank_id, step_id).
+
+        Directories whose rank or step id resolves to -1, or that are excluded
+        by ``rank_list`` / ``step_list``, are skipped.
+
+        Returns:
+            A dict, sorted by key, mapping ``(rank_id, step_id)`` to the list
+            of matching directory paths.
+        """
+        def generate_rank_step_id(path_with_rank_step):
+            # Split on the platform separator instead of a hard-coded "/".
+            split_path = os.path.normpath(path_with_rank_step).split(os.sep)
+            rank_id = -1
+            if "rank_" in path_with_rank_step:
+                # KBK mode
+                if len(split_path) > 4:
+                    rank_id = convert_to_int(split_path[-4].split("_")[-1])
+            else:
+                if len(split_path) > 4:
+                    rank_id = convert_to_int(split_path[-4])
+                if rank_id == -1 and len(split_path) > 3:
+                    rank_id = convert_to_int(split_path[-3])
+            # In both layouts the last path component is the step.
+            step_id = convert_to_int(split_path[-1])
+            return rank_id, step_id
+        base_path = os.path.abspath(base_path)
+        lowest_level = list_lowest_level_directories(base_path)
+        rank_step_path_dict = {}
+        for dir_path in lowest_level:
+            rank_id, step_id = generate_rank_step_id(dir_path)
+            if rank_id == -1 or step_id == -1:
+                continue
+            if self.rank_list and rank_id not in self.rank_list:
+                continue
+            if self.step_list and step_id not in self.step_list:
+                continue
+            rank_step_path_dict.setdefault((rank_id, step_id), []).append(dir_path)
+        return dict(sorted(rank_step_path_dict.items()))
+    def _do_multi_process(self, result_df, mode):
+        """Run ``compare_ops`` over *result_df* through the multi-process helper.
+
+        A ``ValueError`` raised by the helper is logged and re-raised as a
+        ``CompareException`` carrying ``INVALID_DATA_ERROR``.
+        """
+        try:
+            result_df = _ms_graph_handle_multi_process(self.compare_ops, result_df, mode)
+        except ValueError as e:
+            logger.error('result dataframe is not found.')
+            raise CompareException(CompareException.INVALID_DATA_ERROR) from e
+        return result_df

mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl

mindstudio-probe 1.0.3-py3-none-any.whl → 1.1.0-py3-none-any.whl