PyPI - mindstudio-probe - Versions diffs - 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl - Mend

mindstudio-probe 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (220)

{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/METADATA +5 -5
mindstudio_probe-1.1.1.dist-info/RECORD +341 -0
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/entry_points.txt +0 -1
msprobe/README.md +39 -3
msprobe/config.json +1 -3
msprobe/core/advisor/advisor.py +8 -3
msprobe/core/common/const.py +113 -13
msprobe/core/common/exceptions.py +25 -3
msprobe/core/common/file_utils.py +150 -26
msprobe/core/common/inplace_op_checker.py +15 -0
msprobe/core/common/log.py +27 -9
msprobe/core/common/utils.py +182 -69
msprobe/core/common_config.py +44 -15
msprobe/core/compare/acc_compare.py +207 -142
msprobe/core/compare/check.py +2 -5
msprobe/core/compare/compare_cli.py +21 -4
msprobe/core/compare/highlight.py +124 -55
msprobe/core/compare/layer_mapping/__init__.py +19 -0
msprobe/core/compare/layer_mapping/data_scope_parser.py +235 -0
msprobe/core/compare/layer_mapping/layer_mapping.py +242 -0
msprobe/core/compare/layer_mapping/postprocess_pass.py +94 -0
msprobe/core/compare/npy_compare.py +52 -23
msprobe/core/compare/utils.py +272 -247
msprobe/core/data_dump/data_collector.py +13 -11
msprobe/core/data_dump/data_processor/base.py +46 -16
msprobe/core/data_dump/data_processor/mindspore_processor.py +4 -4
msprobe/core/data_dump/data_processor/pytorch_processor.py +156 -59
msprobe/core/data_dump/scope.py +113 -34
msprobe/core/grad_probe/constant.py +27 -13
msprobe/core/grad_probe/grad_compare.py +18 -1
msprobe/core/grad_probe/utils.py +30 -2
msprobe/core/overflow_check/abnormal_scene.py +185 -0
msprobe/core/overflow_check/api_info.py +55 -0
msprobe/core/overflow_check/checker.py +138 -0
msprobe/core/overflow_check/filter.py +157 -0
msprobe/core/overflow_check/ignore_rules.yaml +55 -0
msprobe/core/overflow_check/level.py +22 -0
msprobe/core/overflow_check/utils.py +28 -0
msprobe/docs/01.installation.md +10 -0
msprobe/docs/02.config_introduction.md +49 -22
msprobe/docs/03.config_examples.md +2 -9
msprobe/docs/04.kernel_dump_PyTorch.md +73 -0
msprobe/docs/05.data_dump_PyTorch.md +3 -1
msprobe/docs/06.data_dump_MindSpore.md +157 -90
msprobe/docs/07.accuracy_checker_PyTorch.md +12 -12
msprobe/docs/08.accuracy_checker_online_PyTorch.md +1 -6
msprobe/docs/09.accuracy_checker_MindSpore.md +44 -8
msprobe/docs/10.accuracy_compare_PyTorch.md +19 -13
msprobe/docs/11.accuracy_compare_MindSpore.md +104 -13
msprobe/docs/12.overflow_check_PyTorch.md +1 -1
msprobe/docs/13.overflow_check_MindSpore.md +6 -6
msprobe/docs/15.free_benchmarking_PyTorch.md +4 -5
msprobe/docs/16.free_benchmarking_MindSpore.md +56 -37
msprobe/docs/17.grad_probe.md +5 -6
msprobe/docs/19.monitor.md +468 -0
msprobe/docs/20.monitor_performance_baseline.md +52 -0
msprobe/docs/21.visualization_PyTorch.md +386 -0
msprobe/docs/22.visualization_MindSpore.md +384 -0
msprobe/docs/23.tool_function_introduction.md +28 -0
msprobe/docs/FAQ.md +3 -0
msprobe/docs/data_dump_Mindspore/dynamic_graph_quick_start_example.md +211 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/mindspore/__init__.py +15 -0
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +113 -145
msprobe/mindspore/api_accuracy_checker/api_info.py +21 -6
msprobe/mindspore/api_accuracy_checker/api_runner.py +43 -18
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +21 -7
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +77 -0
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +63 -1
msprobe/mindspore/api_accuracy_checker/compute_element.py +59 -24
msprobe/mindspore/api_accuracy_checker/data_manager.py +264 -0
msprobe/mindspore/api_accuracy_checker/main.py +27 -3
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +206 -0
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +58 -0
msprobe/mindspore/api_accuracy_checker/type_mapping.py +22 -5
msprobe/mindspore/api_accuracy_checker/utils.py +34 -17
msprobe/mindspore/cell_processor.py +33 -12
msprobe/mindspore/common/const.py +33 -13
msprobe/mindspore/common/log.py +5 -9
msprobe/mindspore/common/utils.py +43 -4
msprobe/mindspore/compare/distributed_compare.py +22 -22
msprobe/mindspore/compare/ms_compare.py +271 -248
msprobe/mindspore/compare/ms_graph_compare.py +81 -47
msprobe/mindspore/debugger/debugger_config.py +4 -1
msprobe/mindspore/debugger/precision_debugger.py +7 -1
msprobe/mindspore/dump/dump_tool_factory.py +3 -1
msprobe/mindspore/dump/hook_cell/api_registry.py +12 -2
msprobe/mindspore/dump/hook_cell/primitive_hooks.py +13 -16
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +25 -0
msprobe/mindspore/dump/jit_dump.py +17 -5
msprobe/mindspore/dump/kernel_graph_dump.py +2 -4
msprobe/mindspore/dump/kernel_kbyk_dump.py +2 -4
msprobe/mindspore/dym_loader/hook_dynamic_loader.cc +140 -0
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +53 -0
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +145 -39
msprobe/mindspore/free_benchmark/common/handler_params.py +1 -2
msprobe/mindspore/free_benchmark/common/utils.py +19 -4
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -204
msprobe/mindspore/free_benchmark/handler/base_handler.py +3 -3
msprobe/mindspore/free_benchmark/handler/check_handler.py +4 -5
msprobe/mindspore/free_benchmark/handler/fix_handler.py +4 -4
msprobe/mindspore/free_benchmark/handler/handler_factory.py +4 -4
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +2 -2
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +15 -6
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +4 -4
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +2 -2
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +13 -6
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +2 -2
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +2 -2
msprobe/mindspore/grad_probe/global_context.py +28 -8
msprobe/mindspore/grad_probe/grad_analyzer.py +27 -13
msprobe/mindspore/grad_probe/grad_monitor.py +16 -1
msprobe/mindspore/grad_probe/grad_stat_csv.py +33 -5
msprobe/mindspore/grad_probe/hook.py +24 -10
msprobe/mindspore/grad_probe/utils.py +18 -5
msprobe/mindspore/ms_config.py +22 -15
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +2 -4
msprobe/mindspore/runtime.py +15 -0
msprobe/mindspore/service.py +36 -30
msprobe/mindspore/task_handler_factory.py +15 -0
msprobe/msprobe.py +24 -7
msprobe/pytorch/__init__.py +3 -2
msprobe/pytorch/api_accuracy_checker/common/config.py +62 -0
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +3 -4
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +9 -0
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +454 -0
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +365 -0
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +6 -1
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +19 -14
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +13 -9
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +77 -53
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +15 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +9 -24
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +4 -12
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +9 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +3 -11
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +2 -2
msprobe/pytorch/bench_functions/confusion_transpose.py +5 -1
msprobe/pytorch/bench_functions/matmul_backward.py +12 -0
msprobe/pytorch/bench_functions/npu_fusion_attention.py +100 -6
msprobe/pytorch/bench_functions/rotary_mul.py +4 -0
msprobe/pytorch/bench_functions/swiglu.py +10 -2
msprobe/pytorch/common/parse_json.py +6 -6
msprobe/pytorch/common/utils.py +56 -5
msprobe/pytorch/compare/distributed_compare.py +8 -9
msprobe/pytorch/compare/pt_compare.py +8 -6
msprobe/pytorch/debugger/debugger_config.py +19 -15
msprobe/pytorch/dump/kernel_dump/kernel_config.py +33 -0
msprobe/pytorch/free_benchmark/common/constant.py +15 -0
msprobe/pytorch/free_benchmark/common/counter.py +15 -0
msprobe/pytorch/free_benchmark/common/enums.py +15 -0
msprobe/pytorch/free_benchmark/common/params.py +8 -1
msprobe/pytorch/free_benchmark/common/utils.py +26 -4
msprobe/pytorch/free_benchmark/compare/grad_saver.py +20 -3
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +2 -0
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +3 -1
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +6 -4
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +2 -0
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +4 -0
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +10 -0
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +6 -5
msprobe/pytorch/grad_probe/grad_monitor.py +23 -6
msprobe/pytorch/grad_probe/grad_stat_csv.py +40 -10
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1 -0
msprobe/pytorch/hook_module/wrap_functional.py +14 -12
msprobe/pytorch/module_processer.py +2 -5
msprobe/pytorch/monitor/anomaly_analyse.py +201 -0
msprobe/pytorch/monitor/anomaly_detect.py +340 -0
msprobe/pytorch/monitor/distributed/__init__.py +0 -0
msprobe/pytorch/monitor/distributed/distributed_ops.yaml +19 -0
msprobe/pytorch/monitor/distributed/stack_blacklist.yaml +5 -0
msprobe/pytorch/monitor/distributed/wrap_distributed.py +272 -0
msprobe/pytorch/monitor/features.py +108 -0
msprobe/pytorch/monitor/module_hook.py +870 -0
msprobe/pytorch/monitor/module_metric.py +193 -0
msprobe/pytorch/monitor/module_spec_verifier.py +93 -0
msprobe/pytorch/monitor/optimizer_collect.py +295 -0
msprobe/pytorch/monitor/unittest/__init__.py +0 -0
msprobe/pytorch/monitor/unittest/test_monitor.py +145 -0
msprobe/pytorch/monitor/utils.py +250 -0
msprobe/pytorch/monitor/visualizer.py +59 -0
msprobe/pytorch/online_dispatch/__init__.py +2 -3
msprobe/pytorch/online_dispatch/compare.py +29 -38
msprobe/pytorch/online_dispatch/dispatch.py +50 -25
msprobe/pytorch/online_dispatch/dump_compare.py +21 -9
msprobe/pytorch/online_dispatch/single_compare.py +53 -32
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +1 -1
msprobe/pytorch/online_dispatch/utils.py +49 -21
msprobe/pytorch/parse_tool/lib/compare.py +12 -18
msprobe/pytorch/parse_tool/lib/config.py +1 -1
msprobe/pytorch/parse_tool/lib/parse_tool.py +1 -2
msprobe/pytorch/parse_tool/lib/utils.py +16 -35
msprobe/pytorch/parse_tool/lib/visualization.py +2 -0
msprobe/pytorch/pt_config.py +31 -8
msprobe/pytorch/service.py +15 -5
msprobe/visualization/__init__.py +14 -0
msprobe/visualization/builder/__init__.py +14 -0
msprobe/visualization/builder/graph_builder.py +165 -0
msprobe/visualization/builder/msprobe_adapter.py +205 -0
msprobe/visualization/compare/__init__.py +14 -0
msprobe/visualization/compare/graph_comparator.py +130 -0
msprobe/visualization/compare/mode_adapter.py +211 -0
msprobe/visualization/graph/__init__.py +14 -0
msprobe/visualization/graph/base_node.py +124 -0
msprobe/visualization/graph/graph.py +200 -0
msprobe/visualization/graph/node_colors.py +95 -0
msprobe/visualization/graph/node_op.py +39 -0
msprobe/visualization/graph_service.py +214 -0
msprobe/visualization/utils.py +232 -0
mindstudio_probe-1.1.0.dist-info/RECORD +0 -287
msprobe/docs/04.acl_config_examples.md +0 -78
msprobe/mindspore/compare/layer_mapping.py +0 -146
msprobe/mindspore/compare/modify_mapping.py +0 -107
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +0 -57
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +0 -122
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/LICENSE +0 -0
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/top_level.txt +0 -0
/msprobe/{mindspore/free_benchmark/decorator → pytorch/monitor}/__init__.py +0 -0

msprobe/core/compare/highlight.py CHANGED Viewed

@@ -20,89 +20,108 @@ from collections import namedtuple
 import numpy as np
 import openpyxl
 from openpyxl.styles import PatternFill
+from tqdm import tqdm
 from msprobe.core.common.utils import get_header_index
 from msprobe.core.common.file_utils import save_workbook
 from msprobe.core.common.log import logger
-from msprobe.core.common.const import CompareConst, FileCheckConst
+from msprobe.core.common.const import CompareConst, FileCheckConst, Const
+from msprobe.core.common.utils import safe_get_value
 class HighlightCheck(abc.ABC):
     @abc.abstractmethod
-    def apply(self, info, color_columns, summary_compare):
+    def apply(self, info, color_columns, dump_mode):
         raise NotImplementedError
+def add_highlight_row_info(color_list, num, highlight_err_msg):
+    for i, (existing_num, existing_err_msg) in enumerate(color_list):
+        if num == existing_num:
+            color_list[i][1].append(highlight_err_msg)
+            return
+    color_list.append((num, [highlight_err_msg]))
 class CheckOrderMagnitude(HighlightCheck):
     """检查Max diff的数量级差异"""
-    def apply(self, info, color_columns, summary_compare=True):
+    def apply(self, info, color_columns, dump_mode):
         api_in, api_out, num = info
-        max_diff_index = get_header_index('Max diff' if summary_compare else 'MaxAbsErr', summary_compare)
+        max_diff_index = get_header_index(CompareConst.MAX_DIFF if dump_mode == Const.SUMMARY
+                                          else CompareConst.MAX_ABS_ERR, dump_mode)
         if abs(api_in[max_diff_index]) > abs(api_out[max_diff_index]):
             return
         in_order = 0 if abs(api_in[max_diff_index]) < 1 else math.log10(abs(api_in[max_diff_index]))
         out_order = 0 if abs(api_out[max_diff_index]) < 1 else math.log10(abs(api_out[max_diff_index]))
         if out_order - in_order >= CompareConst.ORDER_MAGNITUDE_DIFF_YELLOW:
-            color_columns.yellow.append(num)
+            add_highlight_row_info(color_columns.yellow, num,
+                                   "maximum absolute error of both input and output exceed 1, "
+                                   "with the output larger by an order of magnitude")
 class CheckOneThousandErrorRatio(HighlightCheck):
     """检查千分误差比率"""
-    def apply(self, info, color_columns, summary_compare=True):
+    def apply(self, info, color_columns, dump_mode):
         api_in, api_out, num = info
-        one_thousand_index = get_header_index('One Thousandth Err Ratio', summary_compare)
+        one_thousand_index = get_header_index(CompareConst.ONE_THOUSANDTH_ERR_RATIO, dump_mode)
         if (not isinstance(api_in[one_thousand_index], (float, int)) or
                 not isinstance(api_out[one_thousand_index], (float, int))):
             return
         if (api_in[one_thousand_index] > CompareConst.ONE_THOUSAND_ERROR_IN_RED and
                 api_out[one_thousand_index] < CompareConst.ONE_THOUSAND_ERROR_OUT_RED):
-            color_columns.red.append(num)
+            add_highlight_row_info(color_columns.red, num,
+                                   "The input's one thousandth err ratio exceeds 0.9, while the output's is below 0.6")
         elif api_in[one_thousand_index] - api_out[one_thousand_index] > CompareConst.ONE_THOUSAND_ERROR_DIFF_YELLOW:
-            color_columns.yellow.append(num)
+            add_highlight_row_info(color_columns.yellow, num,
+                                   "The output's one thousandth err ratio decreases by more than 0.1 "
+                                   "compared to the input's")
 class CheckCosineSimilarity(HighlightCheck):
     """检查余弦相似度"""
-    def apply(self, info, color_columns, summary_compare=True):
+    def apply(self, info, color_columns, dump_mode):
         api_in, api_out, num = info
-        cosine_index = get_header_index('Cosine', summary_compare)
+        cosine_index = get_header_index(CompareConst.COSINE, dump_mode)
         if not isinstance(api_in[cosine_index], (float, int)) or not isinstance(api_out[cosine_index], (float, int)):
             return
         if api_in[cosine_index] - api_out[cosine_index] > CompareConst.COSINE_DIFF_YELLOW:
-            color_columns.yellow.append(num)
+            add_highlight_row_info(color_columns.yellow, num,
+                                   "The output's cosine decreases by more than 0.1 compared to the input's")
 class CheckMaxRelativeDiff(HighlightCheck):
     """检查最大相对差异"""
-    def apply(self, info, color_columns, summary_compare=True):
+    def apply(self, info, color_columns, dump_mode):
         api_in, api_out, num = info
-        max_diff_index = get_header_index('Max diff', summary_compare)
-        bench_max_index = get_header_index('Bench max', summary_compare)
+        max_diff_index = get_header_index(CompareConst.MAX_DIFF, dump_mode)
+        bench_max_index = get_header_index(CompareConst.BENCH_MAX, dump_mode)
         input_max_relative_diff = np.abs(np.divide(api_in[max_diff_index], max(0.01, api_in[bench_max_index])))
         output_max_relative_diff = np.abs(np.divide(api_out[max_diff_index], max(0.01, api_out[bench_max_index])))
         if not isinstance(input_max_relative_diff, (float, int)) or not isinstance(output_max_relative_diff,
                                                                                    (float, int)):
             return
         if output_max_relative_diff > CompareConst.MAX_RELATIVE_OUT_RED:
-            color_columns.red.append(num)
+            add_highlight_row_info(color_columns.red, num, "maximum relative error exceeds 0.5")
         elif (output_max_relative_diff > CompareConst.MAX_RELATIVE_OUT_YELLOW and
               input_max_relative_diff < CompareConst.MAX_RELATIVE_IN_YELLOW):
-            color_columns.yellow.append(num)
+            add_highlight_row_info(color_columns.yellow, num,
+                                   "The output's maximum relative error exceeds 0.1, while the input's is below 0.01")
 class CheckOverflow(HighlightCheck):
     """检查是否存在溢出"""
-    def apply(self, info, color_columns, summary_compare=True):
+    def apply(self, info, color_columns, dump_mode):
         line, num = info
-        npu_max_index = get_header_index('NPU max', summary_compare)
-        npu_min_index = get_header_index('NPU min', summary_compare)
-        max_diff_index = get_header_index('Max diff' if summary_compare else 'MaxAbsErr', summary_compare)
+        npu_max_index = get_header_index(CompareConst.NPU_MAX, dump_mode)
+        npu_min_index = get_header_index(CompareConst.NPU_MIN, dump_mode)
+        max_diff_index = get_header_index(CompareConst.MAX_DIFF if dump_mode == Const.SUMMARY
+                                          else CompareConst.MAX_ABS_ERR, dump_mode)
         if str(line[npu_max_index]) in CompareConst.OVERFLOW_LIST or str(
                 line[npu_min_index]) in CompareConst.OVERFLOW_LIST:
-            color_columns.red.append(num)
+            add_highlight_row_info(color_columns.red, num, "maximum or minimum is nan, -inf, or inf")
             return
         # check if Max_Diff > 1e+10
-        if isinstance(line[max_diff_index], (float, int)) and line[max_diff_index] > CompareConst.MAX_DIFF_RED:
-            color_columns.red.append(num)
+        if isinstance(line[max_diff_index], (float, int)) and abs(line[max_diff_index]) > CompareConst.MAX_DIFF_RED:
+            add_highlight_row_info(color_columns.red, num, "maximum absolute error exceeds 1e+10")
 class HighlightRules:
@@ -124,13 +143,14 @@ class HighlightRules:
     }
-def find_error_rows(result, last_len, n_num_input, highlight_dict, summary_compare=False, md5_compare=False):
+def find_error_rows(result, last_len, n_num_input, highlight_dict, dump_mode):
     """找到单个API中需要高亮的行"""
-    if md5_compare:
+    if dump_mode == Const.MD5:
         return
-    npu_max_index = get_header_index('NPU max', summary_compare)
-    bench_max_index = get_header_index('Bench max', summary_compare)
-    max_diff_index = get_header_index('Max diff' if summary_compare else 'MaxAbsErr', summary_compare)
+    npu_max_index = get_header_index(CompareConst.NPU_MAX, dump_mode)
+    bench_max_index = get_header_index(CompareConst.BENCH_MAX, dump_mode)
+    max_diff_index = get_header_index(CompareConst.MAX_DIFF if dump_mode == Const.SUMMARY
+                                      else CompareConst.MAX_ABS_ERR, dump_mode)
     red_lines, yellow_lines = [], []
     LineInfo = namedtuple('LineInfo', ['line_data', 'num_pointer'])
@@ -143,7 +163,7 @@ def find_error_rows(result, last_len, n_num_input, highlight_dict, summary_compa
         num = last_len + i
         line_info = LineInfo(line_data=line, num_pointer=num)
         for rule in HighlightRules.basic_rules.values():
-            rule.apply(line_info, color_columns, summary_compare)
+            rule.apply(line_info, color_columns, dump_mode)
     # 对API的输出与输入比较，进行误差判断
     for n, api_out in enumerate(result[n_num_input:len(result)]):
@@ -161,36 +181,42 @@ def find_error_rows(result, last_len, n_num_input, highlight_dict, summary_compa
                 continue
             api_info = ApiInfo(api_input=api_in, api_output=api_out, num_pointer=num)
-            if summary_compare:
+            if dump_mode == Const.SUMMARY:
                 for rule in HighlightRules.summary_compare_rules.values():
-                    rule.apply(api_info, color_columns, summary_compare)
+                    rule.apply(api_info, color_columns, dump_mode)
             else:
                 for rule in HighlightRules.compare_rules.values():
-                    rule.apply(api_info, color_columns, summary_compare)
+                    rule.apply(api_info, color_columns, dump_mode)
-    highlight_dict.get('red_rows', []).extend(list(set(red_lines)))
-    highlight_dict.get('yellow_rows', []).extend(list(set(yellow_lines) - set(red_lines)))
+    red_lines_num_set = {x[0] for x in red_lines}
+    yellow_lines_num_set = {x[0] for x in yellow_lines}
+    highlight_dict.get('red_rows', set()).update(red_lines_num_set)
+    highlight_dict.get('yellow_rows', set()).update(yellow_lines_num_set - red_lines_num_set)
+    highlight_dict.get('red_lines', []).extend(red_lines)
+    highlight_dict.get('yellow_lines', []).extend(yellow_lines)
 def get_name_and_state(name):
     """Get api/module name and state"""
-    if "input" in name:
-        api_name = name.split("input")[0]
-        state = "input"
+    if Const.INPUT in name:
+        api_name = name.split(Const.INPUT)[0]
+        state = Const.INPUT
     else:
-        api_name = name.split("output")[0]
-        state = "output"
+        api_name = name.split(Const.OUTPUT)[0]
+        state = Const.OUTPUT
     return api_name, state
-def find_compare_result_error_rows(result_df, highlight_dict, summary_compare, md5_compare):
+def find_compare_result_error_rows(result_df, highlight_dict, dump_mode):
     """将dataframe根据API分组，并找到有误差的算子用于高亮"""
     result = result_df.values
     start, input_num, output_num, end = 0, 0, 0, len(result_df)
     last_api_name, last_state = None, None
     num, last_len = 0, 0
+    progress_bar = tqdm(total=len(result), desc="API/Module Analyse Progress", unit="item", ncols=100)
     for res_i in result:
-        api_name, state = get_name_and_state(res_i[0])
+        api_full_name = safe_get_value(res_i, 0, "res_i")
+        api_name, state = get_name_and_state(api_full_name)
         if last_api_name:
             if api_name == last_api_name:
                 if state == last_state:
@@ -201,29 +227,33 @@ def find_compare_result_error_rows(result_df, highlight_dict, summary_compare, m
             else:
                 output_num = num
                 find_error_rows(result[start:start + input_num + output_num], start, input_num, highlight_dict,
-                                summary_compare, md5_compare)
+                                dump_mode)
                 num, last_api_name, last_state = 1, api_name, state
                 start += input_num + output_num
                 input_num, output_num = 1, 0
         else:
             num, last_api_name, last_state = 1, api_name, state
+        progress_bar.update(1)
+    progress_bar.close()
     if state:
-        if state == "input":
+        if state == Const.INPUT:
             input_num = num
         else:
             output_num = num
         find_error_rows(result[start:start + input_num + output_num], start, input_num, highlight_dict,
-                        summary_compare, md5_compare)
+                        dump_mode)
 def highlight_rows_xlsx(result_df, highlight_dict, file_path):
     """Write and highlight results in Excel"""
-    logger.info('Compare result is %s' % file_path)
+    update_highlight_err_msg(result_df, highlight_dict)     # add highlight err_msg
     wb = openpyxl.Workbook()
     ws = wb.active
     # write header
+    logger.info('Initializing Excel file.')
     for j, col_name in enumerate(result_df.columns, start=1):
         if not csv_value_is_valid(col_name):
             raise RuntimeError(f"Malicious value [{col_name}] is not allowed to be written into the xlsx: {file_path}.")
@@ -231,20 +261,59 @@ def highlight_rows_xlsx(result_df, highlight_dict, file_path):
     for i, row in enumerate(result_df.iterrows(), start=2):
         for j, value in enumerate(row[1], start=1):
-            if not isinstance(value, (float, int)):
+            if not isinstance(value, (float, int)) or isinstance(value, bool):
                 value = f'{str(value)}\t' if str(value) in ('inf', '-inf', 'nan') else str(value)
             if not csv_value_is_valid(value):
-                raise RuntimeError(f"Malicious value [{value}] is not allowed to be written into the xlsx: {file_path}.")
+                raise RuntimeError(f"Malicious value [{value}] is not allowed to be written into the xlsx: "
+                                   f"{file_path}.")
             ws.cell(row=i, column=j, value=f'{str(value)}\t' if str(value) in ('inf', '-inf', 'nan') else value)
+    # 对可疑数据标色
+    logger.info('Coloring Excel in progress.')
+    col_len = len(result_df.columns)
+    red_fill = PatternFill(
+        start_color=CompareConst.RED, end_color=CompareConst.RED, fill_type="solid"
+    )
+    yellow_fill = PatternFill(
+        start_color=CompareConst.YELLOW, end_color=CompareConst.YELLOW, fill_type="solid",
+    )
+    for i in highlight_dict.get("red_rows", []):
+        for j in range(1, col_len + 1):
+            ws.cell(row=i + 2, column=j).fill = red_fill
+    for i in highlight_dict.get("yellow_rows", []):
+        for j in range(1, col_len + 1):
+            ws.cell(row=i + 2, column=j).fill = yellow_fill
+    logger.info('Saving Excel file to disk: %s' % file_path)
+    save_workbook(wb, file_path)
-            if (i - 2) in highlight_dict['red_rows']:
-                ws.cell(row=i, column=j).fill = PatternFill(start_color=CompareConst.RED,
-                                                            end_color=CompareConst.RED, fill_type="solid")
-            elif (i - 2) in highlight_dict['yellow_rows']:
-                ws.cell(row=i, column=j).fill = PatternFill(start_color=CompareConst.YELLOW,
-                                                            end_color=CompareConst.YELLOW, fill_type="solid")
-    save_workbook(wb, file_path)
+def update_highlight_err_msg(result_df, highlight_dict):
+    if result_df.shape[1] <= 1:
+        return
+    if CompareConst.NPU_MD5 in result_df.columns:
+        return
+    err_msg = result_df.get(CompareConst.ERROR_MESSAGE)
+    red_lines_num_set = highlight_dict.get('red_rows')
+    for color in ['red', 'yellow']:
+        line_key = f'{color}_lines'
+        lines = highlight_dict.get(line_key, [])
+        for line_index, messages in lines:
+            if color == 'yellow' and line_index in red_lines_num_set:
+                continue  # 如果是 yellow 行，且已被 red 行覆盖，跳过
+            for msg in messages:
+                if err_msg[line_index] == '':
+                    err_msg[line_index] = msg
+                else:
+                    err_msg[line_index] += '\n' + msg
+            if color == 'red':
+                red_lines_num_set.add(line_index)
+    result_df[CompareConst.ERROR_MESSAGE] = err_msg
 def csv_value_is_valid(value: str) -> bool:

msprobe/core/compare/layer_mapping/__init__.py ADDED Viewed

@@ -0,0 +1,19 @@
+# Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
+# All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0  (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from msprobe.core.compare.layer_mapping.layer_mapping import (
+    generate_data_mapping_by_layer_mapping,
+    generate_api_mapping_by_layer_mapping,
+)

msprobe/core/compare/layer_mapping/data_scope_parser.py ADDED Viewed

@@ -0,0 +1,235 @@
+# Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
+# All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0  (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import os
+import re
+from copy import deepcopy
+from dataclasses import dataclass
+from typing import ClassVar, Dict, List, Optional, Tuple
+import yaml
+from msprobe.core.common.const import Const
+from msprobe.core.common.file_utils import save_yaml
+from msprobe.core.common.log import logger
+from msprobe.core.common.utils import CompareException, add_time_with_yaml
+from msprobe.core.compare.layer_mapping.postprocess_pass import postprocess_pass
+@dataclass
+class DumpDataItem:
+    """One dump-data entry together with the scopes derived from its name,
+    its construct (parent) information and its call stack.
+
+    An instance is created with the framework identifier only; ``set`` then
+    fills in every derived field.
+    """
+    framework: str
+    data_name: Optional[str] = None
+    api_type: Optional[str] = None
+    api_name: Optional[str] = None
+    type_name: Optional[str] = None
+    full_scope: str = ""
+    layer_scope: str = ""
+    stack_scope: str = ""
+    frame_stack_scope: str = ""
+    user_stack_scope: str = ""
+    construct_scope: str = ""
+    scope_direction: Optional[str] = None
+    # NOTE(review): set_layer_scope stores an element of a str.split() result
+    # here, i.e. a str, despite the int annotation - confirm intended type.
+    scope_id: Optional[int] = None
+    # Class-level variables are declared with ClassVar so that the dataclass
+    # does not treat them as instance fields.
+    # Maps a framework to the api_type value that marks a layer (Cell/Module).
+    framework2layername: ClassVar[Dict[str, str]] = {
+        Const.MS_FRAMEWORK: Const.CELL, Const.PT_FRAMEWORK: Const.MODULE}
+    # Maps a framework to the (start_sign, end_sign) regex pair that
+    # set_stack_scope passes to find_regard_scope.
+    framework2stack_sign: ClassVar[Dict[str, Tuple[str, str]]] = {
+        Const.MS_FRAMEWORK: ("Template", "construct"),
+        Const.PT_FRAMEWORK: ("Template", r"in (for|back)ward,")
+    }
+    @staticmethod
+    def check_stack_valid(stack_info):
+        """Validate that ``stack_info`` is ``None`` or a list of strings.
+
+        Raises:
+            CompareException: with ``INVALID_DATA_ERROR`` when ``stack_info``
+                is not a list or contains a non-string element.
+        """
+        if stack_info is not None:
+            if not isinstance(stack_info, list):
+                logger.error(f"stack is invalid, it should be a list[str], but got {stack_info}")
+                raise CompareException(CompareException.INVALID_DATA_ERROR)
+            for stack in stack_info:
+                if not isinstance(stack, str):
+                    logger.error(f"stack is invalid, it should be a list[str], but got {stack_info}")
+                    raise CompareException(CompareException.INVALID_DATA_ERROR)
+    def set(self, data_name: str, construct_info: Optional[str], stack_info: Optional[List[str]]) -> None:
+        """Populate all derived fields from the raw dump information.
+
+        The setters run in a fixed order because the later ones read fields
+        (``api_type``, ``layer_scope``, stack scopes, ``api_name``) written by
+        the earlier ones.
+        """
+        self.set_name(data_name)
+        self.set_layer_scope(construct_info)
+        self.set_stack_scope(stack_info)
+        self.set_full_scope()
+    def set_name(self, data_name: str) -> None:
+        """Store ``data_name`` and derive ``api_type``, ``type_name`` and
+        ``api_name`` from its ``Const.SEP``-separated fields.
+
+        Raises:
+            CompareException: with ``INVALID_DATA_ERROR`` when the name has
+                fewer than ``abs(Const.LAYER_NAME_INDEX)`` fields.
+        """
+        self.data_name = data_name
+        data_name_list = data_name.split(Const.SEP)
+        # NOTE(review): the message below says "four fields" while the check
+        # uses abs(Const.LAYER_NAME_INDEX) - confirm the two agree.
+        if not data_name_list or len(data_name_list) < abs(Const.LAYER_NAME_INDEX):
+            logger.error(
+                f"The dump data does not comply with the format specification and "
+                f"must contain no less than four fields. "
+                f"The current data is {data_name}"
+            )
+            raise CompareException(CompareException.INVALID_DATA_ERROR)
+        self.api_type = data_name_list[Const.API_TYPE_INDEX]
+        self.type_name = data_name_list[Const.TYPE_NAME_INDEX]
+        # For a layer entry (Cell/Module) the api name is the layer-name
+        # field; for any other entry it is the type name.
+        if self.api_type == self.framework2layername.get(self.framework):
+            self.api_name = data_name_list[Const.LAYER_NAME_INDEX]
+        else:
+            self.api_name = self.type_name
+    def set_layer_scope(self, construct_info: Optional[str]) -> None:
+        """Derive ``layer_scope`` and, when ``construct_info`` is given,
+        ``scope_id`` and ``scope_direction``.
+
+        Layer entries build the scope from their own ``data_name``; other
+        entries build it from ``construct_info``. With neither available the
+        framework's layer type name is used as the scope.
+
+        Raises:
+            CompareException: with ``INVALID_DATA_ERROR`` when a non-empty
+                ``construct_info`` has fewer than
+                ``abs(Const.LAYER_NAME_INDEX)`` fields.
+        """
+        self.construct_scope = construct_info
+        if self.api_type == self.framework2layername.get(self.framework):
+            # remove api name
+            data_list = self.data_name.split(Const.SEP)
+            data_list = data_list[:Const.LAYER_NAME_INDEX] + data_list[Const.TYPE_NAME_INDEX:]
+        elif construct_info:
+            data_list = construct_info.split(Const.SEP)
+        else:
+            data_list = []
+        if data_list:
+            self.layer_scope = Const.SEP.join(data_list[:Const.TYPE_NAME_INDEX])
+        else:
+            self.layer_scope = self.framework2layername.get(self.framework)
+        if construct_info:
+            construct_list = construct_info.split(Const.SEP)
+            if len(construct_list) < abs(Const.LAYER_NAME_INDEX):
+                logger.error(
+                    f"The construct data does not comply with the format specification and "
+                    f"must contain no less than four fields. "
+                    f"The current data is {construct_info}"
+                )
+                raise CompareException(CompareException.INVALID_DATA_ERROR)
+            self.scope_id = construct_list[Const.SCOPE_ID_INDEX]
+            self.scope_direction = construct_list[Const.SCOPE_DIRECTION_INDEX]
+    def set_stack_scope(self, stack_info: Optional[List[str]]) -> None:
+        """Derive ``frame_stack_scope`` and ``user_stack_scope`` from the
+        call stack; layer entries, skipped data types and empty stacks leave
+        both fields untouched.
+
+        Raises:
+            CompareException: propagated from ``check_stack_valid`` when
+                ``stack_info`` is not a list of strings.
+        """
+        # Cell/Module has no stack info
+        if self.api_type == self.framework2layername.get(self.framework):
+            return
+        if self.api_type in Const.DATA_TYPE_SKIP_LIST or not stack_info:
+            return
+        start_sign, end_sign = self.framework2stack_sign.get(self.framework)
+        self.check_stack_valid(stack_info)
+        start_pos, end_pos = find_regard_scope(stack_info, start_sign, end_sign)
+        # Keep only the stack lines strictly between the start and end markers.
+        regard_scope = stack_info[start_pos + 1:end_pos]
+        frame_func_stack_list, user_func_stack_list = find_stack_func_list(regard_scope)
+        self.frame_stack_scope = Const.SEP.join(frame_func_stack_list)
+        self.user_stack_scope = Const.SEP.join(user_func_stack_list)
+    def set_full_scope(self, use_user_func_scope=False, use_frame_func_scope=True) -> None:
+        """Build ``full_scope`` by joining, with ``Const.SEP``, the layer
+        scope, the optional user/framework stack scopes (each only when
+        enabled and non-empty) and the api name.
+        """
+        scope_list = [self.layer_scope]
+        if use_user_func_scope and self.user_stack_scope:
+            scope_list.append(self.user_stack_scope)
+        if use_frame_func_scope and self.frame_stack_scope:
+            scope_list.append(self.frame_stack_scope)
+        scope_list.append(self.api_name)
+        self.full_scope = Const.SEP.join(scope_list)
+def find_regard_scope(lines, start_sign, end_sign):
+    # 找出 start_pos 和 end_pos
+    start_pos = -1
+    end_pos = len(lines)
+    for idx, ii in enumerate(lines):
+        if re.search(start_sign, ii):
+            start_pos = idx
+        elif start_pos >= 0 and re.search(end_sign, ii):
+            end_pos = idx
+            break
+    return start_pos, end_pos
+def find_stack_func_list(lines, record_user=True):
+    res_list = []
+    user_stack = []
+    frame_stack = None
+    no_entrance = True
+    for line in lines:
+        ele_list = line.split(Const.COMMA)
+        file_ele = ele_list[Const.STACK_FILE_INDEX]
+        # if framework func line and no framework entrance found yet
+        if any(ii in file_ele for ii in Const.FRAME_FILE_LIST) and no_entrance:
+            frame_stack = line  # Update the last target index
+        else:
+            if record_user:
+                user_stack.append(line)
+            no_entrance = False
+    # Check if the last string in the list contains target str
+    if frame_stack and no_entrance:
+        no_entrance = False
+    # 过滤和处理 regard_scope
+    frame_func = get_stack_in_lines([frame_stack])
+    user_func = get_stack_in_lines(user_stack)
+    return (frame_func, user_func)
+def get_stack_in_lines(simplified: List[str]):
+    res_list = []
+    if not simplified:
+        return res_list
+    for line in simplified:
+        if not line:
+            continue
+        ele_list = line.split(Const.COMMA)
+        file_ele = ele_list[Const.STACK_FILE_INDEX]
+        if any(ii in file_ele for ii in Const.FILE_SKIP_LIST):
+            continue
+        func_ele = ele_list[Const.STACK_FUNC_INDEX]
+        if any(ii in func_ele for ii in Const.FUNC_SKIP_LIST):
+            continue
+        in_func_name = func_ele.split()[Const.STACK_FUNC_ELE_INDEX]
+        res_list.append(in_func_name)
+    reversed_list = res_list[::-1]
+    return reversed_list
+def dumpdata_representer(dumper, data):
+    d = deepcopy(data.__dict__)
+    d.pop("data_name")
+    return dumper.represent_dict(d)
+def get_dump_data_items(dump, stack, construct, framework, output_path=None):
+    if not stack or not construct:
+        return []
+    name2item = {}
+    data_items = []
+    dump_data = dump.get("data", {})
+    for data_name in dump_data:
+        code_info = stack.get(data_name, None)
+        parent_info = construct.get(data_name, None)
+        data_item = DumpDataItem(framework)
+        data_item.set(data_name, parent_info, code_info)
+        name2item[data_name] = data_item
+        data_items.append(data_item)
+    postprocess_pass(data_items, name2item)
+    if output_path:
+        yaml.add_representer(DumpDataItem, dumpdata_representer)
+        file_name = add_time_with_yaml(f"{framework}_data")
+        file_path = os.path.join(os.path.realpath(output_path), file_name)
+        save_yaml(file_path, name2item)
+    return data_items

mindstudio-probe 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl

mindstudio-probe 1.1.0py3-none-any.whl → 1.1.1py3-none-any.whl