PyPI - mindstudio-probe - Versions diffs - 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl - Mend

mindstudio-probe 1.1.0-py3-none-any.whl → 1.1.1-py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (220)

{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/METADATA +5 -5
mindstudio_probe-1.1.1.dist-info/RECORD +341 -0
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/entry_points.txt +0 -1
msprobe/README.md +39 -3
msprobe/config.json +1 -3
msprobe/core/advisor/advisor.py +8 -3
msprobe/core/common/const.py +113 -13
msprobe/core/common/exceptions.py +25 -3
msprobe/core/common/file_utils.py +150 -26
msprobe/core/common/inplace_op_checker.py +15 -0
msprobe/core/common/log.py +27 -9
msprobe/core/common/utils.py +182 -69
msprobe/core/common_config.py +44 -15
msprobe/core/compare/acc_compare.py +207 -142
msprobe/core/compare/check.py +2 -5
msprobe/core/compare/compare_cli.py +21 -4
msprobe/core/compare/highlight.py +124 -55
msprobe/core/compare/layer_mapping/__init__.py +19 -0
msprobe/core/compare/layer_mapping/data_scope_parser.py +235 -0
msprobe/core/compare/layer_mapping/layer_mapping.py +242 -0
msprobe/core/compare/layer_mapping/postprocess_pass.py +94 -0
msprobe/core/compare/npy_compare.py +52 -23
msprobe/core/compare/utils.py +272 -247
msprobe/core/data_dump/data_collector.py +13 -11
msprobe/core/data_dump/data_processor/base.py +46 -16
msprobe/core/data_dump/data_processor/mindspore_processor.py +4 -4
msprobe/core/data_dump/data_processor/pytorch_processor.py +156 -59
msprobe/core/data_dump/scope.py +113 -34
msprobe/core/grad_probe/constant.py +27 -13
msprobe/core/grad_probe/grad_compare.py +18 -1
msprobe/core/grad_probe/utils.py +30 -2
msprobe/core/overflow_check/abnormal_scene.py +185 -0
msprobe/core/overflow_check/api_info.py +55 -0
msprobe/core/overflow_check/checker.py +138 -0
msprobe/core/overflow_check/filter.py +157 -0
msprobe/core/overflow_check/ignore_rules.yaml +55 -0
msprobe/core/overflow_check/level.py +22 -0
msprobe/core/overflow_check/utils.py +28 -0
msprobe/docs/01.installation.md +10 -0
msprobe/docs/02.config_introduction.md +49 -22
msprobe/docs/03.config_examples.md +2 -9
msprobe/docs/04.kernel_dump_PyTorch.md +73 -0
msprobe/docs/05.data_dump_PyTorch.md +3 -1
msprobe/docs/06.data_dump_MindSpore.md +157 -90
msprobe/docs/07.accuracy_checker_PyTorch.md +12 -12
msprobe/docs/08.accuracy_checker_online_PyTorch.md +1 -6
msprobe/docs/09.accuracy_checker_MindSpore.md +44 -8
msprobe/docs/10.accuracy_compare_PyTorch.md +19 -13
msprobe/docs/11.accuracy_compare_MindSpore.md +104 -13
msprobe/docs/12.overflow_check_PyTorch.md +1 -1
msprobe/docs/13.overflow_check_MindSpore.md +6 -6
msprobe/docs/15.free_benchmarking_PyTorch.md +4 -5
msprobe/docs/16.free_benchmarking_MindSpore.md +56 -37
msprobe/docs/17.grad_probe.md +5 -6
msprobe/docs/19.monitor.md +468 -0
msprobe/docs/20.monitor_performance_baseline.md +52 -0
msprobe/docs/21.visualization_PyTorch.md +386 -0
msprobe/docs/22.visualization_MindSpore.md +384 -0
msprobe/docs/23.tool_function_introduction.md +28 -0
msprobe/docs/FAQ.md +3 -0
msprobe/docs/data_dump_Mindspore/dynamic_graph_quick_start_example.md +211 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/mindspore/__init__.py +15 -0
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +113 -145
msprobe/mindspore/api_accuracy_checker/api_info.py +21 -6
msprobe/mindspore/api_accuracy_checker/api_runner.py +43 -18
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +21 -7
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +77 -0
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +63 -1
msprobe/mindspore/api_accuracy_checker/compute_element.py +59 -24
msprobe/mindspore/api_accuracy_checker/data_manager.py +264 -0
msprobe/mindspore/api_accuracy_checker/main.py +27 -3
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +206 -0
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +58 -0
msprobe/mindspore/api_accuracy_checker/type_mapping.py +22 -5
msprobe/mindspore/api_accuracy_checker/utils.py +34 -17
msprobe/mindspore/cell_processor.py +33 -12
msprobe/mindspore/common/const.py +33 -13
msprobe/mindspore/common/log.py +5 -9
msprobe/mindspore/common/utils.py +43 -4
msprobe/mindspore/compare/distributed_compare.py +22 -22
msprobe/mindspore/compare/ms_compare.py +271 -248
msprobe/mindspore/compare/ms_graph_compare.py +81 -47
msprobe/mindspore/debugger/debugger_config.py +4 -1
msprobe/mindspore/debugger/precision_debugger.py +7 -1
msprobe/mindspore/dump/dump_tool_factory.py +3 -1
msprobe/mindspore/dump/hook_cell/api_registry.py +12 -2
msprobe/mindspore/dump/hook_cell/primitive_hooks.py +13 -16
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +25 -0
msprobe/mindspore/dump/jit_dump.py +17 -5
msprobe/mindspore/dump/kernel_graph_dump.py +2 -4
msprobe/mindspore/dump/kernel_kbyk_dump.py +2 -4
msprobe/mindspore/dym_loader/hook_dynamic_loader.cc +140 -0
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +53 -0
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +145 -39
msprobe/mindspore/free_benchmark/common/handler_params.py +1 -2
msprobe/mindspore/free_benchmark/common/utils.py +19 -4
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -204
msprobe/mindspore/free_benchmark/handler/base_handler.py +3 -3
msprobe/mindspore/free_benchmark/handler/check_handler.py +4 -5
msprobe/mindspore/free_benchmark/handler/fix_handler.py +4 -4
msprobe/mindspore/free_benchmark/handler/handler_factory.py +4 -4
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +2 -2
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +15 -6
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +4 -4
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +2 -2
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +13 -6
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +2 -2
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +2 -2
msprobe/mindspore/grad_probe/global_context.py +28 -8
msprobe/mindspore/grad_probe/grad_analyzer.py +27 -13
msprobe/mindspore/grad_probe/grad_monitor.py +16 -1
msprobe/mindspore/grad_probe/grad_stat_csv.py +33 -5
msprobe/mindspore/grad_probe/hook.py +24 -10
msprobe/mindspore/grad_probe/utils.py +18 -5
msprobe/mindspore/ms_config.py +22 -15
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +2 -4
msprobe/mindspore/runtime.py +15 -0
msprobe/mindspore/service.py +36 -30
msprobe/mindspore/task_handler_factory.py +15 -0
msprobe/msprobe.py +24 -7
msprobe/pytorch/__init__.py +3 -2
msprobe/pytorch/api_accuracy_checker/common/config.py +62 -0
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +3 -4
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +9 -0
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +454 -0
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +365 -0
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +6 -1
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +19 -14
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +13 -9
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +77 -53
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +15 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +9 -24
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +4 -12
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +9 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +3 -11
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +2 -2
msprobe/pytorch/bench_functions/confusion_transpose.py +5 -1
msprobe/pytorch/bench_functions/matmul_backward.py +12 -0
msprobe/pytorch/bench_functions/npu_fusion_attention.py +100 -6
msprobe/pytorch/bench_functions/rotary_mul.py +4 -0
msprobe/pytorch/bench_functions/swiglu.py +10 -2
msprobe/pytorch/common/parse_json.py +6 -6
msprobe/pytorch/common/utils.py +56 -5
msprobe/pytorch/compare/distributed_compare.py +8 -9
msprobe/pytorch/compare/pt_compare.py +8 -6
msprobe/pytorch/debugger/debugger_config.py +19 -15
msprobe/pytorch/dump/kernel_dump/kernel_config.py +33 -0
msprobe/pytorch/free_benchmark/common/constant.py +15 -0
msprobe/pytorch/free_benchmark/common/counter.py +15 -0
msprobe/pytorch/free_benchmark/common/enums.py +15 -0
msprobe/pytorch/free_benchmark/common/params.py +8 -1
msprobe/pytorch/free_benchmark/common/utils.py +26 -4
msprobe/pytorch/free_benchmark/compare/grad_saver.py +20 -3
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +2 -0
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +3 -1
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +6 -4
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +2 -0
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +4 -0
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +10 -0
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +6 -5
msprobe/pytorch/grad_probe/grad_monitor.py +23 -6
msprobe/pytorch/grad_probe/grad_stat_csv.py +40 -10
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1 -0
msprobe/pytorch/hook_module/wrap_functional.py +14 -12
msprobe/pytorch/module_processer.py +2 -5
msprobe/pytorch/monitor/anomaly_analyse.py +201 -0
msprobe/pytorch/monitor/anomaly_detect.py +340 -0
msprobe/pytorch/monitor/distributed/__init__.py +0 -0
msprobe/pytorch/monitor/distributed/distributed_ops.yaml +19 -0
msprobe/pytorch/monitor/distributed/stack_blacklist.yaml +5 -0
msprobe/pytorch/monitor/distributed/wrap_distributed.py +272 -0
msprobe/pytorch/monitor/features.py +108 -0
msprobe/pytorch/monitor/module_hook.py +870 -0
msprobe/pytorch/monitor/module_metric.py +193 -0
msprobe/pytorch/monitor/module_spec_verifier.py +93 -0
msprobe/pytorch/monitor/optimizer_collect.py +295 -0
msprobe/pytorch/monitor/unittest/__init__.py +0 -0
msprobe/pytorch/monitor/unittest/test_monitor.py +145 -0
msprobe/pytorch/monitor/utils.py +250 -0
msprobe/pytorch/monitor/visualizer.py +59 -0
msprobe/pytorch/online_dispatch/__init__.py +2 -3
msprobe/pytorch/online_dispatch/compare.py +29 -38
msprobe/pytorch/online_dispatch/dispatch.py +50 -25
msprobe/pytorch/online_dispatch/dump_compare.py +21 -9
msprobe/pytorch/online_dispatch/single_compare.py +53 -32
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +1 -1
msprobe/pytorch/online_dispatch/utils.py +49 -21
msprobe/pytorch/parse_tool/lib/compare.py +12 -18
msprobe/pytorch/parse_tool/lib/config.py +1 -1
msprobe/pytorch/parse_tool/lib/parse_tool.py +1 -2
msprobe/pytorch/parse_tool/lib/utils.py +16 -35
msprobe/pytorch/parse_tool/lib/visualization.py +2 -0
msprobe/pytorch/pt_config.py +31 -8
msprobe/pytorch/service.py +15 -5
msprobe/visualization/__init__.py +14 -0
msprobe/visualization/builder/__init__.py +14 -0
msprobe/visualization/builder/graph_builder.py +165 -0
msprobe/visualization/builder/msprobe_adapter.py +205 -0
msprobe/visualization/compare/__init__.py +14 -0
msprobe/visualization/compare/graph_comparator.py +130 -0
msprobe/visualization/compare/mode_adapter.py +211 -0
msprobe/visualization/graph/__init__.py +14 -0
msprobe/visualization/graph/base_node.py +124 -0
msprobe/visualization/graph/graph.py +200 -0
msprobe/visualization/graph/node_colors.py +95 -0
msprobe/visualization/graph/node_op.py +39 -0
msprobe/visualization/graph_service.py +214 -0
msprobe/visualization/utils.py +232 -0
mindstudio_probe-1.1.0.dist-info/RECORD +0 -287
msprobe/docs/04.acl_config_examples.md +0 -78
msprobe/mindspore/compare/layer_mapping.py +0 -146
msprobe/mindspore/compare/modify_mapping.py +0 -107
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +0 -57
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +0 -122
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/LICENSE +0 -0
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/top_level.txt +0 -0
msprobe/{mindspore/free_benchmark/decorator → pytorch/monitor}/__init__.py +0 -0

msprobe/core/compare/utils.py CHANGED Viewed

@@ -15,28 +15,31 @@
 import os
 import re
+import math
+import zlib
+from dataclasses import dataclass
 import numpy as np
 from msprobe.core.common.const import Const, CompareConst
-from msprobe.core.common.utils import CompareException, check_regex_prefix_format_valid, logger
+from msprobe.core.common.utils import CompareException, check_regex_prefix_format_valid, logger, safe_get_value
 from msprobe.core.common.file_utils import check_file_or_directory_path
 def extract_json(dirname, stack_json=False):
     json_path = ''
-    for fname in os.listdir(dirname):
-        if fname == "construct.json":
-            continue
-        full_path = os.path.join(dirname, fname)
-        if full_path.endswith('.json'):
-            json_path = full_path
-            if not stack_json and 'stack' not in json_path:
-                break
-            if stack_json and 'stack' in json_path:
-                break
+    for filename in os.listdir(dirname):
+        target_file_name = 'stack.json' if stack_json else 'dump.json'
+        if filename == target_file_name:
+            json_path = os.path.join(dirname, filename)
+            break
     # Provide robustness on invalid directory inputs
     if not json_path:
-        logger.error(f'No file is found in dump dir {dirname}. ')
+        if stack_json:
+            logger.error(f'stack.json is not found in dump dir {dirname}.')
+        else:
+            logger.error(f'dump.json is not found in dump dir {dirname}.')
         raise CompareException(CompareException.NO_DUMP_FILE_ERROR)
     return json_path
@@ -44,7 +47,7 @@ def extract_json(dirname, stack_json=False):
 def check_and_return_dir_contents(dump_dir, prefix):
     """
     check the given dump dir and validate files in dump dir by using the given prefix patterns to build a
-    pattern: ^{prefix}(?:0|[0-9][1-9]*)?$
+    pattern: ^{prefix}(?:0|[1-9][0-9]*)?$
     Args:
         dump_dir (str): dump dir
@@ -60,7 +63,7 @@ def check_and_return_dir_contents(dump_dir, prefix):
     check_regex_prefix_format_valid(prefix)
     check_file_or_directory_path(dump_dir, True)
     contents = os.listdir(dump_dir)
-    pattern = re.compile(rf'^{prefix}(?:0|[0-9][1-9]*)?$')
+    pattern = re.compile(rf'^{prefix}(?:0|[1-9][0-9]*)?$')
     for name in contents:
         if not pattern.match(name):
             logger.error(
@@ -84,122 +87,89 @@ def rename_api(npu_name, process):
 def read_op(op_data, op_name):
+    io_name_mapping = {
+        Const.INPUT_ARGS: '.input',
+        Const.INPUT_KWARGS: '.input',
+        Const.INPUT: '.input',
+        Const.OUTPUT: '.output'
+    }
     op_parsed_list = []
-    if Const.FORWARD in op_name:
-        if Const.INPUT_ARGS in op_data:
-            input_item = op_data[Const.INPUT_ARGS]
-            input_parsed_list = op_item_parse(input_item, op_name + '.input', None)
-            op_parsed_list = input_parsed_list.copy()
-            input_parsed_list.clear()
-        if Const.INPUT_KWARGS in op_data:
-            kwargs_item = op_data[Const.INPUT_KWARGS]
-            if isinstance(kwargs_item, dict) and "type" in kwargs_item or isinstance(kwargs_item, list):
-                kwarg_parsed_list = op_item_parse(kwargs_item, op_name + '.input', None)
-                op_parsed_list += kwarg_parsed_list
-                kwarg_parsed_list.clear()
-            elif kwargs_item:
-                for kwarg in kwargs_item:
-                    kwarg_parsed_list = op_item_parse(kwargs_item[kwarg], op_name + '.input.' + kwarg, None)
-                    op_parsed_list += kwarg_parsed_list
-                    kwarg_parsed_list.clear()
-        if Const.OUTPUT in op_data:
-            output_item = op_data[Const.OUTPUT]
-            output_parsed_list = op_item_parse(output_item, op_name + '.output', None)
-            op_parsed_list += output_parsed_list
-            output_parsed_list.clear()
-    if Const.BACKWARD in op_name:
-        if Const.INPUT in op_data:
-            input_item = op_data[Const.INPUT]
-            input_parsed_list = op_item_parse(input_item, op_name + '.input', None)
-            op_parsed_list = input_parsed_list.copy()
-            input_parsed_list.clear()
-        if Const.OUTPUT in op_data:
-            output_item = op_data[Const.OUTPUT]
-            output_parsed_list = op_item_parse(output_item, op_name + '.output', None)
-            op_parsed_list += output_parsed_list
-            output_parsed_list.clear()
+    for name in io_name_mapping:
+        if name in op_data:
+            op_parsed_list.extend(op_item_parse(op_data[name], op_name + io_name_mapping[name]))
     return op_parsed_list
-def op_item_parse(item, op_name, index, item_list=None, top_bool=True, depth=0):
+def op_item_parse(op_data, op_name: str, depth: int = 0) -> list:
+    default_item = {
+        'full_op_name': op_name,
+        'type': None,
+        'Max': None,
+        'Min': None,
+        'Mean': None,
+        'Norm': None,
+        'dtype': None,
+        'shape': None,
+        'md5': None,
+        'value': None,
+        'data_name': '-1'
+    }
     if depth > Const.MAX_DEPTH:
-        logger.error(f"parse of api/module of {op_name} exceeds the recursion limit.")
+        logger.error(f'parse of api/module of {op_name} exceeds the recursion limit.')
         raise CompareException(CompareException.RECURSION_LIMIT_ERROR)
-    if item_list is None:
-        item_list = []
-    if item is None or (isinstance(item, dict) and not item):
-        if not top_bool:
-            tmp = {
-                'full_op_name': op_name + '.' + str(index), 'Max': None, 'Min': None, 'Mean': None, 'Norm': None,
-                'dtype': None, 'shape': None, 'md5': None, 'data_name': '-1'
-            }
-        else:
-            tmp = {
-                'full_op_name': op_name + '.0', 'Max': None, 'Min': None, 'Mean': None, 'Norm': None, 'dtype': None,
-                'shape': None, 'md5': None, 'data_name': '-1'
-            }
-        item_list.append(tmp)
-        return item_list
-    if index is None:
-        if isinstance(item, dict):
-            full_op_name = op_name + '.0'
-        else:
-            full_op_name = op_name
-    else:
-        full_op_name = op_name + Const.SEP + str(index)
-    if isinstance(item, dict):
-        if 'type' not in item:
-            for kwarg in item:
-                kwarg_parsed_list = op_item_parse(item[kwarg], op_name + Const.SEP + kwarg, None, depth=depth+1)
-                item_list += kwarg_parsed_list
-                kwarg_parsed_list.clear()
-        elif 'dtype' in item:
-            parsed_item = item
-            parsed_item['full_op_name'] = full_op_name
-            item_list.append(parsed_item)
-        elif 'type' in item:
-            parsed_item = {}
-            if item['type'] == 'torch.Size':
-                parsed_item['full_op_name'] = full_op_name
-                parsed_item['dtype'] = 'torch.Size'
-                parsed_item['shape'] = str(item['value'])
-                parsed_item['md5'] = None
-                parsed_item['Max'] = None
-                parsed_item['Min'] = None
-                parsed_item['Mean'] = None
-                parsed_item['Norm'] = None
-                parsed_item['data_name'] = '-1'
-                item_list.append(parsed_item)
-            elif item['type'] == 'slice':
-                parsed_item['full_op_name'] = full_op_name
-                parsed_item['dtype'] = 'slice'
-                parsed_item['shape'] = str(np.shape(np.array(item['value'])))
-                parsed_item['md5'] = None
-                parsed_item['Max'] = None
-                parsed_item['Min'] = None
-                parsed_item['Mean'] = None
-                parsed_item['Norm'] = None
-                parsed_item['data_name'] = '-1'
-                item_list.append(parsed_item)
-            else:
-                parsed_item['full_op_name'] = full_op_name
-                parsed_item['dtype'] = str(type(item['value']))
-                parsed_item['shape'] = '[]'
-                parsed_item['md5'] = None
-                parsed_item['Max'] = item['value']
-                parsed_item['Min'] = item['value']
-                parsed_item['Mean'] = item['value']
-                parsed_item['Norm'] = item['value']
-                parsed_item['data_name'] = '-1'
-                item_list.append(parsed_item)
-        else:
-            resolve_api_special_parameters(item, full_op_name, item_list)
-    else:
-        for j, item_spec in enumerate(item):
-            op_item_parse(item_spec, full_op_name, j, item_list=item_list, top_bool=False, depth=depth+1)
+    if op_data is None:
+        return [default_item]
+    elif not op_data:
+        return []
+    item_list = []
+    if isinstance(op_data, list):
+        for i, data in enumerate(op_data):
+            item_list.extend(op_item_parse(data, op_name + Const.SEP + str(i), depth + 1))
+    elif isinstance(op_data, dict):
+        if is_leaf_data(op_data):
+            return [gen_op_item(op_data, op_name)]
+        for sub_name, sub_data in op_data.items():
+            item_list.extend(op_item_parse(sub_data, op_name + Const.SEP + str(sub_name), depth + 1))
     return item_list
+def is_leaf_data(op_data):
+    return 'type' in op_data and isinstance(op_data['type'], str)
+def gen_op_item(op_data, op_name):
+    op_item = {}
+    op_item.update(op_data)
+    op_item['full_op_name'] = op_name
+    op_item['data_name'] = op_data.get('data_name', '-1')
+    params = ['Max', 'Min', 'Mean', 'Norm']
+    for i in params:
+        if i not in op_item:
+            op_item[i] = None
+    if not op_item.get('dtype'):
+        if op_item.get('type') == 'torch.Size':
+            op_item['dtype'] = op_data.get('type')
+            op_item['shape'] = str(op_data.get('value'))
+        elif op_item.get('type') == 'slice':
+            op_item['dtype'] = op_data.get('type')
+            op_item['shape'] = str(np.shape(np.array(op_data.get('value'))))
+        else:
+            op_item['dtype'] = str(type(op_data.get('value')))
+            op_item['shape'] = '[]'
+            for i in params:
+                op_item[i] = op_data.get('value')
+    if not op_item.get('md5'):
+        op_item['md5'] = f"{zlib.crc32(str(op_data.get('value', '')).encode()):08x}"
+    return op_item
 def resolve_api_special_parameters(data_dict, full_op_name, item_list):
     """
     Function Description:
@@ -231,131 +201,173 @@ def resolve_api_special_parameters(data_dict, full_op_name, item_list):
             item_list.append(parsed_item)
-def get_accuracy(result, n_dict, b_dict, summary_compare=False, md5_compare=False):
+def process_summary_data(summary_data):
+    """处理summary_data中的nan值，返回处理后的列表"""
+    return [CompareConst.NAN if isinstance(x, float) and math.isnan(x) else x for x in summary_data]
+def get_rela_diff_summary_mode(result_item, npu_summary_data, bench_summary_data, err_msg):
+    start_idx = CompareConst.SUMMARY_COMPARE_RESULT_HEADER.index(CompareConst.MAX_DIFF)
+    warning_flag = False
+    for i, (npu_val, bench_val) in enumerate(zip(npu_summary_data, bench_summary_data)):
+        if all(isinstance(val, (float, int)) and not isinstance(val, bool) for val in [npu_val, bench_val]):
+            diff = npu_val - bench_val
+            if math.isnan(diff):
+                diff = CompareConst.NAN
+                relative = CompareConst.NAN
+            else:
+                if bench_val != 0:
+                    relative = str(abs((diff / bench_val) * 100)) + '%'
+                else:
+                    relative = CompareConst.N_A
+                magnitude_diff = abs(diff) / (max(abs(npu_val), abs(bench_val)) + CompareConst.EPSILON)
+                if magnitude_diff > CompareConst.MAGNITUDE:
+                    warning_flag = True
+            result_item[start_idx + i] = diff
+            result_item[start_idx + i + CompareConst.STATISTICS_INDICATOR_NUM] = relative
+        else:
+            result_item[start_idx + i] = CompareConst.N_A
+            result_item[start_idx + i + CompareConst.STATISTICS_INDICATOR_NUM] = CompareConst.N_A
+    accuracy_check = CompareConst.WARNING if warning_flag else ""
+    err_msg += "Need double check api accuracy." if warning_flag else ""
+    for i in range(start_idx, len(result_item)):
+        if str(result_item[i]) in ('inf', '-inf', 'nan'):
+            result_item[i] = f'{result_item[i]}\t'
+    return result_item, accuracy_check, err_msg
+@dataclass
+class ApiItemInfo:
+    name: str
+    struct: tuple
+    stack_info: list
+def stack_column_process(result_item, has_stack, index, key, npu_stack_info):
+    if has_stack and index == 0 and key == CompareConst.INPUT_STRUCT:
+        result_item.extend(npu_stack_info)
+    else:
+        result_item.append(CompareConst.NONE)
+    return result_item
+def result_item_init(n_info, b_info, dump_mode):
+    n_len = len(n_info.struct)
+    b_len = len(b_info.struct)
+    struct_long_enough = (n_len > 2 and b_len > 2) if dump_mode == Const.MD5 else (n_len > 1 and b_len > 1)
+    if struct_long_enough:
+        result_item = [
+            n_info.name, b_info.name, n_info.struct[0], b_info.struct[0], n_info.struct[1], b_info.struct[1]
+        ]
+        if dump_mode == Const.MD5:
+            md5_compare_result = CompareConst.PASS if n_info.struct[2] == b_info.struct[2] else CompareConst.DIFF
+            result_item.extend([n_info.struct[2], b_info.struct[2], md5_compare_result])
+        elif dump_mode == Const.SUMMARY:
+            result_item.extend([" "] * 8)
+        else:
+            result_item.extend([" "] * 5)
+    else:
+        err_msg = "index out of bounds error will occur in result_item_init, please check!\n" \
+                  f"npu_info_struct is {n_info.struct}\n" \
+                  f"bench_info_struct is {b_info.struct}"
+        logger.error(err_msg)
+        raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR)
+    return result_item
+def get_accuracy(result, n_dict, b_dict, dump_mode):
     def get_accuracy_core(n_start, n_len, b_start, b_len, key):
         min_len = min(n_len, b_len)
         npu_stack_info = n_dict.get("stack_info", None)
         bench_stack_info = b_dict.get("stack_info", None)
         has_stack = npu_stack_info and bench_stack_info
-        all_mode_bool = not (summary_compare or md5_compare)
-        if all_mode_bool:
+        if dump_mode == Const.ALL:
             npu_data_name = n_dict.get("data_name", None)
             bench_data_name = b_dict.get("data_name", None)
         for index in range(min_len):
-            n_name = n_dict['op_name'][n_start + index]
-            b_name = b_dict['op_name'][b_start + index]
-            n_struct = n_dict[key][index]
-            b_struct = b_dict[key][index]
+            n_name = safe_get_value(n_dict, n_start + index, "n_dict", key="op_name")
+            b_name = safe_get_value(b_dict, b_start + index, "b_dict", key="op_name")
+            n_struct = safe_get_value(n_dict, index, "n_dict", key=key)
+            b_struct = safe_get_value(b_dict, index, "b_dict", key=key)
             err_msg = ""
-            if md5_compare:
-                result_item = [
-                    n_name, b_name, n_struct[0], b_struct[0], n_struct[1], b_struct[1], n_struct[2], b_struct[2],
-                    CompareConst.PASS if n_struct[2] == b_struct[2] else CompareConst.DIFF
-                ]
-                if has_stack and index == 0 and key == "input_struct":
-                    result_item.extend(npu_stack_info)
-                else:
-                    result_item.append(CompareConst.NONE)
+            npu_info = ApiItemInfo(n_name, n_struct, npu_stack_info)
+            bench_info = ApiItemInfo(b_name, b_struct, bench_stack_info)
+            result_item = result_item_init(npu_info, bench_info, dump_mode)
+            if dump_mode == Const.MD5:
+                result_item = stack_column_process(result_item, has_stack, index, key, npu_stack_info)
                 result.append(result_item)
                 continue
-            if summary_compare:
-                result_item = [
-                    n_name, b_name, n_struct[0], b_struct[0], n_struct[1], b_struct[1],
-                    " ", " ", " ", " ", " ", " ", " ", " "
-                ]
-            else:
-                result_item = [
-                    n_name, b_name, n_struct[0], b_struct[0], n_struct[1], b_struct[1],
-                    " ", " ", " ", " ", " "
-                ]
-            npu_summary_data = n_dict.get(CompareConst.SUMMARY)[n_start + index]
-            result_item.extend(npu_summary_data)
-            bench_summary_data = b_dict.get(CompareConst.SUMMARY)[b_start + index]
-            result_item.extend(bench_summary_data)
-            if summary_compare:
-                start_idx = CompareConst.SUMMARY_COMPARE_RESULT_HEADER.index(CompareConst.MAX_DIFF)
-                warning_flag = False
-                for i, (npu_val, bench_val) in enumerate(zip(npu_summary_data, bench_summary_data)):
-                    if isinstance(npu_val, (float, int)) and isinstance(bench_val, (float, int)):
-                        diff = npu_val - bench_val
-                        if bench_val != 0:
-                            relative = str(abs((diff / bench_val) * 100)) + '%'
-                        else:
-                            relative = CompareConst.N_A
-                        result_item[start_idx + i] = diff
-                        result_item[start_idx + i + 4] = relative
-                        magnitude_diff = abs(diff) / (max(abs(npu_val), abs(bench_val)) + 1e-10)
-                        if magnitude_diff > 0.5:
-                            warning_flag = True
-                    else:
-                        result_item[start_idx + i] = CompareConst.NONE
-                accuracy_check = CompareConst.WARNING if warning_flag else ""
-                err_msg += "Need double check api accuracy." if warning_flag else ""
-                for i in range(start_idx, len(result_item)):
-                    if str(result_item[i]) in ('inf', '-inf', 'nan'):
-                        result_item[i] = f'{result_item[i]}\t'
-            result_item.append(accuracy_check if summary_compare else CompareConst.ACCURACY_CHECK_YES)
+            npu_summary_data = safe_get_value(n_dict, n_start + index, "n_dict", key=CompareConst.SUMMARY)
+            bench_summary_data = safe_get_value(b_dict, b_start + index, "b_dict", key=CompareConst.SUMMARY)
+            result_item.extend(process_summary_data(npu_summary_data))
+            result_item.extend(process_summary_data(bench_summary_data))
+            if dump_mode == Const.SUMMARY:
+                result_item, accuracy_check, err_msg = get_rela_diff_summary_mode(result_item, npu_summary_data,
+                                                                                  bench_summary_data, err_msg)
+            result_item.append(accuracy_check if dump_mode == Const.SUMMARY else CompareConst.ACCURACY_CHECK_YES)
             result_item.append(err_msg)
-            if has_stack and index == 0 and key == "input_struct":
-                result_item.extend(npu_stack_info)
-            else:
-                result_item.append(CompareConst.NONE)
-            if all_mode_bool:
-                result_item.append(npu_data_name[n_start + index])
+            result_item = stack_column_process(result_item, has_stack, index, key, npu_stack_info)
+            if dump_mode == Const.ALL:
+                result_item.append(safe_get_value(npu_data_name, n_start + index, "npu_data_name"))
             result.append(result_item)
         if n_len > b_len:
             for index in range(b_len, n_len):
-                n_name = n_dict['op_name'][n_start + index]
-                n_struct = n_dict[key][index]
-                if md5_compare:
+                try:
+                    n_name = n_dict['op_name'][n_start + index]
+                    n_struct = n_dict[key][index]
+                    if dump_mode == Const.MD5:
+                        result_item = [
+                            n_name, CompareConst.NAN, n_struct[0], CompareConst.NAN, n_struct[1], CompareConst.NAN,
+                            n_struct[2], CompareConst.NAN, CompareConst.NAN
+                        ]
+                        result.append(result_item)
+                        continue
                     result_item = [
                         n_name, CompareConst.NAN, n_struct[0], CompareConst.NAN, n_struct[1], CompareConst.NAN,
-                        n_struct[2], CompareConst.NAN, CompareConst.NAN
+                        " ", " ", " ", " ", " "
                     ]
-                    result.append(result_item)
-                    continue
-                result_item = [
-                    n_name, CompareConst.NAN, n_struct[0], CompareConst.NAN, n_struct[1], CompareConst.NAN,
-                    " ", " ", " ", " ", " "
-                ]
-                summary_data = n_dict.get(CompareConst.SUMMARY)[n_start + index]
-                result_item.extend(summary_data)
-                summary_data = [CompareConst.NAN for _ in range(len(n_dict.get(CompareConst.SUMMARY)[0]))]
-                result_item.extend(summary_data)
+                    summary_data = n_dict.get(CompareConst.SUMMARY)[n_start + index]
+                    result_item.extend(summary_data)
+                    summary_data = [CompareConst.NAN for _ in range(len(n_dict.get(CompareConst.SUMMARY)[0]))]
+                    result_item.extend(summary_data)
+                except IndexError as e:
+                    err_msg = "index out of bounds error occurs, please check!\n" \
+                              f"n_dict is {n_dict}"
+                    logger.error(err_msg)
+                    raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR) from e
                 err_msg = ""
                 result_item.append(CompareConst.ACCURACY_CHECK_YES)
                 result_item.append(err_msg)
-                if has_stack and index == 0 and key == "input_struct":
-                    result_item.extend(npu_stack_info)
-                else:
-                    result_item.append(CompareConst.NONE)
-                if all_mode_bool:
-                    result_item.append(npu_data_name[n_start + index])
+                result_item = stack_column_process(result_item, has_stack, index, key, npu_stack_info)
+                if dump_mode == Const.ALL:
+                    result_item.append(safe_get_value(npu_data_name, n_start + index, "npu_data_name"))
                 result.append(result_item)
     n_num = len(n_dict['op_name'])
     b_num = len(b_dict['op_name'])
-    n_num_input = len([name for name in n_dict['op_name'] if Const.INPUT in name.split(Const.SEP) or Const.KWARGS in name.split(Const.SEP)])
-    b_num_input = len([name for name in b_dict['op_name'] if Const.INPUT in name.split(Const.SEP) or Const.KWARGS in name.split(Const.SEP)])
+    n_num_input = len([name for name in n_dict['op_name']
+                       if Const.INPUT in name.split(Const.SEP) or Const.KWARGS in name.split(Const.SEP)])
+    b_num_input = len([name for name in b_dict['op_name']
+                       if Const.INPUT in name.split(Const.SEP) or Const.KWARGS in name.split(Const.SEP)])
     n_num_output = n_num - n_num_input
     b_num_output = b_num - b_num_input
     get_accuracy_core(0, n_num_input, 0, b_num_input, 'input_struct')
     get_accuracy_core(n_num_input, n_num_output, b_num_input, b_num_output, 'output_struct')
-def get_un_match_accuracy(result, n_dict, md5_compare, summary_compare):
+def get_un_match_accuracy(result, n_dict, dump_mode):
     index_out = 0
     npu_stack_info = n_dict.get("stack_info", None)
     bench_name, bench_type, bench_shape = CompareConst.N_A, CompareConst.N_A, CompareConst.N_A
@@ -363,14 +375,22 @@ def get_un_match_accuracy(result, n_dict, md5_compare, summary_compare):
     accuracy_check_res = CompareConst.N_A
     for index, n_name in enumerate(n_dict["op_name"]):
         name_ele_list = n_name.split(Const.SEP)
-        if "input" in name_ele_list:
-            n_struct = n_dict["input_struct"][index]
-        else:
-            n_struct = n_dict["output_struct"][index_out]
+        if Const.INPUT in name_ele_list or Const.KWARGS in name_ele_list:
+            n_struct = safe_get_value(n_dict, index, "n_dict", key=CompareConst.INPUT_STRUCT)
+        if Const.OUTPUT in name_ele_list:
+            n_struct = safe_get_value(n_dict, index_out, "n_dict", key=CompareConst.OUTPUT_STRUCT)
             index_out += 1
-        result_item = [n_name, bench_name, n_struct[0], bench_type, n_struct[1], bench_shape]
-        if md5_compare:
+        try:
+            result_item = [n_name, bench_name, n_struct[0], bench_type, n_struct[1], bench_shape]
+        except IndexError as e:
+            err_msg = "index out of bounds error occurs, please check!\n" \
+                      f"op_name of n_dict is {n_dict['op_name']}\n" \
+                      f"input_struct of n_dict is {n_dict[CompareConst.INPUT_STRUCT]}\n" \
+                      f"output_struct of n_dict is {n_dict[CompareConst.OUTPUT_STRUCT]}"
+            logger.error(err_msg)
+            raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR) from e
+        if dump_mode == Const.MD5:
             result_item.extend([CompareConst.N_A] * 3)
             if npu_stack_info and index == 0:
                 result_item.extend(npu_stack_info)
@@ -378,11 +398,11 @@ def get_un_match_accuracy(result, n_dict, md5_compare, summary_compare):
                 result_item.append(CompareConst.NONE)
             result.append(result_item)
             continue
-        if summary_compare:
+        if dump_mode == Const.SUMMARY:
             result_item.extend([CompareConst.N_A] * 8)
         else:
             result_item.extend([CompareConst.N_A] * 5)
-        npu_summary_data = n_dict.get("summary")[index]
+        npu_summary_data = safe_get_value(n_dict, index, "n_dict", key=CompareConst.SUMMARY)
         result_item.extend(npu_summary_data)
         bench_summary_data = [CompareConst.N_A] * 4
         result_item.extend(bench_summary_data)
@@ -392,22 +412,21 @@ def get_un_match_accuracy(result, n_dict, md5_compare, summary_compare):
             result_item.extend(npu_stack_info)
         else:
             result_item.append(CompareConst.NONE)
-        if not md5_compare and not summary_compare and result_item[1] == CompareConst.N_A:
+        if dump_mode == Const.ALL and result_item[1] == CompareConst.N_A:
             result_item.extend(["-1"])
         result.append(result_item)
-def merge_tensor(tensor_list, summary_compare, md5_compare):
+def merge_tensor(tensor_list, dump_mode):
     op_dict = {}
     op_dict["op_name"] = []
-    op_dict["input_struct"] = []
-    op_dict["kwargs_struct"] = []
-    op_dict["output_struct"] = []
-    op_dict["summary"] = []
+    op_dict[CompareConst.INPUT_STRUCT] = []
+    op_dict[CompareConst.KWARGS_STRUCT] = []
+    op_dict[CompareConst.OUTPUT_STRUCT] = []
+    op_dict[Const.SUMMARY] = []
     op_dict["stack_info"] = []
-    all_mode_bool = not (summary_compare or md5_compare)
-    if all_mode_bool:
+    if dump_mode == Const.ALL:
         op_dict["data_name"] = []
     for tensor in tensor_list:
@@ -416,38 +435,44 @@ def merge_tensor(tensor_list, summary_compare, md5_compare):
             break
         op_dict["op_name"].append(tensor['full_op_name'])
         name_ele_list = tensor['full_op_name'].split(Const.SEP)
-        if not md5_compare:
-            if "input" in name_ele_list:
-                op_dict["input_struct"].append((tensor['dtype'], tensor['shape']))
-            elif "kwarg" in name_ele_list:
-                op_dict["kwargs_struct"].append((tensor['dtype'], tensor['shape']))
-            elif "output" in name_ele_list:
-                op_dict["output_struct"].append((tensor['dtype'], tensor['shape']))
-        else:
-            if "input" in name_ele_list:
-                op_dict["input_struct"].append((tensor['dtype'], tensor['shape'], tensor['md5']))
-            if "kwarg" in name_ele_list:
-                op_dict["kwargs_struct"].append((tensor['dtype'], tensor['shape'], tensor['md5']))
-            elif "output" in name_ele_list:
-                op_dict["output_struct"].append((tensor['dtype'], tensor['shape'], tensor['md5']))
-        op_dict["summary"].append([tensor['Max'], tensor['Min'], tensor['Mean'], tensor['Norm']])
-        if all_mode_bool:
+        name_to_struct_mapping = {
+            Const.INPUT: CompareConst.INPUT_STRUCT,
+            Const.KWARGS: CompareConst.KWARGS_STRUCT,
+            Const.OUTPUT: CompareConst.OUTPUT_STRUCT
+        }
+        for name_key, struct_key in name_to_struct_mapping.items():
+            if name_key in name_ele_list:
+                if dump_mode == Const.MD5:
+                    op_dict.get(struct_key).append((tensor[Const.DTYPE], tensor[Const.SHAPE], tensor[Const.MD5]))
+                else:
+                    op_dict.get(struct_key).append((tensor[Const.DTYPE], tensor[Const.SHAPE]))
+                break
+        op_dict[Const.SUMMARY].append([tensor[Const.MAX], tensor[Const.MIN], tensor[Const.MEAN], tensor[Const.NORM]])
+        if dump_mode == Const.ALL:
             op_dict["data_name"].append(tensor['data_name'])
-            data_name = op_dict["data_name"][-1].rsplit(Const.SEP, 1)[0]
+            data_name = safe_get_value(op_dict, -1, "op_dict", key="data_name").rsplit(Const.SEP, 1)[0]
             if data_name != "-1":
                 op_dict["op_name"][-1] = data_name
-    if not op_dict["kwargs_struct"]:
-        del op_dict["kwargs_struct"]
+    if not op_dict[CompareConst.KWARGS_STRUCT]:
+        del op_dict[CompareConst.KWARGS_STRUCT]
     return op_dict if op_dict["op_name"] else {}
+def print_compare_ends_info():
+    total_len = len(CompareConst.COMPARE_ENDS_SUCCESSFULLY) + Const.FILL_CHAR_NUMS
+    logger.info('*' * total_len)
+    logger.info(f"*{CompareConst.COMPARE_ENDS_SUCCESSFULLY.center(total_len - 2)}*")
+    logger.info('*' * total_len)
 def _compare_parser(parser):
     parser.add_argument("-i", "--input_path", dest="input_path", type=str,
                         help="<Required> The compare input path, a dict json.", required=True)
     parser.add_argument("-o", "--output_path", dest="output_path", type=str,
-                        help="<Required> The compare task result out path.", required=True)
+                        help="<Required> The compare task result out path. Default path: ./output",
+                        required=False, default="./output", nargs="?", const="./output")
     parser.add_argument("-s", "--stack_mode", dest="stack_mode", action="store_true",
                         help="<optional> Whether to save stack info.", required=False)
     parser.add_argument("-c", "--compare_only", dest="compare_only", action="store_true",
@@ -457,8 +482,8 @@ def _compare_parser(parser):
     parser.add_argument("-cm", "--cell_mapping", dest="cell_mapping", type=str, nargs='?', const=True,
                         help="<optional> The cell mapping file path.", required=False)
     parser.add_argument("-am", "--api_mapping", dest="api_mapping", type=str, nargs='?', const=True,
-                        help="<optional> The api mapping file path.", required=False)
+                        help="<optional> The api mapping file path.", required=False)
     parser.add_argument("-dm", "--data_mapping", dest="data_mapping", type=str,
                         help="<optional> The data mapping file path.", required=False)
-    parser.add_argument("-lm", "--layer_mapping", dest="layer_mapping", type=str,
+    parser.add_argument("-lm", "--layer_mapping", dest="layer_mapping", type=str, nargs='?', const=True,
                         help="<optional> The layer mapping file path.", required=False)

mindstudio-probe 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl

mindstudio-probe 1.1.0py3-none-any.whl → 1.1.1py3-none-any.whl