PyPI - mindstudio-probe - Versions diffs - 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl - Mend

mindstudio-probe 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (220)

{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/METADATA +5 -5
mindstudio_probe-1.1.1.dist-info/RECORD +341 -0
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/entry_points.txt +0 -1
msprobe/README.md +39 -3
msprobe/config.json +1 -3
msprobe/core/advisor/advisor.py +8 -3
msprobe/core/common/const.py +113 -13
msprobe/core/common/exceptions.py +25 -3
msprobe/core/common/file_utils.py +150 -26
msprobe/core/common/inplace_op_checker.py +15 -0
msprobe/core/common/log.py +27 -9
msprobe/core/common/utils.py +182 -69
msprobe/core/common_config.py +44 -15
msprobe/core/compare/acc_compare.py +207 -142
msprobe/core/compare/check.py +2 -5
msprobe/core/compare/compare_cli.py +21 -4
msprobe/core/compare/highlight.py +124 -55
msprobe/core/compare/layer_mapping/__init__.py +19 -0
msprobe/core/compare/layer_mapping/data_scope_parser.py +235 -0
msprobe/core/compare/layer_mapping/layer_mapping.py +242 -0
msprobe/core/compare/layer_mapping/postprocess_pass.py +94 -0
msprobe/core/compare/npy_compare.py +52 -23
msprobe/core/compare/utils.py +272 -247
msprobe/core/data_dump/data_collector.py +13 -11
msprobe/core/data_dump/data_processor/base.py +46 -16
msprobe/core/data_dump/data_processor/mindspore_processor.py +4 -4
msprobe/core/data_dump/data_processor/pytorch_processor.py +156 -59
msprobe/core/data_dump/scope.py +113 -34
msprobe/core/grad_probe/constant.py +27 -13
msprobe/core/grad_probe/grad_compare.py +18 -1
msprobe/core/grad_probe/utils.py +30 -2
msprobe/core/overflow_check/abnormal_scene.py +185 -0
msprobe/core/overflow_check/api_info.py +55 -0
msprobe/core/overflow_check/checker.py +138 -0
msprobe/core/overflow_check/filter.py +157 -0
msprobe/core/overflow_check/ignore_rules.yaml +55 -0
msprobe/core/overflow_check/level.py +22 -0
msprobe/core/overflow_check/utils.py +28 -0
msprobe/docs/01.installation.md +10 -0
msprobe/docs/02.config_introduction.md +49 -22
msprobe/docs/03.config_examples.md +2 -9
msprobe/docs/04.kernel_dump_PyTorch.md +73 -0
msprobe/docs/05.data_dump_PyTorch.md +3 -1
msprobe/docs/06.data_dump_MindSpore.md +157 -90
msprobe/docs/07.accuracy_checker_PyTorch.md +12 -12
msprobe/docs/08.accuracy_checker_online_PyTorch.md +1 -6
msprobe/docs/09.accuracy_checker_MindSpore.md +44 -8
msprobe/docs/10.accuracy_compare_PyTorch.md +19 -13
msprobe/docs/11.accuracy_compare_MindSpore.md +104 -13
msprobe/docs/12.overflow_check_PyTorch.md +1 -1
msprobe/docs/13.overflow_check_MindSpore.md +6 -6
msprobe/docs/15.free_benchmarking_PyTorch.md +4 -5
msprobe/docs/16.free_benchmarking_MindSpore.md +56 -37
msprobe/docs/17.grad_probe.md +5 -6
msprobe/docs/19.monitor.md +468 -0
msprobe/docs/20.monitor_performance_baseline.md +52 -0
msprobe/docs/21.visualization_PyTorch.md +386 -0
msprobe/docs/22.visualization_MindSpore.md +384 -0
msprobe/docs/23.tool_function_introduction.md +28 -0
msprobe/docs/FAQ.md +3 -0
msprobe/docs/data_dump_Mindspore/dynamic_graph_quick_start_example.md +211 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/mindspore/__init__.py +15 -0
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +113 -145
msprobe/mindspore/api_accuracy_checker/api_info.py +21 -6
msprobe/mindspore/api_accuracy_checker/api_runner.py +43 -18
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +21 -7
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +77 -0
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +63 -1
msprobe/mindspore/api_accuracy_checker/compute_element.py +59 -24
msprobe/mindspore/api_accuracy_checker/data_manager.py +264 -0
msprobe/mindspore/api_accuracy_checker/main.py +27 -3
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +206 -0
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +58 -0
msprobe/mindspore/api_accuracy_checker/type_mapping.py +22 -5
msprobe/mindspore/api_accuracy_checker/utils.py +34 -17
msprobe/mindspore/cell_processor.py +33 -12
msprobe/mindspore/common/const.py +33 -13
msprobe/mindspore/common/log.py +5 -9
msprobe/mindspore/common/utils.py +43 -4
msprobe/mindspore/compare/distributed_compare.py +22 -22
msprobe/mindspore/compare/ms_compare.py +271 -248
msprobe/mindspore/compare/ms_graph_compare.py +81 -47
msprobe/mindspore/debugger/debugger_config.py +4 -1
msprobe/mindspore/debugger/precision_debugger.py +7 -1
msprobe/mindspore/dump/dump_tool_factory.py +3 -1
msprobe/mindspore/dump/hook_cell/api_registry.py +12 -2
msprobe/mindspore/dump/hook_cell/primitive_hooks.py +13 -16
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +25 -0
msprobe/mindspore/dump/jit_dump.py +17 -5
msprobe/mindspore/dump/kernel_graph_dump.py +2 -4
msprobe/mindspore/dump/kernel_kbyk_dump.py +2 -4
msprobe/mindspore/dym_loader/hook_dynamic_loader.cc +140 -0
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +53 -0
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +145 -39
msprobe/mindspore/free_benchmark/common/handler_params.py +1 -2
msprobe/mindspore/free_benchmark/common/utils.py +19 -4
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -204
msprobe/mindspore/free_benchmark/handler/base_handler.py +3 -3
msprobe/mindspore/free_benchmark/handler/check_handler.py +4 -5
msprobe/mindspore/free_benchmark/handler/fix_handler.py +4 -4
msprobe/mindspore/free_benchmark/handler/handler_factory.py +4 -4
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +2 -2
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +15 -6
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +4 -4
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +2 -2
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +13 -6
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +2 -2
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +2 -2
msprobe/mindspore/grad_probe/global_context.py +28 -8
msprobe/mindspore/grad_probe/grad_analyzer.py +27 -13
msprobe/mindspore/grad_probe/grad_monitor.py +16 -1
msprobe/mindspore/grad_probe/grad_stat_csv.py +33 -5
msprobe/mindspore/grad_probe/hook.py +24 -10
msprobe/mindspore/grad_probe/utils.py +18 -5
msprobe/mindspore/ms_config.py +22 -15
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +2 -4
msprobe/mindspore/runtime.py +15 -0
msprobe/mindspore/service.py +36 -30
msprobe/mindspore/task_handler_factory.py +15 -0
msprobe/msprobe.py +24 -7
msprobe/pytorch/__init__.py +3 -2
msprobe/pytorch/api_accuracy_checker/common/config.py +62 -0
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +3 -4
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +9 -0
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +454 -0
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +365 -0
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +6 -1
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +19 -14
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +13 -9
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +77 -53
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +15 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +9 -24
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +4 -12
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +9 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +3 -11
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +2 -2
msprobe/pytorch/bench_functions/confusion_transpose.py +5 -1
msprobe/pytorch/bench_functions/matmul_backward.py +12 -0
msprobe/pytorch/bench_functions/npu_fusion_attention.py +100 -6
msprobe/pytorch/bench_functions/rotary_mul.py +4 -0
msprobe/pytorch/bench_functions/swiglu.py +10 -2
msprobe/pytorch/common/parse_json.py +6 -6
msprobe/pytorch/common/utils.py +56 -5
msprobe/pytorch/compare/distributed_compare.py +8 -9
msprobe/pytorch/compare/pt_compare.py +8 -6
msprobe/pytorch/debugger/debugger_config.py +19 -15
msprobe/pytorch/dump/kernel_dump/kernel_config.py +33 -0
msprobe/pytorch/free_benchmark/common/constant.py +15 -0
msprobe/pytorch/free_benchmark/common/counter.py +15 -0
msprobe/pytorch/free_benchmark/common/enums.py +15 -0
msprobe/pytorch/free_benchmark/common/params.py +8 -1
msprobe/pytorch/free_benchmark/common/utils.py +26 -4
msprobe/pytorch/free_benchmark/compare/grad_saver.py +20 -3
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +2 -0
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +3 -1
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +6 -4
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +2 -0
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +4 -0
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +10 -0
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +6 -5
msprobe/pytorch/grad_probe/grad_monitor.py +23 -6
msprobe/pytorch/grad_probe/grad_stat_csv.py +40 -10
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1 -0
msprobe/pytorch/hook_module/wrap_functional.py +14 -12
msprobe/pytorch/module_processer.py +2 -5
msprobe/pytorch/monitor/anomaly_analyse.py +201 -0
msprobe/pytorch/monitor/anomaly_detect.py +340 -0
msprobe/pytorch/monitor/distributed/__init__.py +0 -0
msprobe/pytorch/monitor/distributed/distributed_ops.yaml +19 -0
msprobe/pytorch/monitor/distributed/stack_blacklist.yaml +5 -0
msprobe/pytorch/monitor/distributed/wrap_distributed.py +272 -0
msprobe/pytorch/monitor/features.py +108 -0
msprobe/pytorch/monitor/module_hook.py +870 -0
msprobe/pytorch/monitor/module_metric.py +193 -0
msprobe/pytorch/monitor/module_spec_verifier.py +93 -0
msprobe/pytorch/monitor/optimizer_collect.py +295 -0
msprobe/pytorch/monitor/unittest/__init__.py +0 -0
msprobe/pytorch/monitor/unittest/test_monitor.py +145 -0
msprobe/pytorch/monitor/utils.py +250 -0
msprobe/pytorch/monitor/visualizer.py +59 -0
msprobe/pytorch/online_dispatch/__init__.py +2 -3
msprobe/pytorch/online_dispatch/compare.py +29 -38
msprobe/pytorch/online_dispatch/dispatch.py +50 -25
msprobe/pytorch/online_dispatch/dump_compare.py +21 -9
msprobe/pytorch/online_dispatch/single_compare.py +53 -32
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +1 -1
msprobe/pytorch/online_dispatch/utils.py +49 -21
msprobe/pytorch/parse_tool/lib/compare.py +12 -18
msprobe/pytorch/parse_tool/lib/config.py +1 -1
msprobe/pytorch/parse_tool/lib/parse_tool.py +1 -2
msprobe/pytorch/parse_tool/lib/utils.py +16 -35
msprobe/pytorch/parse_tool/lib/visualization.py +2 -0
msprobe/pytorch/pt_config.py +31 -8
msprobe/pytorch/service.py +15 -5
msprobe/visualization/__init__.py +14 -0
msprobe/visualization/builder/__init__.py +14 -0
msprobe/visualization/builder/graph_builder.py +165 -0
msprobe/visualization/builder/msprobe_adapter.py +205 -0
msprobe/visualization/compare/__init__.py +14 -0
msprobe/visualization/compare/graph_comparator.py +130 -0
msprobe/visualization/compare/mode_adapter.py +211 -0
msprobe/visualization/graph/__init__.py +14 -0
msprobe/visualization/graph/base_node.py +124 -0
msprobe/visualization/graph/graph.py +200 -0
msprobe/visualization/graph/node_colors.py +95 -0
msprobe/visualization/graph/node_op.py +39 -0
msprobe/visualization/graph_service.py +214 -0
msprobe/visualization/utils.py +232 -0
mindstudio_probe-1.1.0.dist-info/RECORD +0 -287
msprobe/docs/04.acl_config_examples.md +0 -78
msprobe/mindspore/compare/layer_mapping.py +0 -146
msprobe/mindspore/compare/modify_mapping.py +0 -107
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +0 -57
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +0 -122
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/LICENSE +0 -0
{mindstudio_probe-1.1.0.dist-info → mindstudio_probe-1.1.1.dist-info}/top_level.txt +0 -0
/msprobe/{mindspore/free_benchmark/decorator → pytorch/monitor}/__init__.py +0 -0

msprobe/core/compare/layer_mapping/layer_mapping.py ADDED Viewed

@@ -0,0 +1,242 @@
+# Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
+# All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0  (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import os
+from msprobe.core.common.const import CompareConst, Const
+from msprobe.core.common.file_utils import load_json, load_yaml, save_yaml
+from msprobe.core.common.utils import (add_time_with_yaml,
+                                       detect_framework_by_dump_json,
+                                       get_stack_construct_by_dump_json_path)
+from msprobe.core.compare.layer_mapping.data_scope_parser import get_dump_data_items
+from msprobe.core.compare.utils import read_op
+class LayerTrie:
+    def __init__(self, type_name, framework=None):
+        self.type_name = type_name
+        self.data_items = []
+        self.children = {}
+        self.framework = framework
+    def __repr__(self):
+        return f"Layer(type_name={self.type_name}, data_number={len(self.data_items)})"
+    def get(self, name):
+        return self.children.get(name)
+    def insert(self, data_item):
+        parts = data_item.full_scope.split(Const.SEP)
+        node = self
+        scope_name_list = parts[Const.RIGHT_MOVE_INDEX:]
+        for name in scope_name_list:
+            if name not in node.children:
+                node.children[name] = LayerTrie(name, data_item.framework)
+            node = node.children[name]
+        node.data_items.append(data_item)
+        node.type_name = data_item.type_name
+    def query_data(self, scope, index, default_value=None):
+        parts = scope.split(Const.SEP)
+        node = self
+        scope_name_list = parts[1:]
+        for name in scope_name_list:
+            if name not in node.children:
+                return default_value
+            node = node.children[name]
+        if index >= len(node.data_items):
+            return default_value
+        return node.data_items[index]
+    def save_to_yaml(self, output_path):
+        result = {f"{self.type_name} @ {self}": self.convert_to_dict(self)}
+        file_name = add_time_with_yaml(f"{self.framework}_tree")
+        file_path = os.path.join(os.path.realpath(output_path), file_name)
+        save_yaml(file_path, result)
+    def convert_to_dict(self, node):
+        result = {}
+        result["data_item"] = [node.data_name for node in node.data_items]
+        for child_key, child_node in node.children.items():
+            key = f"{child_key} @ {child_node}"
+            result[key] = self.convert_to_dict(child_node)
+        return result
+def convert_scope(layer_trie, data_item, mapping=None):
+    if not mapping:
+        mapping = {}
+    new_scope = Const.TOP_LAYER
+    scope_list = data_item.full_scope.split(Const.SEP)
+    cur_node = layer_trie
+    idx = 0
+    while idx < len(scope_list) - 1:
+        child_name = scope_list[idx + 1]
+        type_name = cur_node.type_name
+        prefix_mapping = mapping.get(type_name, {})
+        mapping_list = prefix_mapping.get(child_name, [])
+        mapping_list.append((child_name, child_name, 1))
+        step = 1
+        for origin, target, level in mapping_list:
+            if Const.SEP.join(scope_list[idx + 1: idx + level + 1]) == origin:
+                new_scope = new_scope + Const.SEP + target
+                step = level
+                break
+        for _ in range(step):
+            child_node = cur_node.get(scope_list[idx + 1])
+            cur_node = child_node
+            idx += 1
+    index = -1
+    for idx, child in enumerate(cur_node.data_items):
+        if data_item.data_name == child.data_name:
+            index = idx
+    return new_scope, index
+def get_data_items_and_tree(dump_json_path, output_path):
+    framework = detect_framework_by_dump_json(dump_json_path)
+    stack, construct = get_stack_construct_by_dump_json_path(dump_json_path)
+    dump = load_json(dump_json_path)
+    dump_data_items = get_dump_data_items(dump, stack, construct, framework, output_path)
+    root = LayerTrie(Const.TOP_LAYER, framework)
+    for data_item in dump_data_items:
+        root.insert(data_item)
+    if output_path:
+        root.save_to_yaml(output_path)
+    return dump_data_items, root
+def convert_data_item(npu_tree, bench_tree, npu_data_item, mapping):
+    new_scope, index = convert_scope(npu_tree, npu_data_item, mapping)
+    bench_data_item = bench_tree.query_data(new_scope, index)
+    return bench_data_item
+def update_keys_in_place(d):
+    """
+    This function is used to compare and maintain compatibility between the old and new versions.
+    In the old version, 'Cell' was used as the top layer name, while the new version uses 'TopLayer'.
+    """
+    cell_value = d.pop(Const.CELL, None)
+    if cell_value is not None:
+        d[Const.TOP_LAYER] = cell_value
+def preprocess_layer_mapping(mapping):
+    """
+    before:
+        {'A': {'a.b.c': 'new_c',
+               'a.demo': 'new_demo',
+               'z': 'new_z',
+               'd.e': 'e'}}
+    after:
+        {'A': {'a': [('a.b.c', 'new_c', 3), ('a.demo', 'new_demo', 2)],
+               'z': [('z', 'new_z', 1)],
+               'd': [('d.e', 'e', 2)]}}
+    """
+    update_keys_in_place(mapping)
+    final_mapping = {}
+    for type_name, name_map in mapping.items():
+        final_mapping[type_name] = {}
+        for key, value in name_map.items():
+            key_list = key.split('.')
+            prefix = key_list[0]  # 取前缀
+            key_len = len(key_list)
+            if prefix not in final_mapping[type_name]:
+                final_mapping[type_name][prefix] = []
+            final_mapping[type_name][prefix].append((key, value, key_len))
+        # 前缀映射列表按规则长度排序
+        for prefix in final_mapping[type_name]:
+            final_mapping[type_name][prefix].sort(key=lambda x: -x[-1])
+    return final_mapping
+def convert_data_items(npu_tree, bench_tree, npu_data_items, mapping):
+    mapping = preprocess_layer_mapping(mapping)
+    api_mapping = {}
+    for npu_data_item in npu_data_items:
+        bench_data_item = convert_data_item(npu_tree, bench_tree, npu_data_item, mapping)
+        bench_name = bench_data_item.data_name if bench_data_item else CompareConst.N_A
+        npu_name = npu_data_item.data_name
+        api_mapping[npu_name] = bench_name
+    return api_mapping
+def generate_api_mapping_by_layer_mapping(npu_json_path, bench_json_path, layer_mapping_path=None, output_path=None):
+    npu_data_items, npu_root = get_data_items_and_tree(npu_json_path, output_path)
+    _, bench_root = get_data_items_and_tree(bench_json_path, output_path)
+    if isinstance(layer_mapping_path, str):
+        mapping = load_yaml(layer_mapping_path)
+    else:
+        mapping = {}
+    api_mapping = convert_data_items(npu_root, bench_root, npu_data_items, mapping)
+    if output_path:
+        file_name = add_time_with_yaml("api_mapping")
+        file_path = os.path.join(os.path.realpath(output_path), file_name)
+        save_yaml(file_path, api_mapping)
+    return api_mapping
+def generate_data_mapping(npu_json_path, bench_json_path, api_mapping, output_path=None):
+    def read_full_op_names(data, op_name):
+        op_parsed_list = read_op(data.get(op_name, {}), op_name)
+        full_op_names = [op_parsed.get('full_op_name') for op_parsed in op_parsed_list]
+        return full_op_names
+    def generate_op_data_mapping(npu_op_name, npu_full_op_names, bench_op_name, bench_full_op_names):
+        suffix_to_full_op_name = {}
+        op_data_mapping = {}
+        for bench_full_op_name in bench_full_op_names:
+            suffix = bench_full_op_name[len(bench_op_name):]
+            suffix_to_full_op_name[suffix] = bench_full_op_name
+        for npu_full_op_name in npu_full_op_names:
+            suffix = npu_full_op_name[len(npu_op_name):]
+            op_data_mapping[npu_full_op_name] = suffix_to_full_op_name.get(suffix, CompareConst.N_A)
+        return op_data_mapping
+    npu_data = load_json(npu_json_path).get("data", {})
+    bench_data = load_json(bench_json_path).get("data", {})
+    data_mapping = {}
+    for npu_op_name, bench_op_name in api_mapping.items():
+        if not npu_op_name:
+            continue
+        npu_full_op_names = read_full_op_names(npu_data, npu_op_name)
+        bench_full_op_names = read_full_op_names(bench_data, bench_op_name)
+        mapping = generate_op_data_mapping(npu_op_name, npu_full_op_names, bench_op_name, bench_full_op_names)
+        data_mapping.update(mapping)
+    if output_path:
+        file_name = add_time_with_yaml("data_mapping")
+        file_path = os.path.join(os.path.realpath(output_path), file_name)
+        save_yaml(file_path, data_mapping)
+    return data_mapping
+def generate_data_mapping_by_layer_mapping(input_param, layer_mapping_path=None, output_path=None):
+    npu_json_path = input_param.get("npu_json_path")
+    bench_json_path = input_param.get("bench_json_path")
+    api_mapping = generate_api_mapping_by_layer_mapping(
+        npu_json_path, bench_json_path, layer_mapping_path)
+    data_mapping = generate_data_mapping(
+        npu_json_path, bench_json_path, api_mapping, output_path)
+    return data_mapping

msprobe/core/compare/layer_mapping/postprocess_pass.py ADDED Viewed

@@ -0,0 +1,94 @@
+# Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
+# All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0  (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+import re
+import math
+from msprobe.core.common.const import Const
+def postprocess_pass(data_items, name2item):
+    backward_pass(data_items, name2item)
+    renumber_index_pass(data_items, "ParallelTransformer", "layers")
+def backward_pass(data_items, name2item):
+    # 处理反向数据，反向无栈信息，沿用正向数据栈信息
+    for data_item in data_items:
+        data_name_list = data_item.data_name.split(Const.SEP)
+        if not data_name_list:
+            continue
+        if Const.BACKWARD in data_name_list[Const.SCOPE_DIRECTION_INDEX :]:
+            data_name_list[Const.SCOPE_DIRECTION_INDEX :] = [
+                s.replace(Const.BACKWARD, Const.FORWARD) for s in data_name_list[Const.SCOPE_DIRECTION_INDEX :]
+            ]
+            forward_name = Const.SEP.join(data_name_list)
+            forward_item = name2item.get(forward_name, None)
+            if not forward_item:
+                continue
+            data_item.stack_scope = forward_item.stack_scope
+            data_item.full_scope = forward_item.full_scope
+            data_item.layer_scope = forward_item.layer_scope
+def extract_next_item_last_number(data, prefix, default_result=None):
+    result = default_result
+    match = re.search(rf"^{re.escape(prefix)}\.(\S+?)(?:\.|$)", data)
+    if match:
+        next_item = match.group(1)
+        numbers = re.findall(r"\d+", next_item)
+        if numbers:
+            result = int(numbers[-1])
+    return result
+def replace_next_item_index(full_scope, prefix, index):
+    if math.isinf(index):
+        return full_scope
+    prefix_pattern = rf"^{re.escape(prefix)}\."
+    result = full_scope
+    match = re.search(rf"{prefix_pattern}(\S+?)(?:\.|$)", full_scope)
+    if match:
+        next_item = match.group(1)
+        pattern = rf"{prefix_pattern}{re.escape(next_item)}"
+        result = re.sub(pattern, f"{prefix}.{index}", full_scope, count=1)
+    return result
+def renumber_index_pass(data_items, type_name, suffix=None):
+    """
+    该函数为解决并行切分场景中编号不一致的比对问题。例如在MindSpore中ParallelTransformer层的PP切分场景，
+    MindSpore中的layers的成员编号是全局的，而在PyTorch中编号为局部的。
+    为适配此种场景，对指定层的索引进行重新编号，以确保在后续处理阶段序号对齐。
+    """
+    prefix_dict = {}  # 保存类型为type_name的前缀和最小编号的映射
+    for data_item in data_items:
+        if data_item.type_name == type_name:
+            prefix = f"{data_item.full_scope}.{suffix}" if suffix else data_item.layer_scope
+            prefix_dict[prefix] = math.inf
+    # 计算前缀对应的最小编号
+    for prefix in prefix_dict:
+        for data_item in data_items:
+            res = extract_next_item_last_number(data_item.full_scope, prefix, math.inf)
+            prefix_dict[prefix] = min(prefix_dict[prefix], res)
+    # 重新编号
+    for prefix, min_index in prefix_dict.items():
+        for data_item in data_items:
+            full_scope = data_item.full_scope
+            abs_index = extract_next_item_last_number(data_item.full_scope, prefix, math.inf)
+            rel_index = abs_index - min_index
+            full_scope = replace_next_item_index(full_scope, prefix, rel_index)
+            data_item.full_scope = full_scope

msprobe/core/compare/npy_compare.py CHANGED Viewed

@@ -14,18 +14,32 @@
 # limitations under the License.
 import abc
 import numpy as np
 from msprobe.core.common.utils import format_value
 from msprobe.core.common.const import Const, CompareConst
 from msprobe.core.common.log import logger
+from msprobe.core.common.utils import CompareException
 def handle_inf_nan(n_value, b_value):
+    def convert_to_float(value):
+        try:
+            if isinstance(value, np.ndarray):
+                return value.astype(float)
+            else:
+                return float(value)
+        except ValueError as e:
+            logger.error('\n'.join(e.args))
+            raise CompareException(CompareException.INVALID_DATA_ERROR) from e
+    n_value_convert, b_value_convert = convert_to_float(n_value), convert_to_float(b_value)
     """处理inf和nan的数据"""
-    n_inf = np.isinf(n_value)
-    b_inf = np.isinf(b_value)
-    n_nan = np.isnan(n_value)
-    b_nan = np.isnan(b_value)
+    n_inf = np.isinf(n_value_convert)
+    b_inf = np.isinf(b_value_convert)
+    n_nan = np.isnan(n_value_convert)
+    b_nan = np.isnan(b_value_convert)
     n_invalid = np.any(n_inf) or np.any(n_nan)
     b_invalid = np.any(b_inf) or np.any(b_nan)
     if n_invalid or b_invalid:
@@ -50,7 +64,11 @@ def get_error_type(n_value, b_value, error_flag):
     if not n_value.shape:  # 判断数据是否为标量
         return n_value, b_value, False
-    n_value, b_value = handle_inf_nan(n_value, b_value)  # 判断是否有nan/inf数据
+    try:
+        n_value, b_value = handle_inf_nan(n_value, b_value)  # 判断是否有nan/inf数据
+    except CompareException:
+        logger.error('Numpy data is unreadable, please check!')
+        return CompareConst.UNREADABLE, CompareConst.UNREADABLE, True
     if n_value is CompareConst.NAN or b_value is CompareConst.NAN:
         return CompareConst.NAN, CompareConst.NAN, True
     return n_value, b_value, False
@@ -73,7 +91,9 @@ def get_error_message(n_value, b_value, npu_op_name, error_flag, error_file=None
     """获取异常情况的错误信息"""
     if error_flag:
         if n_value == CompareConst.READ_NONE:
-            if error_file:
+            if error_file == 'no_bench_data':
+                return 'Bench does not have data file.'
+            elif error_file is not None:
                 return "Dump file: {} not found.".format(error_file)
             return CompareConst.NO_BENCH
         if n_value == CompareConst.NONE:
@@ -82,6 +102,8 @@ def get_error_message(n_value, b_value, npu_op_name, error_flag, error_file=None
             return "Shape of NPU and bench Tensor do not match. Skipped."
         if n_value == CompareConst.NAN:
             return "The position of inf or nan in NPU and bench Tensor do not match."
+        if n_value == CompareConst.UNREADABLE:
+            return "The npy data is unable to be read or compared, please check dump data files."
     else:
         if not n_value.shape:
             return "This is type of scalar data, can not compare."
@@ -109,7 +131,11 @@ def npy_data_check(n_value, b_value):
             error_message += "Dtype of NPU and bench Tensor do not match. Skipped.\n"
     if not error_message:
-        n_value, b_value = handle_inf_nan(n_value, b_value)  # 判断是否有 nan/inf 数据
+        try:
+            n_value, b_value = handle_inf_nan(n_value, b_value)  # 判断是否有nan/inf数据
+        except CompareException:
+            logger.error('Numpy data is unreadable, please check!')
+            return True, 'Numpy data is unreadable, please check!'
         # handle_inf_nan 会返回'Nan'或ndarray类型，使用类型判断是否存在无法处理的nan/inf数据
         if not isinstance(n_value, np.ndarray) or not isinstance(b_value, np.ndarray):
             error_message += "The position of inf or nan in NPU and bench Tensor do not match.\n"
@@ -160,14 +186,14 @@ class GetCosineSimilarity(TensorComparisonBasic):
     def apply(self, n_value, b_value, error_flag, relative_err=None):
         if error_flag:
-            if n_value == CompareConst.READ_NONE:
-                return CompareConst.NONE, ''
+            if n_value == CompareConst.READ_NONE or n_value == CompareConst.UNREADABLE:
+                return CompareConst.UNSUPPORTED, ''
             if n_value == CompareConst.NONE:
                 return CompareConst.UNSUPPORTED, ''
             if n_value == CompareConst.SHAPE_UNMATCH:
                 return CompareConst.SHAPE_UNMATCH, ''
             if n_value == CompareConst.NAN:
-                return "N/A", ''
+                return CompareConst.N_A, ''
         if not n_value.shape:
             return CompareConst.UNSUPPORTED, ''
@@ -198,17 +224,20 @@ class GetMaxAbsErr(TensorComparisonBasic):
     """计算最大绝对误差"""
     def apply(self, n_value, b_value, error_flag, relative_err=None):
         if error_flag:
-            if n_value == CompareConst.READ_NONE:
-                return CompareConst.NONE, ""
+            if n_value == CompareConst.READ_NONE or n_value == CompareConst.UNREADABLE:
+                return CompareConst.UNSUPPORTED, ""
             if n_value == CompareConst.NONE:
                 return 0, ""
             if n_value == CompareConst.SHAPE_UNMATCH:
                 return CompareConst.SHAPE_UNMATCH, ""
             if n_value == CompareConst.NAN:
-                return "N/A", ""
+                return CompareConst.N_A, ""
         temp_res = n_value - b_value
         max_value = np.max(np.abs(temp_res))
+        if np.isnan(max_value):
+            message = 'Cannot compare by MaxRelativeError, the data contains nan/inf/-inf in dump data.'
+            return CompareConst.NAN, message
         return format_value(max_value), ""
@@ -228,20 +257,20 @@ class GetMaxRelativeErr(TensorComparisonBasic):
     """计算最大相对误差"""
     def apply(self, n_value, b_value, error_flag, relative_err=None):
         if error_flag:
-            if n_value == CompareConst.READ_NONE:
-                return CompareConst.NONE, ''
+            if n_value == CompareConst.READ_NONE or n_value == CompareConst.UNREADABLE:
+                return CompareConst.UNSUPPORTED, ''
             if n_value == CompareConst.NONE:
                 return 0, ''
             if n_value == CompareConst.SHAPE_UNMATCH:
                 return CompareConst.SHAPE_UNMATCH, ''
             if n_value == CompareConst.NAN:
-                return "N/A", ''
+                return CompareConst.N_A, ''
         if relative_err is None:
             relative_err = get_relative_err(n_value, b_value)
         max_relative_err = np.max(np.abs(relative_err))
         if np.isnan(max_relative_err):
-            message = 'Cannot compare by MaxRelativeError, the data contains nan in dump data.'
+            message = 'Cannot compare by MaxRelativeError, the data contains nan/inf/-inf in dump data.'
             return CompareConst.NAN, message
         return format_value(max_relative_err), ''
@@ -250,14 +279,14 @@ class GetThousandErrRatio(TensorComparisonBasic):
     """计算相对误差小于千分之一的比例"""
     def apply(self, n_value, b_value, error_flag, relative_err=None):
         if error_flag:
-            if n_value == CompareConst.READ_NONE:
-                return CompareConst.NONE, ""
+            if n_value == CompareConst.READ_NONE or n_value == CompareConst.UNREADABLE:
+                return CompareConst.UNSUPPORTED, ""
             if n_value == CompareConst.NONE:
                 return 0, ""
             if n_value == CompareConst.SHAPE_UNMATCH:
                 return CompareConst.SHAPE_UNMATCH, ""
             if n_value == CompareConst.NAN:
-                return "N/A", ""
+                return CompareConst.N_A, ""
         if not n_value.shape:
             return CompareConst.NAN, ""
@@ -272,14 +301,14 @@ class GetFiveThousandErrRatio(TensorComparisonBasic):
     """计算相对误差小于千分之五的比例"""
     def apply(self, n_value, b_value, error_flag, relative_err=None):
         if error_flag:
-            if n_value == CompareConst.READ_NONE:
-                return CompareConst.NONE, ""
+            if n_value == CompareConst.READ_NONE or n_value == CompareConst.UNREADABLE:
+                return CompareConst.UNSUPPORTED, ""
             if n_value == CompareConst.NONE:
                 return 0, ""
             if n_value == CompareConst.SHAPE_UNMATCH:
                 return CompareConst.SHAPE_UNMATCH, ""
             if n_value == CompareConst.NAN:
-                return "N/A", ""
+                return CompareConst.N_A, ""
         if not n_value.shape:
             return CompareConst.NAN, ""

mindstudio-probe 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl

mindstudio-probe 1.1.0__py3-none-any.whl → 1.1.1__py3-none-any.whl