PyPI - mindstudio-probe - Versions diffs - 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl - Mend

mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (278)

{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/LICENSE +201 -201
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/METADATA +36 -34
mindstudio_probe-1.1.0.dist-info/RECORD +287 -0
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/WHEEL +1 -1
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/entry_points.txt +1 -0
msprobe/README.md +131 -237
msprobe/__init__.py +16 -1
msprobe/{config/config.json → config.json} +47 -49
msprobe/core/advisor/advisor.py +124 -124
msprobe/core/advisor/advisor_const.py +58 -59
msprobe/core/advisor/advisor_result.py +58 -58
msprobe/core/common/const.py +402 -318
msprobe/core/common/exceptions.py +99 -99
msprobe/core/common/{file_check.py → file_utils.py} +523 -283
msprobe/core/common/inplace_op_checker.py +38 -0
msprobe/core/common/inplace_ops.yaml +251 -0
msprobe/core/common/log.py +86 -69
msprobe/core/common/utils.py +371 -616
msprobe/core/common_config.py +78 -71
msprobe/core/compare/acc_compare.py +472 -298
msprobe/core/compare/check.py +180 -95
msprobe/core/compare/compare_cli.py +69 -49
msprobe/core/compare/highlight.py +259 -222
msprobe/core/compare/multiprocessing_compute.py +174 -149
msprobe/core/compare/npy_compare.py +310 -295
msprobe/core/compare/utils.py +464 -429
msprobe/core/data_dump/data_collector.py +153 -144
msprobe/core/data_dump/data_processor/base.py +337 -293
msprobe/core/data_dump/data_processor/factory.py +76 -59
msprobe/core/data_dump/data_processor/mindspore_processor.py +192 -198
msprobe/core/data_dump/data_processor/pytorch_processor.py +383 -389
msprobe/core/data_dump/json_writer.py +117 -116
msprobe/core/data_dump/scope.py +194 -178
msprobe/core/grad_probe/constant.py +74 -70
msprobe/core/grad_probe/grad_compare.py +170 -175
msprobe/core/grad_probe/utils.py +77 -52
msprobe/docs/01.installation.md +99 -0
msprobe/docs/02.config_introduction.md +137 -0
msprobe/docs/03.config_examples.md +237 -0
msprobe/docs/04.acl_config_examples.md +78 -0
msprobe/docs/05.data_dump_PyTorch.md +326 -0
msprobe/docs/06.data_dump_MindSpore.md +285 -0
msprobe/docs/07.accuracy_checker_PyTorch.md +297 -0
msprobe/docs/08.accuracy_checker_online_PyTorch.md +238 -0
msprobe/docs/09.accuracy_checker_MindSpore.md +68 -0
msprobe/docs/10.accuracy_compare_PyTorch.md +327 -0
msprobe/docs/11.accuracy_compare_MindSpore.md +333 -0
msprobe/docs/12.overflow_check_PyTorch.md +79 -0
msprobe/docs/13.overflow_check_MindSpore.md +31 -0
msprobe/{pytorch/doc/parse_tool.md → docs/14.data_parse_PyTorch.md} +283 -286
msprobe/docs/15.free_benchmarking_PyTorch.md +170 -0
msprobe/docs/16.free_benchmarking_MindSpore.md +140 -0
msprobe/{doc/grad_probe/grad_probe.md → docs/17.grad_probe.md} +205 -207
msprobe/{pytorch/doc//321/205/320/254/320/270/321/207/342/225/221/342/224/220/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/206/320/277/320/244/321/205/320/277/342/225/243.md → docs/18.online_dispatch.md} +89 -90
msprobe/docs/FAQ.md +189 -0
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +146 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/mindspore/__init__.py +2 -1
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +278 -245
msprobe/mindspore/api_accuracy_checker/api_info.py +76 -69
msprobe/mindspore/api_accuracy_checker/api_runner.py +155 -151
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +196 -196
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +6 -0
msprobe/mindspore/api_accuracy_checker/compute_element.py +238 -223
msprobe/mindspore/api_accuracy_checker/main.py +8 -15
msprobe/mindspore/api_accuracy_checker/type_mapping.py +113 -113
msprobe/mindspore/api_accuracy_checker/utils.py +79 -62
msprobe/mindspore/cell_processor.py +58 -34
msprobe/mindspore/common/const.py +108 -87
msprobe/mindspore/common/log.py +37 -37
msprobe/mindspore/common/utils.py +97 -57
msprobe/mindspore/compare/distributed_compare.py +62 -75
msprobe/mindspore/compare/layer_mapping.py +146 -0
msprobe/mindspore/compare/modify_mapping.py +107 -0
msprobe/mindspore/compare/ms_compare.py +357 -117
msprobe/mindspore/compare/ms_graph_compare.py +364 -317
msprobe/mindspore/compare/ms_to_pt_api.yaml +399 -399
msprobe/mindspore/debugger/debugger_config.py +69 -74
msprobe/mindspore/debugger/precision_debugger.py +150 -107
msprobe/mindspore/dump/dump_tool_factory.py +50 -35
msprobe/mindspore/dump/hook_cell/api_registry.py +128 -104
msprobe/mindspore/dump/hook_cell/hook_cell.py +55 -53
msprobe/mindspore/dump/hook_cell/primitive_hooks.py +206 -0
msprobe/mindspore/dump/hook_cell/support_wrap_ops.yaml +994 -925
msprobe/mindspore/dump/hook_cell/wrap_api.py +121 -0
msprobe/mindspore/dump/jit_dump.py +96 -56
msprobe/mindspore/dump/kernel_graph_dump.py +75 -60
msprobe/mindspore/dump/kernel_kbyk_dump.py +79 -65
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +131 -116
msprobe/mindspore/free_benchmark/common/config.py +27 -12
msprobe/mindspore/free_benchmark/common/handler_params.py +32 -17
msprobe/mindspore/free_benchmark/common/utils.py +85 -71
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +842 -842
msprobe/mindspore/free_benchmark/decorator/dec_forward.py +57 -42
msprobe/mindspore/free_benchmark/decorator/decorator_factory.py +122 -107
msprobe/mindspore/free_benchmark/handler/base_handler.py +105 -90
msprobe/mindspore/free_benchmark/handler/check_handler.py +56 -41
msprobe/mindspore/free_benchmark/handler/fix_handler.py +51 -36
msprobe/mindspore/free_benchmark/handler/handler_factory.py +36 -21
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +82 -67
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +36 -21
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +78 -63
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +77 -0
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +49 -34
msprobe/mindspore/free_benchmark/perturbation/no_change.py +27 -12
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +44 -27
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +48 -33
msprobe/mindspore/grad_probe/global_context.py +100 -91
msprobe/mindspore/grad_probe/grad_analyzer.py +231 -231
msprobe/mindspore/grad_probe/grad_monitor.py +27 -27
msprobe/mindspore/grad_probe/grad_stat_csv.py +131 -131
msprobe/mindspore/grad_probe/hook.py +94 -92
msprobe/mindspore/grad_probe/utils.py +29 -28
msprobe/mindspore/ms_config.py +128 -126
msprobe/mindspore/overflow_check/kernel_graph_overflow_check.py +60 -45
msprobe/mindspore/overflow_check/overflow_check_tool_factory.py +49 -34
msprobe/mindspore/runtime.py +4 -4
msprobe/mindspore/service.py +297 -354
msprobe/mindspore/task_handler_factory.py +24 -24
msprobe/msprobe.py +105 -107
msprobe/pytorch/__init__.py +23 -4
msprobe/pytorch/api_accuracy_checker/common/config.py +70 -55
msprobe/pytorch/api_accuracy_checker/common/utils.py +246 -165
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +230 -213
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +632 -581
msprobe/pytorch/api_accuracy_checker/compare/api_precision_standard.yaml +132 -132
msprobe/pytorch/api_accuracy_checker/compare/api_precision_threshold.yaml +390 -390
msprobe/pytorch/api_accuracy_checker/compare/compare.py +416 -381
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +90 -73
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +265 -244
msprobe/pytorch/api_accuracy_checker/config.yaml +10 -10
msprobe/pytorch/api_accuracy_checker/run_ut/data_generate.py +370 -332
msprobe/pytorch/api_accuracy_checker/run_ut/multi_run_ut.py +221 -199
msprobe/pytorch/api_accuracy_checker/run_ut/run_overflow_check.py +150 -134
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut.py +518 -581
msprobe/pytorch/api_accuracy_checker/run_ut/run_ut_utils.py +213 -74
msprobe/pytorch/api_accuracy_checker/run_ut/torch_ut_setting.json +7 -4
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/attl.py +218 -202
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/client.py +370 -324
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/device_dispatch.py +227 -204
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/dump_dispatch.py +110 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/server.py +244 -218
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/torch_ops_config.yaml +63 -0
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/utils.py +44 -0
msprobe/pytorch/bench_functions/__init__.py +30 -15
msprobe/pytorch/bench_functions/apply_adam_w.py +43 -28
msprobe/pytorch/bench_functions/confusion_transpose.py +34 -19
msprobe/pytorch/bench_functions/fast_gelu.py +70 -55
msprobe/pytorch/bench_functions/layer_norm_eval.py +21 -6
msprobe/pytorch/bench_functions/linear.py +27 -12
msprobe/pytorch/bench_functions/matmul_backward.py +63 -48
msprobe/pytorch/bench_functions/npu_fusion_attention.py +538 -421
msprobe/pytorch/bench_functions/rms_norm.py +30 -15
msprobe/pytorch/bench_functions/rotary_mul.py +71 -52
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +41 -26
msprobe/pytorch/bench_functions/swiglu.py +70 -55
msprobe/pytorch/common/__init__.py +17 -2
msprobe/pytorch/common/compare_script.template +14 -14
msprobe/pytorch/common/log.py +33 -32
msprobe/pytorch/common/parse_json.py +54 -39
msprobe/pytorch/common/utils.py +310 -300
msprobe/pytorch/compare/distributed_compare.py +66 -66
msprobe/pytorch/compare/mapping.yaml +607 -607
msprobe/pytorch/compare/match.py +49 -33
msprobe/pytorch/compare/pt_compare.py +82 -40
msprobe/pytorch/debugger/debugger_config.py +108 -95
msprobe/pytorch/debugger/precision_debugger.py +173 -125
msprobe/pytorch/free_benchmark/__init__.py +23 -8
msprobe/pytorch/free_benchmark/common/constant.py +70 -70
msprobe/pytorch/free_benchmark/common/counter.py +71 -71
msprobe/pytorch/free_benchmark/common/enums.py +65 -37
msprobe/pytorch/free_benchmark/common/params.py +144 -129
msprobe/pytorch/free_benchmark/common/utils.py +118 -102
msprobe/pytorch/free_benchmark/compare/grad_saver.py +200 -179
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +119 -104
msprobe/pytorch/free_benchmark/main.py +120 -105
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +28 -13
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +56 -41
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +105 -90
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +119 -104
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +87 -63
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +83 -68
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +43 -28
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +60 -45
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +34 -19
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +256 -217
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +54 -39
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +38 -23
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +45 -30
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +185 -170
msprobe/pytorch/function_factory.py +91 -75
msprobe/pytorch/functional/module_dump.py +84 -0
msprobe/pytorch/grad_probe/grad_monitor.py +91 -90
msprobe/pytorch/grad_probe/grad_stat_csv.py +128 -128
msprobe/pytorch/hook_module/__init__.py +16 -1
msprobe/pytorch/hook_module/api_registry.py +166 -161
msprobe/pytorch/hook_module/hook_module.py +118 -120
msprobe/pytorch/hook_module/support_wrap_ops.yaml +1879 -1877
msprobe/pytorch/hook_module/utils.py +28 -29
msprobe/pytorch/hook_module/wrap_aten.py +111 -110
msprobe/pytorch/hook_module/wrap_distributed.py +77 -78
msprobe/pytorch/hook_module/wrap_functional.py +104 -105
msprobe/pytorch/hook_module/wrap_npu_custom.py +85 -84
msprobe/pytorch/hook_module/wrap_tensor.py +69 -71
msprobe/pytorch/hook_module/wrap_torch.py +84 -86
msprobe/pytorch/hook_module/wrap_vf.py +60 -62
msprobe/pytorch/module_processer.py +153 -138
msprobe/pytorch/online_dispatch/__init__.py +20 -20
msprobe/pytorch/online_dispatch/compare.py +235 -236
msprobe/pytorch/online_dispatch/dispatch.py +271 -271
msprobe/pytorch/online_dispatch/dump_compare.py +155 -156
msprobe/pytorch/online_dispatch/single_compare.py +391 -391
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +57 -49
msprobe/pytorch/online_dispatch/utils.py +127 -146
msprobe/pytorch/parse.py +19 -4
msprobe/pytorch/parse_tool/cli.py +31 -32
msprobe/pytorch/parse_tool/lib/compare.py +259 -271
msprobe/pytorch/parse_tool/lib/config.py +52 -52
msprobe/pytorch/parse_tool/lib/file_desc.py +31 -31
msprobe/pytorch/parse_tool/lib/interactive_cli.py +102 -102
msprobe/pytorch/parse_tool/lib/parse_exception.py +54 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +161 -158
msprobe/pytorch/parse_tool/lib/utils.py +320 -321
msprobe/pytorch/parse_tool/lib/visualization.py +85 -91
msprobe/pytorch/pt_config.py +317 -187
msprobe/pytorch/service.py +311 -252
mindstudio_probe-1.0.3.dist-info/RECORD +0 -272
msprobe/config/README.md +0 -539
msprobe/mindspore/doc/compare.md +0 -58
msprobe/mindspore/doc/dump.md +0 -217
msprobe/mindspore/dump/hook_cell/wrap_functional.py +0 -91
msprobe/mindspore/dump/hook_cell/wrap_tensor.py +0 -63
msprobe/pytorch/api_accuracy_checker/tensor_transport_layer/ssl_config.py +0 -10
msprobe/pytorch/doc/FAQ.md +0 -193
msprobe/pytorch/doc/api_accuracy_checker.md +0 -313
msprobe/pytorch/doc/api_accuracy_checker_online.md +0 -187
msprobe/pytorch/doc/dump.md +0 -260
msprobe/pytorch/doc/msprobe/321/207/342/226/223/342/225/233/321/205/342/225/221/320/266/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/206/320/245/342/226/221/321/206/320/235/320/276dump/321/206/320/260/320/227/321/205/320/227/320/226/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -182
msprobe/pytorch/doc/ptdbg_ascend_compare.md +0 -240
msprobe/pytorch/doc/ptdbg_ascend_overview.md +0 -68
msprobe/pytorch/doc/ptdbg_ascend_quickstart.md +0 -381
msprobe/pytorch/doc/run_overflow_check.md +0 -25
msprobe/pytorch/doc//321/206/320/247/320/260/321/206/320/260/320/227/321/206/320/255/320/226/321/205/342/225/226/320/265/321/205/320/225/342/225/226/321/205/320/254/342/225/221/321/206/320/251/320/277/321/211/320/272/320/234/321/210/320/277/320/221/321/205/320/242/320/234/321/206/320/220/320/267/321/210/320/223/342/225/234/321/205/320/257/342/225/221/321/207/342/225/221/342/224/220/321/206/320/232/320/265/321/205/320/241/320/232.md +0 -151
msprobe/pytorch/functional/data_processor.py +0 -0
msprobe/pytorch/functional/dump_module.py +0 -39
{mindstudio_probe-1.0.3.dist-info → mindstudio_probe-1.1.0.dist-info}/top_level.txt +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/BLOOM-7B_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_3.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_4.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_5.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_6.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_7.png +0 -0
/msprobe/{pytorch/doc → docs}/img/GPT-3_8.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_1.png +0 -0
/msprobe/{pytorch/doc → docs}/img/YOLOV5S_2.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/accuracy_checking_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_details.png +0 -0
/msprobe/{pytorch/doc → docs}/img/api_precision_compare_result.png +0 -0
/msprobe/{pytorch/doc → docs}/img/auto_analyze_log.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl.png +0 -0
/msprobe/{pytorch/doc → docs}/img/compare_result_pkl_md5.png.png +0 -0
/msprobe/{pytorch/doc → docs}/img/cpu_info.png +0 -0
/msprobe/{config → docs}/img/free_benchmark.png +0 -0
/msprobe/{doc/grad_probe/img/image-1.png → docs/img/grad_probe_image-1.png} +0 -0
/msprobe/{doc/grad_probe/img/image-2.png → docs/img/grad_probe_image-2.png} +0 -0
/msprobe/{doc/grad_probe/img/image-3.png → docs/img/grad_probe_image-3.png} +0 -0
/msprobe/{doc/grad_probe/img/image-4.png → docs/img/grad_probe_image-4.png} +0 -0
/msprobe/{doc/grad_probe/img/image.png → docs/img/grad_probe_image.png} +0 -0
/msprobe/{pytorch/doc → docs}/img/module_compare.png +0 -0

msprobe/core/data_dump/data_processor/factory.py CHANGED Viewed

@@ -1,59 +1,76 @@
-from msprobe.core.common.const import Const
-class DataProcessorFactory:
-    _data_processor = {}
-    _module_processor = {}
-    @classmethod
-    def register_processor(cls, framework, task, processor_class):
-        key = (framework, task)
-        cls._data_processor[key] = processor_class
-    @classmethod
-    def register_module_processor(cls, framework, processor_class):
-        cls._module_processor[framework] = processor_class
-    @classmethod
-    def get_module_processor(cls, framework):
-        processor_class = cls._module_processor.get(framework)
-        if not processor_class:
-            raise ValueError(f"ModuleProcesser not found for framework: {framework}")
-        return processor_class
-    @classmethod
-    def create_processor(cls, config, data_writer):
-        cls.register_processors(config.framework)
-        task = Const.KERNEL_DUMP if config.level == "L2" else config.task
-        key = (config.framework, task)
-        processor_class = cls._data_processor.get(key)
-        if not processor_class:
-            raise ValueError(f"Processor not found for framework: {config.framework}, task: {config.task}")
-        return processor_class(config, data_writer)
-    @classmethod
-    def register_processors(cls, framework):
-        if framework == Const.PT_FRAMEWORK:
-            from .pytorch_processor import (
-                StatisticsDataProcessor as PytorchStatisticsDataProcessor,
-                TensorDataProcessor as PytorchTensorDataProcessor,
-                OverflowCheckDataProcessor as PytorchOverflowCheckDataProcessor,
-                FreeBenchmarkDataProcessor as PytorchFreeBenchmarkDataProcessor,
-                KernelDumpDataProcessor as PytorchKernelDumpDataProcessor
-            )
-            from ....pytorch.module_processer import ModuleProcesser
-            cls.register_processor(Const.PT_FRAMEWORK, Const.STATISTICS, PytorchStatisticsDataProcessor)
-            cls.register_processor(Const.PT_FRAMEWORK, Const.TENSOR, PytorchTensorDataProcessor)
-            cls.register_processor(Const.PT_FRAMEWORK, Const.OVERFLOW_CHECK, PytorchOverflowCheckDataProcessor)
-            cls.register_processor(Const.PT_FRAMEWORK, Const.FREE_BENCHMARK, PytorchFreeBenchmarkDataProcessor)
-            cls.register_processor(Const.PT_FRAMEWORK, Const.KERNEL_DUMP, PytorchKernelDumpDataProcessor)
-            cls.register_module_processor(Const.PT_FRAMEWORK, ModuleProcesser)
-        elif framework == Const.MS_FRAMEWORK:
-            from .mindspore_processor import (
-                StatisticsDataProcessor as MindsporeStatisticsDataProcessor,
-                TensorDataProcessor as MindsporeTensorDataProcessor,
-                OverflowCheckDataProcessor as MindsporeOverflowCheckDataProcessor
-            )
-            cls.register_processor(Const.MS_FRAMEWORK, Const.STATISTICS, MindsporeStatisticsDataProcessor)
-            cls.register_processor(Const.MS_FRAMEWORK, Const.TENSOR, MindsporeTensorDataProcessor)
-            cls.register_processor(Const.MS_FRAMEWORK, Const.OVERFLOW_CHECK, MindsporeOverflowCheckDataProcessor)
+# Copyright (c) 2024-2024, Huawei Technologies Co., Ltd.
+# All rights reserved.
+#
+# Licensed under the Apache License, Version 2.0  (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+from msprobe.core.common.const import Const
+class DataProcessorFactory:
+    _data_processor = {}
+    _module_processor = {}
+    @classmethod
+    def register_processor(cls, framework, task, processor_class):
+        key = (framework, task)
+        cls._data_processor[key] = processor_class
+    @classmethod
+    def register_module_processor(cls, framework, processor_class):
+        cls._module_processor[framework] = processor_class
+    @classmethod
+    def get_module_processor(cls, framework):
+        processor_class = cls._module_processor.get(framework)
+        if not processor_class:
+            raise ValueError(f"ModuleProcesser not found for framework: {framework}")
+        return processor_class
+    @classmethod
+    def create_processor(cls, config, data_writer):
+        cls.register_processors(config.framework)
+        task = Const.KERNEL_DUMP if config.level == "L2" else config.task
+        key = (config.framework, task)
+        processor_class = cls._data_processor.get(key)
+        if not processor_class:
+            raise ValueError(f"Processor not found for framework: {config.framework}, task: {config.task}")
+        return processor_class(config, data_writer)
+    @classmethod
+    def register_processors(cls, framework):
+        if framework == Const.PT_FRAMEWORK:
+            from msprobe.core.data_dump.data_processor.pytorch_processor import (
+                StatisticsDataProcessor as PytorchStatisticsDataProcessor,
+                TensorDataProcessor as PytorchTensorDataProcessor,
+                OverflowCheckDataProcessor as PytorchOverflowCheckDataProcessor,
+                FreeBenchmarkDataProcessor as PytorchFreeBenchmarkDataProcessor,
+                KernelDumpDataProcessor as PytorchKernelDumpDataProcessor
+            )
+            from msprobe.pytorch.module_processer import ModuleProcesser
+            cls.register_processor(Const.PT_FRAMEWORK, Const.STATISTICS, PytorchStatisticsDataProcessor)
+            cls.register_processor(Const.PT_FRAMEWORK, Const.TENSOR, PytorchTensorDataProcessor)
+            cls.register_processor(Const.PT_FRAMEWORK, Const.OVERFLOW_CHECK, PytorchOverflowCheckDataProcessor)
+            cls.register_processor(Const.PT_FRAMEWORK, Const.FREE_BENCHMARK, PytorchFreeBenchmarkDataProcessor)
+            cls.register_processor(Const.PT_FRAMEWORK, Const.KERNEL_DUMP, PytorchKernelDumpDataProcessor)
+            cls.register_module_processor(Const.PT_FRAMEWORK, ModuleProcesser)
+        elif framework == Const.MS_FRAMEWORK:
+            from msprobe.core.data_dump.data_processor.mindspore_processor import (
+                StatisticsDataProcessor as MindsporeStatisticsDataProcessor,
+                TensorDataProcessor as MindsporeTensorDataProcessor,
+                OverflowCheckDataProcessor as MindsporeOverflowCheckDataProcessor
+            )
+            from msprobe.mindspore.cell_processor import CellProcessor
+            cls.register_processor(Const.MS_FRAMEWORK, Const.STATISTICS, MindsporeStatisticsDataProcessor)
+            cls.register_processor(Const.MS_FRAMEWORK, Const.TENSOR, MindsporeTensorDataProcessor)
+            cls.register_processor(Const.MS_FRAMEWORK, Const.OVERFLOW_CHECK, MindsporeOverflowCheckDataProcessor)
+            cls.register_module_processor(Const.MS_FRAMEWORK, CellProcessor)

msprobe/core/data_dump/data_processor/mindspore_processor.py CHANGED Viewed

@@ -1,198 +1,192 @@
-# Copyright 2024 Huawei Technologies Co., Ltd
-#
-# Licensed under the Apache License, Version 2.0 (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
-#
-# http://www.apache.org/licenses/LICENSE-2.0
-#
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
-# ============================================================================
-import zlib
-import mindspore as ms
-from mindspore import ops
-import numpy as np
-from msprobe.core.common.const import Const
-from msprobe.core.data_dump.data_processor.base import (BaseDataProcessor, TensorStatInfo,
-                                                        ModuleForwardInputsOutputs, ModuleBackwardInputsOutputs)
-from msprobe.core.common.file_check import path_len_exceeds_limit
-from msprobe.mindspore.dump.hook_cell.wrap_functional import load_ops_functions
-from msprobe.mindspore.common.utils import convert_bf16_to_fp32, save_tensor_as_npy
-from msprobe.mindspore.common.log import logger
-from msprobe.mindspore.dump.hook_cell.api_registry import api_register
-class MindsporeDataProcessor(BaseDataProcessor):
-    mindspore_special_type = tuple([ms.Tensor])
-    ops_func, mint_ops_func, _ = load_ops_functions()
-    def __init__(self, config, data_writer):
-        super().__init__(config, data_writer)
-        self.mindspore_object_key = {
-            "dtype": self.analyze_dtype_in_kwargs
-        }
-    @staticmethod
-    def get_md5_for_tensor(x):
-        x = convert_bf16_to_fp32(x)
-        tensor_bytes = x.asnumpy().tobytes()
-        crc32_hash = zlib.crc32(tensor_bytes)
-        return f"{crc32_hash:08x}"
-    @staticmethod
-    def analyze_dtype_in_kwargs(element):
-        return {"type": "mindspore.dtype", "value": str(element)}
-    @staticmethod
-    def _analyze_builtin(arg):
-        single_arg = {}
-        if isinstance(arg, slice):
-            single_arg.update({"type": "slice"})
-            # slice参数中可能存在tensor类型，json序列化，需要转换为python数值类型
-            values = [
-                value if not isinstance(value, ms.Tensor) else value.item()
-                for value in [arg.start, arg.stop, arg.step]
-            ]
-            single_arg.update({"value": values})
-        else:
-            single_arg.update({"type": type(arg).__name__})
-            single_arg.update({"value": arg})
-        return single_arg
-    @classmethod
-    def get_special_types(cls):
-        return super().get_special_types() + cls.mindspore_special_type
-    def get_stat_info(self, data):
-        tensor_stat = TensorStatInfo()
-        if data.numel() == 0:
-            return tensor_stat
-        elif data.dtype == ms.bool_:
-            data_np = data.asnumpy()
-            tensor_stat.max = np.max(data_np).item()
-            tensor_stat.min = np.min(data_np).item()
-        elif not data.shape:
-            tensor_stat.max = tensor_stat.min = tensor_stat.mean = tensor_stat.norm = data.item()
-        elif data.dtype == ms.complex64 or data.dtype == ms.complex128:
-            data_abs = np.abs(data.asnumpy())
-            tensor_stat.max = np.max(data_abs).item()
-            tensor_stat.min = np.min(data_abs).item()
-            tensor_stat.mean = np.mean(data_abs).item()
-            tensor_stat.norm = np.linalg.norm(data_abs).item()
-        else:
-            if data.dtype == ms.bfloat16 or not ops.is_floating_point(data):
-                data = data.to(ms.float32)
-            api_register.norm_inner_op_set_ori_func()
-            tensor_stat.max = self.mint_ops_func["max"](data).item()
-            tensor_stat.min = self.mint_ops_func["min"](data).item()
-            tensor_stat.mean = self.mint_ops_func["mean"](data).item()
-            tensor_stat.norm = self.ops_func["norm"](data).item()
-            api_register.norm_inner_op_set_hook_func()
-        return tensor_stat
-    def analyze_single_element(self, element, suffix_stack):
-        if suffix_stack and suffix_stack[-1] in self.mindspore_object_key:
-            return self.mindspore_object_key[suffix_stack[-1]](element)
-        converted_numpy, numpy_type = self._convert_numpy_to_builtin(element)
-        if converted_numpy is not element:
-            return self._analyze_numpy(converted_numpy, numpy_type)
-        if isinstance(element, ms.Tensor):
-            return self._analyze_tensor(element, Const.SEP.join(suffix_stack))
-        if isinstance(element, (bool, int, float, str, slice)):
-            return self._analyze_builtin(element)
-        return {}
-    def _analyze_tensor(self, tensor, suffix):
-        tensor_stat = self.get_stat_info(tensor)
-        tensor_json = {
-            'type': 'mindspore.Tensor',
-            'dtype': str(tensor.dtype),
-            'shape': tensor.shape,
-            'Max': self.transfer_type(tensor_stat.max),
-            'Min': self.transfer_type(tensor_stat.min),
-            'Mean': self.transfer_type(tensor_stat.mean),
-            'Norm': self.transfer_type(tensor_stat.norm),
-        }
-        if self.config.summary_mode == Const.MD5:
-            tensor_md5 = self.get_md5_for_tensor(tensor)
-            tensor_json.update({Const.MD5: tensor_md5})
-        return tensor_json
-class StatisticsDataProcessor(MindsporeDataProcessor):
-    pass
-class TensorDataProcessor(MindsporeDataProcessor):
-    def _analyze_tensor(self, tensor, suffix):
-        dump_data_name, file_path = self.get_save_file_path(suffix)
-        single_arg = super()._analyze_tensor(tensor, suffix)
-        single_arg.update({"data_name": dump_data_name})
-        save_tensor_as_npy(tensor, file_path)
-        return single_arg
-class OverflowCheckDataProcessor(MindsporeDataProcessor):
-    """MindsporeDataProcessor variant that keeps results only when a tensor's Max or Min is inf/NaN."""
-    # NOTE(review): only one attribute is listed although __init__ and the analyze_* methods assign
-    # others; that works only if a parent class still provides an instance __dict__ - confirm.
-    __slots__ = ["cached_tensors_and_file_paths"]
-    def __init__(self, config, data_writer):
-        """Set up the tensor cache and the overflow counters; overflow_nums is read from config."""
-        super().__init__(config, data_writer)
-        # file_path -> tensor; filled by _analyze_tensor, flushed by maybe_save_overflow_data.
-        self.cached_tensors_and_file_paths = {}
-        # Incremented by maybe_save_overflow_data each time it runs with has_overflow set.
-        self.real_overflow_nums = 0
-        # Threshold compared in is_terminated; -1 makes is_terminated always return False.
-        self.overflow_nums = config.overflow_nums
-        # has_overflow is not initialised here; analyze_forward/analyze_backward assign it first.
-    @property
-    def is_terminated(self):
-        """Return True once real_overflow_nums has reached overflow_nums (never when it is -1)."""
-        if self.overflow_nums == -1:
-            return False
-        if self.real_overflow_nums >= self.overflow_nums:
-            # The Chinese message reads roughly: "exceeded the preset overflow count,
-            # current overflow count: N". It is logged on every access that hits this branch.
-            logger.info(f"[msprobe] 超过预设溢出次数 当前溢出次数: {self.real_overflow_nums}")
-            return True
-        return False
-    def analyze_forward(self, name, module, module_input_output: ModuleForwardInputsOutputs):
-        """Run the parent's forward analysis and return its result only if an overflow was flagged."""
-        # Reset the flag; presumably the parent call reaches _analyze_tensor, which may set it - confirm.
-        self.has_overflow = False
-        api_info_struct = super().analyze_forward(name, module, module_input_output)
-        self.maybe_save_overflow_data()
-        return api_info_struct if self.has_overflow else None
-    def analyze_backward(self, name, module, module_input_output: ModuleBackwardInputsOutputs):
-        """Run the parent's backward analysis and return its result only if an overflow was flagged."""
-        self.has_overflow = False
-        api_info_struct = super().analyze_backward(name, module, module_input_output)
-        self.maybe_save_overflow_data()
-        return api_info_struct if self.has_overflow else None
-    def maybe_save_overflow_data(self):
-        """Save all cached tensors and bump the counter if has_overflow is set; always clear the cache."""
-        if self.has_overflow:
-            for file_path, tensor in self.cached_tensors_and_file_paths.items():
-                save_tensor_as_npy(tensor, file_path)
-            self.real_overflow_nums += 1
-        # The cache is reset whether or not anything was saved.
-        self.cached_tensors_and_file_paths = {}
-    def _analyze_maybe_overflow_tensor(self, tensor_json):
-        """Set has_overflow when tensor_json's 'Max' or 'Min' is inf or NaN; do nothing if 'Max' is None."""
-        # Only 'Max' is tested for None; 'Min' is assumed to be usable whenever 'Max' is - TODO confirm.
-        if tensor_json['Max'] is None:
-            return
-        if np.isinf(tensor_json['Max']) or np.isnan(tensor_json['Max']):
-            self.has_overflow = True
-        if np.isinf(tensor_json['Min']) or np.isnan(tensor_json['Min']):
-            self.has_overflow = True
-    def _analyze_tensor(self, tensor, suffix):
-        """Cache the tensor for a possible later save, then return its summary with "data_name" added."""
-        dump_data_name, file_path = self.get_save_file_path(suffix)
-        # The tensor is cached only when path_len_exceeds_limit(file_path) is false; otherwise warn.
-        if not path_len_exceeds_limit(file_path):
-            self.cached_tensors_and_file_paths.update({file_path: tensor})
-        else:
-            logger.warning(f'The file path {file_path} length exceeds limit.')
-        single_arg = super()._analyze_tensor(tensor, suffix)
-        # The overflow check runs on the summary before "data_name" is attached.
-        self._analyze_maybe_overflow_tensor(single_arg)
-        single_arg.update({"data_name": dump_data_name})
-        return single_arg
+# Copyright 2024 Huawei Technologies Co., Ltd
+#
+# Licensed under the Apache License, Version 2.0 (the "License");
+# you may not use this file except in compliance with the License.
+# You may obtain a copy of the License at
+#
+# http://www.apache.org/licenses/LICENSE-2.0
+#
+# Unless required by applicable law or agreed to in writing, software
+# distributed under the License is distributed on an "AS IS" BASIS,
+# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
+# See the License for the specific language governing permissions and
+# limitations under the License.
+# ============================================================================
+import zlib
+import mindspore as ms
+from mindspore import mint, ops
+from mindspore._c_expression.typing import Number
+import numpy as np
+from msprobe.core.common.const import Const
+from msprobe.core.data_dump.data_processor.base import (BaseDataProcessor, TensorStatInfo,
+                                                        ModuleForwardInputsOutputs, ModuleBackwardInputsOutputs)
+from msprobe.core.common.file_utils import path_len_exceeds_limit
+from msprobe.mindspore.common.utils import convert_bf16_to_fp32, save_tensor_as_npy
+from msprobe.mindspore.common.log import logger
+from msprobe.mindspore.dump.hook_cell.api_registry import api_register
+class MindsporeDataProcessor(BaseDataProcessor):
+    """BaseDataProcessor subclass that turns MindSpore tensors and dtype objects into summary dicts."""
+    # Extra types that get_special_types() appends to the parent's special types.
+    mindspore_special_type = tuple([ms.Tensor, Number])
+    def __init__(self, config, data_writer):
+        """Forward config and data_writer to the parent and build the suffix-keyed handler table."""
+        super().__init__(config, data_writer)
+        # Handler used when the last suffix_stack entry matches a key (see analyze_single_element).
+        self.mindspore_object_key = {
+            "dtype": self.analyze_dtype_in_kwargs
+        }
+    @staticmethod
+    def get_md5_for_tensor(x):
+        """Return zlib.crc32 of the tensor's bytes as a zero-padded, 8-wide lowercase hex string.
+        NOTE: despite the method name, the value is a CRC32 checksum, not an MD5 digest.
+        """
+        # convert_bf16_to_fp32 is a project helper; presumably needed before asnumpy() - TODO confirm.
+        x = convert_bf16_to_fp32(x)
+        tensor_bytes = x.asnumpy().tobytes()
+        crc32_hash = zlib.crc32(tensor_bytes)
+        return f"{crc32_hash:08x}"
+    @staticmethod
+    def analyze_dtype_in_kwargs(element):
+        """Describe element as a dict with type "mindspore.dtype" and value str(element)."""
+        return {"type": "mindspore.dtype", "value": str(element)}
+    @classmethod
+    def get_special_types(cls):
+        """Return the parent's special types extended with mindspore_special_type."""
+        return super().get_special_types() + cls.mindspore_special_type
+    def get_stat_info(self, data):
+        """Compute max/min/mean/norm for a tensor and return them in a TensorStatInfo.
+        Fields not assigned in the selected branch keep whatever TensorStatInfo() sets them to.
+        """
+        tensor_stat = TensorStatInfo()
+        if data.numel() == 0:
+            # Empty tensor: return the freshly constructed TensorStatInfo unchanged.
+            return tensor_stat
+        elif data.dtype == ms.bool_:
+            # Bool tensor: only max and min are assigned, computed with NumPy.
+            data_np = data.asnumpy()
+            tensor_stat.max = np.max(data_np).item()
+            tensor_stat.min = np.min(data_np).item()
+        elif not data.shape:
+            # Empty shape (zero-dimensional tensor): the single value serves as all four statistics.
+            tensor_stat.max = tensor_stat.min = tensor_stat.mean = tensor_stat.norm = data.item()
+        elif data.dtype == ms.complex64 or data.dtype == ms.complex128:
+            # Complex tensor: statistics are taken over the element-wise absolute values.
+            data_abs = np.abs(data.asnumpy())
+            tensor_stat.max = np.max(data_abs).item()
+            tensor_stat.min = np.min(data_abs).item()
+            tensor_stat.mean = np.mean(data_abs).item()
+            tensor_stat.norm = np.linalg.norm(data_abs).item()
+        else:
+            if not ops.is_floating_point(data):
+                # Non-floating tensors are cast to float32 before the reductions below.
+                data = data.to(ms.float32)
+            # NOTE(review): the set_ori_func/set_hook_func pair presumably swaps hooked inner ops for
+            # their originals while statistics are computed - confirm in api_registry.
+            # The restoring call below is not in a try/finally, so an exception in between skips it.
+            api_register.norm_inner_op_set_ori_func()
+            # Each reduction is read from an api_register *_ori_attr dict, falling back to the public op.
+            get_max_value = api_register.mint_ops_ori_attr.get("max", mint.max)
+            get_min_value = api_register.mint_ops_ori_attr.get("min", mint.min)
+            get_mean_value = api_register.mint_ops_ori_attr.get("mean", mint.mean)
+            if hasattr(mint, "norm"):
+                get_norm_value = api_register.mint_ops_ori_attr.get("norm", mint.norm)
+            else:
+                # mint has no "norm" attribute: use the functional_ori_attr entry or ops.norm instead.
+                get_norm_value = api_register.functional_ori_attr.get("norm", ops.norm)
+            tensor_stat.max = get_max_value(data).item()
+            tensor_stat.min = get_min_value(data).item()
+            tensor_stat.mean = get_mean_value(data).item()
+            tensor_stat.norm = get_norm_value(data).item()
+            api_register.norm_inner_op_set_hook_func()
+        return tensor_stat
+    def analyze_single_element(self, element, suffix_stack):
+        """Convert one value to its summary dict, trying handlers in a fixed order.
+        Order: suffix-keyed handler, value changed by _convert_numpy_to_builtin, mindspore Number,
+        ms.Tensor, selected builtins. Anything else yields an empty dict.
+        """
+        if suffix_stack and suffix_stack[-1] in self.mindspore_object_key:
+            return self.mindspore_object_key[suffix_stack[-1]](element)
+        # _convert_numpy_to_builtin is not defined in this class; getting back a different object
+        # than element is treated as "a conversion happened".
+        converted_numpy, numpy_type = self._convert_numpy_to_builtin(element)
+        if converted_numpy is not element:
+            return self._analyze_numpy(converted_numpy, numpy_type)
+        if isinstance(element, Number):
+            return self.analyze_dtype_in_kwargs(element)
+        if isinstance(element, ms.Tensor):
+            # The tensor's suffix is the suffix_stack entries joined with Const.SEP.
+            return self._analyze_tensor(element, Const.SEP.join(suffix_stack))
+        if isinstance(element, (bool, int, float, str, slice, type(Ellipsis))):
+            return self._analyze_builtin(element)
+        return {}
+    def _analyze_tensor(self, tensor, suffix):
+        """Build the summary dict for a tensor: type, dtype, shape, Max, Min, Mean and Norm.
+        suffix is not used in this implementation. When config.summary_mode equals Const.MD5,
+        the get_md5_for_tensor checksum is added under the Const.MD5 key.
+        """
+        tensor_stat = self.get_stat_info(tensor)
+        # transfer_type is not defined in this class; each statistic is passed through it.
+        tensor_json = {
+            'type': 'mindspore.Tensor',
+            'dtype': str(tensor.dtype),
+            'shape': tensor.shape,
+            'Max': self.transfer_type(tensor_stat.max),
+            'Min': self.transfer_type(tensor_stat.min),
+            'Mean': self.transfer_type(tensor_stat.mean),
+            'Norm': self.transfer_type(tensor_stat.norm),
+        }
+        if self.config.summary_mode == Const.MD5:
+            tensor_md5 = self.get_md5_for_tensor(tensor)
+            tensor_json.update({Const.MD5: tensor_md5})
+        return tensor_json
+class StatisticsDataProcessor(MindsporeDataProcessor):
+    """Processor that adds nothing of its own; all behaviour comes from MindsporeDataProcessor."""
+    pass
+class TensorDataProcessor(MindsporeDataProcessor):
+    """MindsporeDataProcessor variant that also writes every analysed tensor with save_tensor_as_npy."""
+    def _analyze_tensor(self, tensor, suffix):
+        """Return the parent's tensor summary extended with "data_name", and save the tensor to file_path."""
+        # get_save_file_path is not defined in this class; it yields the dump name and the target path.
+        dump_data_name, file_path = self.get_save_file_path(suffix)
+        single_arg = super()._analyze_tensor(tensor, suffix)
+        single_arg.update({"data_name": dump_data_name})
+        # The tensor is saved unconditionally, after the summary has been built.
+        save_tensor_as_npy(tensor, file_path)
+        return single_arg
+class OverflowCheckDataProcessor(MindsporeDataProcessor):
+    """MindsporeDataProcessor variant that keeps results only when a tensor's Max or Min is inf/NaN."""
+    # NOTE(review): only one attribute is listed although __init__ assigns four; that works only
+    # if a parent class still provides an instance __dict__ - confirm.
+    __slots__ = ["cached_tensors_and_file_paths"]
+    def __init__(self, config, data_writer):
+        """Set up the overflow flag, tensor cache and counters; overflow_nums is read from config."""
+        super().__init__(config, data_writer)
+        # Set by _analyze_maybe_overflow_tensor; reset at the start of analyze_forward/backward.
+        self.has_overflow = False
+        # file_path -> tensor; filled by _analyze_tensor, flushed by maybe_save_overflow_data.
+        self.cached_tensors_and_file_paths = {}
+        # Incremented by maybe_save_overflow_data each time it runs with has_overflow set.
+        self.real_overflow_nums = 0
+        # Threshold compared in is_terminated; -1 makes is_terminated always return False.
+        self.overflow_nums = config.overflow_nums
+    @property
+    def is_terminated(self):
+        """Return True once real_overflow_nums has reached overflow_nums (never when it is -1)."""
+        if self.overflow_nums == -1:
+            return False
+        if self.real_overflow_nums >= self.overflow_nums:
+            return True
+        return False
+    def analyze_forward(self, name, module, module_input_output: ModuleForwardInputsOutputs):
+        """Run the parent's forward analysis and return its result only if an overflow was flagged."""
+        # Reset the flag; presumably the parent call reaches _analyze_tensor, which may set it - confirm.
+        self.has_overflow = False
+        api_info_struct = super().analyze_forward(name, module, module_input_output)
+        self.maybe_save_overflow_data()
+        return api_info_struct if self.has_overflow else None
+    def analyze_backward(self, name, module, module_input_output: ModuleBackwardInputsOutputs):
+        """Run the parent's backward analysis and return its result only if an overflow was flagged."""
+        self.has_overflow = False
+        api_info_struct = super().analyze_backward(name, module, module_input_output)
+        self.maybe_save_overflow_data()
+        return api_info_struct if self.has_overflow else None
+    def maybe_save_overflow_data(self):
+        """Save all cached tensors and bump the counter if has_overflow is set; always clear the cache."""
+        if self.has_overflow:
+            for file_path, tensor in self.cached_tensors_and_file_paths.items():
+                save_tensor_as_npy(tensor, file_path)
+            self.real_overflow_nums += 1
+            # Same condition as is_terminated; the message is logged here, when the counter changes.
+            if self.overflow_nums != -1 and self.real_overflow_nums >= self.overflow_nums:
+                logger.info(f"[{Const.TOOL_NAME}] Reached the preset overflow times, "
+                            f"current overflow times: {self.real_overflow_nums}.")
+        # The cache is reset whether or not anything was saved.
+        self.cached_tensors_and_file_paths = {}
+    def _analyze_maybe_overflow_tensor(self, tensor_json):
+        """Set has_overflow when tensor_json's 'Max' or 'Min' is inf or NaN; do nothing if 'Max' is None."""
+        # Only 'Max' is tested for None; 'Min' is assumed to be usable whenever 'Max' is - TODO confirm.
+        if tensor_json['Max'] is None:
+            return
+        if np.isinf(tensor_json['Max']) or np.isnan(tensor_json['Max']):
+            self.has_overflow = True
+        if np.isinf(tensor_json['Min']) or np.isnan(tensor_json['Min']):
+            self.has_overflow = True
+    def _analyze_tensor(self, tensor, suffix):
+        """Cache the tensor for a possible later save, then return its summary with "data_name" added."""
+        dump_data_name, file_path = self.get_save_file_path(suffix)
+        # The tensor is cached only when path_len_exceeds_limit(file_path) is false; otherwise warn.
+        if not path_len_exceeds_limit(file_path):
+            self.cached_tensors_and_file_paths.update({file_path: tensor})
+        else:
+            logger.warning(f'The file path {file_path} length exceeds limit.')
+        single_arg = super()._analyze_tensor(tensor, suffix)
+        # The overflow check runs on the summary before "data_name" is attached.
+        self._analyze_maybe_overflow_tensor(single_arg)
+        single_arg.update({"data_name": dump_data_name})
+        return single_arg

mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl

mindstudio-probe 1.0.3__py3-none-any.whl → 1.1.0__py3-none-any.whl