PyPI - mindstudio-probe - Versions diffs - 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl - Mend

mindstudio-probe 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (689) hide show

{mindstudio_probe-8.3.2.dist-info → mindstudio_probe-26.0.0a1.dist-info}/METADATA +26 -14
mindstudio_probe-26.0.0a1.dist-info/RECORD +498 -0
{mindstudio_probe-8.3.2.dist-info → mindstudio_probe-26.0.0a1.dist-info}/WHEEL +1 -1
mindstudio_probe-26.0.0a1.dist-info/entry_points.txt +5 -0
mindstudio_probe-26.0.0a1.dist-info/licenses/LICENSE +124 -0
mindstudio_probe-26.0.0a1.dist-info/top_level.txt +2 -0
msprobe/__init__.py +12 -13
msprobe/config.json +9 -31
msprobe/core/__init__.py +12 -11
msprobe/core/acc_check/acc_check_cli.py +145 -0
msprobe/core/common/const.py +97 -38
msprobe/core/common/db_manager.py +133 -12
msprobe/core/common/decorator.py +12 -11
msprobe/core/common/exceptions.py +12 -11
msprobe/core/common/file_utils.py +101 -25
msprobe/core/common/framework_adapter.py +36 -25
msprobe/core/common/global_lock.py +12 -11
msprobe/core/common/inplace_op_checker.py +12 -11
msprobe/core/common/log.py +22 -11
msprobe/core/common/megatron_utils.py +566 -11
msprobe/core/common/parallel_state.py +12 -11
msprobe/core/common/runtime.py +12 -11
msprobe/core/common/utils.py +41 -41
msprobe/core/compare/acc_compare.py +361 -104
msprobe/core/compare/atb_data_compare.py +422 -0
msprobe/core/compare/auto_compare.py +134 -0
msprobe/core/compare/check.py +14 -17
msprobe/core/compare/compare_cli.py +72 -149
msprobe/core/compare/config.py +12 -13
msprobe/core/compare/diff_analyze/first_diff_analyze.py +28 -15
msprobe/core/compare/diff_analyze/ignore_op_list.yaml +3 -0
msprobe/core/compare/find_first/analyzer.py +18 -18
msprobe/core/compare/find_first/graph.py +12 -11
msprobe/core/compare/find_first/utils.py +13 -12
msprobe/core/compare/indicator_analysis/__init__.py +15 -0
msprobe/core/compare/indicator_analysis/algorithm.py +363 -0
msprobe/core/compare/indicator_analysis/api_data.py +141 -0
msprobe/core/compare/indicator_analysis/calculator.py +181 -0
msprobe/core/compare/indicator_analysis/utils.py +116 -0
msprobe/core/compare/layer_mapping/__init__.py +12 -11
msprobe/core/compare/layer_mapping/data_scope_parser.py +20 -11
msprobe/core/compare/layer_mapping/layer_mapping.py +14 -13
msprobe/core/compare/layer_mapping/postprocess_pass.py +13 -11
msprobe/core/compare/merge_result/merge_result.py +12 -11
msprobe/core/compare/merge_result/merge_result_cli.py +12 -11
msprobe/core/compare/merge_result/utils.py +12 -11
msprobe/core/compare/multiprocessing_compute.py +13 -14
msprobe/core/compare/npy_compare.py +13 -11
msprobe/core/compare/offline_data_compare.py +160 -0
msprobe/core/compare/stats_diff_calc.py +39 -0
msprobe/core/compare/torchair_acc_cmp.py +764 -0
msprobe/core/compare/torchair_cmp_utils.py +338 -0
msprobe/core/compare/utils.py +140 -49
msprobe/core/config_check/__init__.py +12 -11
msprobe/core/config_check/checkers/__init__.py +12 -11
msprobe/core/config_check/checkers/base_checker.py +15 -14
msprobe/core/config_check/checkers/dataset_checker.py +13 -12
msprobe/core/config_check/checkers/env_args_checker.py +13 -12
msprobe/core/config_check/checkers/hyperparameter_checker.py +16 -15
msprobe/core/config_check/checkers/pip_checker.py +15 -15
msprobe/core/config_check/checkers/random_checker.py +13 -12
msprobe/core/config_check/checkers/weights_checker.py +14 -12
msprobe/core/config_check/ckpt_compare/ckpt_comparator.py +13 -17
msprobe/core/config_check/ckpt_compare/megatron_loader.py +13 -12
msprobe/core/config_check/ckpt_compare/metrics.py +12 -11
msprobe/core/config_check/config_check_cli.py +18 -17
msprobe/core/config_check/config_checker.py +16 -14
msprobe/core/config_check/resource/dependency.yaml +15 -12
msprobe/core/config_check/resource/env.yaml +12 -11
msprobe/core/config_check/utils/hyperparameter_parser.py +12 -11
msprobe/core/config_check/utils/utils.py +12 -11
msprobe/core/{data_dump → dump/api_dump}/api_registry.py +12 -11
msprobe/core/{common_config.py → dump/common_config.py} +13 -24
msprobe/core/dump/data_dump/data_collector.py +257 -0
msprobe/core/{data_dump → dump/data_dump}/data_processor/base.py +45 -36
msprobe/core/{data_dump → dump/data_dump}/data_processor/factory.py +33 -25
msprobe/core/{data_dump → dump/data_dump}/data_processor/mindspore_processor.py +37 -113
msprobe/core/{data_dump → dump/data_dump}/data_processor/pytorch_processor.py +364 -131
msprobe/core/{data_dump → dump/data_dump}/json_writer.py +24 -31
msprobe/core/{data_dump → dump/data_dump}/scope.py +12 -13
msprobe/core/{debugger → dump/debugger}/precision_debugger.py +15 -23
msprobe/core/dump/dump2db/db_utils.py +215 -0
msprobe/core/dump/dump2db/dump2db.py +409 -0
msprobe/core/{hook_manager.py → dump/hook_manager.py} +38 -87
msprobe/core/dump/kernel_dump/kernel_config.py +34 -0
msprobe/core/{service.py → dump/service.py} +43 -27
msprobe/core/install_deps/install_deps.py +51 -0
msprobe/core/monitor/anomaly_processor.py +13 -11
msprobe/core/monitor/csv2db.py +73 -93
msprobe/core/monitor/db_utils.py +140 -205
msprobe/core/monitor/utils.py +18 -17
msprobe/core/monitor_v2/__init__.py +20 -0
msprobe/core/monitor_v2/base.py +83 -0
msprobe/core/monitor_v2/cc.py +287 -0
msprobe/core/monitor_v2/factory.py +81 -0
msprobe/core/monitor_v2/module.py +201 -0
msprobe/core/monitor_v2/optimizer.py +245 -0
msprobe/core/monitor_v2/param.py +154 -0
msprobe/core/monitor_v2/trainer.py +326 -0
msprobe/core/monitor_v2/utils.py +122 -0
msprobe/core/monitor_v2/weight_grad.py +419 -0
msprobe/core/monitor_v2/writer.py +162 -0
msprobe/core/overflow_check/abnormal_scene.py +12 -11
msprobe/core/overflow_check/api_info.py +12 -11
msprobe/core/overflow_check/checker.py +12 -11
msprobe/core/overflow_check/filter.py +13 -11
msprobe/core/overflow_check/level.py +12 -11
msprobe/core/overflow_check/utils.py +12 -11
msprobe/core/single_save/single_comparator.py +12 -11
msprobe/core/single_save/single_saver.py +12 -11
msprobe/infer/__init__.py +16 -0
msprobe/infer/offline/__init__.py +16 -0
msprobe/infer/offline/compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/args_adapter.py +46 -0
msprobe/infer/offline/compare/msquickcmp/atc/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/atc/atc_utils.py +98 -0
msprobe/infer/offline/compare/msquickcmp/cmp_process.py +328 -0
msprobe/infer/offline/compare/msquickcmp/common/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/common/args_check.py +112 -0
msprobe/infer/offline/compare/msquickcmp/common/convert.py +74 -0
msprobe/infer/offline/compare/msquickcmp/common/dump_data.py +121 -0
msprobe/infer/offline/compare/msquickcmp/common/dynamic_argument_bean.py +39 -0
msprobe/infer/offline/compare/msquickcmp/common/utils.py +669 -0
msprobe/infer/offline/compare/msquickcmp/config.ini +6 -0
msprobe/infer/offline/compare/msquickcmp/dump/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/dump/args_adapter.py +50 -0
msprobe/infer/offline/compare/msquickcmp/dump/dump_process.py +91 -0
msprobe/infer/offline/compare/msquickcmp/install_aclruntime_aisbench.sh +180 -0
msprobe/infer/offline/compare/msquickcmp/main.py +199 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/net_compare.py +277 -0
msprobe/infer/offline/compare/msquickcmp/npu/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/npu/npu_dump_data.py +558 -0
msprobe/infer/offline/compare/msquickcmp/npu/om_parser.py +416 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/onnx_dump_data.py +374 -0
msprobe/infer/utils/__init__.py +15 -0
msprobe/infer/utils/acc_cmp.py +94 -0
msprobe/infer/utils/check/__init__.py +37 -0
msprobe/infer/utils/check/args_checker.py +35 -0
msprobe/infer/utils/check/checker.py +227 -0
msprobe/infer/utils/check/dict_checker.py +78 -0
msprobe/infer/utils/check/func_wrapper.py +96 -0
msprobe/infer/utils/check/list_checker.py +56 -0
msprobe/infer/utils/check/number_checker.py +64 -0
msprobe/infer/utils/check/obj_checker.py +41 -0
msprobe/infer/utils/check/path_checker.py +249 -0
msprobe/infer/utils/check/rule.py +126 -0
msprobe/infer/utils/check/string_checker.py +66 -0
msprobe/infer/utils/cmp_algorithm.py +261 -0
msprobe/infer/utils/constants.py +112 -0
msprobe/infer/utils/file_open_check.py +337 -0
msprobe/infer/utils/util.py +177 -0
msprobe/mindspore/__init__.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_info.py +12 -11
msprobe/mindspore/api_accuracy_checker/api_runner.py +12 -11
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/flash_attention_score.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/fusion_operator.py +12 -11
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +12 -11
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +15 -14
msprobe/mindspore/api_accuracy_checker/compute_element.py +12 -11
msprobe/mindspore/api_accuracy_checker/data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/main.py +12 -11
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +14 -12
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/torch_mindtorch_importer.py +12 -11
msprobe/mindspore/api_accuracy_checker/type_mapping.py +12 -11
msprobe/mindspore/api_accuracy_checker/utils.py +12 -11
msprobe/mindspore/common/const.py +15 -74
msprobe/mindspore/common/log.py +12 -11
msprobe/mindspore/common/utils.py +30 -15
msprobe/mindspore/compare/common_dir_compare.py +21 -23
msprobe/mindspore/compare/distributed_compare.py +18 -16
msprobe/mindspore/compare/ms_compare.py +14 -14
msprobe/mindspore/compare/ms_graph_compare.py +26 -20
msprobe/mindspore/compare/utils.py +14 -12
msprobe/mindspore/{cell_processor.py → dump/cell_processor.py} +15 -14
msprobe/mindspore/{debugger → dump/debugger}/debugger_config.py +12 -30
msprobe/mindspore/{debugger → dump/debugger}/precision_debugger.py +43 -45
msprobe/mindspore/dump/{cell_dump_process.py → dump_processor/cell_dump_process.py} +31 -17
msprobe/mindspore/dump/{cell_dump_with_insert_gradient.py → dump_processor/cell_dump_with_insert_gradient.py} +18 -14
msprobe/mindspore/dump/{dump_tool_factory.py → dump_processor/dump_tool_factory.py} +16 -15
msprobe/mindspore/dump/{graph_mode_cell_dump.py → dump_processor/graph_mode_cell_dump.py} +16 -15
msprobe/mindspore/dump/{graph_tensor_dump.py → dump_processor/graph_tensor_dump.py} +134 -133
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/api_register.py +15 -14
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/hook_cell.py +12 -11
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/ms_hook_manager.py +47 -20
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/primitive_hooks.py +14 -13
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/support_wrap_ops.yaml +13 -11
msprobe/mindspore/dump/{jit_dump.py → dump_processor/jit_dump.py} +14 -13
msprobe/mindspore/dump/{kernel_graph_dump.py → dump_processor/kernel_graph_dump.py} +13 -12
msprobe/mindspore/dump/{kernel_kbyk_dump.py → dump_processor/kernel_kbyk_dump.py} +13 -12
msprobe/mindspore/{exception_dump → dump/exception_dump}/exception_dump_tool_factory.py +14 -13
msprobe/mindspore/{exception_dump → dump/exception_dump}/kernel_graph_exception_dump.py +13 -12
msprobe/mindspore/{mindspore_service.py → dump/mindspore_service.py} +18 -17
msprobe/mindspore/dump/mindtorch/__init__.py +19 -0
msprobe/mindspore/dump/ms_config.py +105 -0
msprobe/mindspore/{overflow_check → dump/overflow_check}/kernel_graph_overflow_check.py +13 -12
msprobe/mindspore/{overflow_check → dump/overflow_check}/overflow_check_tool_factory.py +14 -13
msprobe/mindspore/dump/task_handler_factory.py +43 -0
msprobe/mindspore/monitor/common_func.py +12 -11
msprobe/mindspore/monitor/data_writers.py +12 -11
msprobe/mindspore/monitor/distributed/wrap_distributed.py +93 -39
msprobe/mindspore/monitor/features.py +12 -11
msprobe/mindspore/monitor/module_hook.py +19 -22
msprobe/mindspore/monitor/optimizer_collect.py +29 -25
msprobe/mindspore/monitor/utils.py +13 -11
msprobe/msaccucmp/advisor/__init__.py +16 -0
msprobe/msaccucmp/advisor/advisor_const.py +65 -0
msprobe/msaccucmp/advisor/advisor_result.py +73 -0
msprobe/msaccucmp/advisor/compare_advisor.py +99 -0
msprobe/msaccucmp/advisor/input_advisor.py +66 -0
msprobe/msaccucmp/advisor/node_advisor.py +68 -0
msprobe/msaccucmp/advisor/overflow_advisor.py +58 -0
msprobe/msaccucmp/algorithm_manager/__init__.py +16 -0
msprobe/msaccucmp/algorithm_manager/algorithm_manager.py +464 -0
msprobe/msaccucmp/algorithm_manager/algorithm_parameter.py +42 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_AccumulatedRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_CosineSimilarity.py +58 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_KullbackLeiblerDivergence.py +84 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RelativeEuclideanDistance.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RootMeanSquareError.py +40 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_StandardDeviation.py +47 -0
msprobe/msaccucmp/cmp_utils/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/common.py +113 -0
msprobe/msaccucmp/cmp_utils/constant/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/constant/compare_error.py +81 -0
msprobe/msaccucmp/cmp_utils/constant/const_manager.py +530 -0
msprobe/msaccucmp/cmp_utils/file_utils.py +497 -0
msprobe/msaccucmp/cmp_utils/log.py +257 -0
msprobe/msaccucmp/cmp_utils/multi_process/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/multi_process/multi_convert_process.py +140 -0
msprobe/msaccucmp/cmp_utils/multi_process/progress.py +78 -0
msprobe/msaccucmp/cmp_utils/path_check.py +274 -0
msprobe/msaccucmp/cmp_utils/reg_manager.py +98 -0
msprobe/msaccucmp/cmp_utils/tlv_parse.py +279 -0
msprobe/msaccucmp/cmp_utils/utils.py +356 -0
msprobe/msaccucmp/cmp_utils/utils_type.py +63 -0
msprobe/msaccucmp/compare_vector.py +48 -0
msprobe/msaccucmp/conversion/__init__.py +16 -0
msprobe/msaccucmp/conversion/data_conversion.py +277 -0
msprobe/msaccucmp/conversion/dtype_conversion.py +99 -0
msprobe/msaccucmp/conversion/shape_format_conversion.py +477 -0
msprobe/msaccucmp/conversion/tensor_conversion.py +369 -0
msprobe/msaccucmp/dump_data_conversion.py +46 -0
msprobe/msaccucmp/dump_parse/__init__.py +16 -0
msprobe/msaccucmp/dump_parse/big_dump_data.py +317 -0
msprobe/msaccucmp/dump_parse/dump.py +423 -0
msprobe/msaccucmp/dump_parse/dump_data_object.py +322 -0
msprobe/msaccucmp/dump_parse/dump_data_parser.py +436 -0
msprobe/msaccucmp/dump_parse/dump_utils.py +246 -0
msprobe/msaccucmp/dump_parse/ffts_parser.py +137 -0
msprobe/msaccucmp/dump_parse/mapping.py +62 -0
msprobe/msaccucmp/dump_parse/nano_dump_data.py +392 -0
msprobe/msaccucmp/dump_parse/proto_dump_data.py +308 -0
msprobe/msaccucmp/dump_parser.py +90 -0
msprobe/msaccucmp/format_manager/__init__.py +16 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NCHW.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_ND.py +52 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NHWC.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_HWCN.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_NCHW.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_FRACTAL_Z.py +89 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_HWCN.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NCHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NHWC.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_NCDHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_ND.py +44 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_HWCN.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/format_manager.py +307 -0
msprobe/msaccucmp/inplace_layer_process.py +186 -0
msprobe/msaccucmp/msaccucmp.py +532 -0
msprobe/msaccucmp/mscmp_advisor.py +128 -0
msprobe/msaccucmp/overflow/__init__.py +16 -0
msprobe/msaccucmp/overflow/overflow_analyse.py +305 -0
msprobe/msaccucmp/overflow/overflow_detection.py +143 -0
msprobe/msaccucmp/pytorch_cmp/__init__.py +16 -0
msprobe/msaccucmp/pytorch_cmp/compare_pytorch.py +389 -0
msprobe/msaccucmp/pytorch_cmp/hdf5_parser.py +377 -0
msprobe/msaccucmp/pytorch_cmp/pytorch_dump_data.py +461 -0
msprobe/msaccucmp/shape_conversion.py +41 -0
msprobe/msaccucmp/vector_cmp/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/batch_compare.py +197 -0
msprobe/msaccucmp/vector_cmp/compare_detail/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/compare_detail/compare_detail.py +245 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail.py +182 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail_writer.py +580 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_fusion_op.py +588 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_npu_vs_npu.py +339 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_result.py +326 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_rule.py +156 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_op.py +204 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_rule_parser.py +635 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/quant_filter.py +187 -0
msprobe/msaccucmp/vector_cmp/range_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_manager.py +100 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_mode.py +94 -0
msprobe/msaccucmp/vector_cmp/range_manager/select_mode.py +86 -0
msprobe/msaccucmp/vector_cmp/vector_comparison.py +535 -0
msprobe/msprobe.py +101 -130
msprobe/overflow_check/__init__.py +15 -0
msprobe/{nan_analyze → overflow_check}/analyzer.py +38 -27
msprobe/{nan_analyze → overflow_check}/graph.py +30 -27
msprobe/{nan_analyze → overflow_check}/utils.py +15 -14
msprobe/pytorch/__init__.py +20 -14
msprobe/pytorch/aclgraph_dump/__init__.py +45 -0
msprobe/pytorch/aclgraph_dump/_meta.py +26 -0
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut.py → acc_check/acc_check.py} +50 -45
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut_utils.py → acc_check/acc_check_utils.py} +201 -30
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/data_generate.py +56 -16
msprobe/pytorch/api_accuracy_checker/{run_ut/multi_run_ut.py → acc_check/multi_acc_check.py} +32 -47
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/run_overflow_check.py +19 -18
msprobe/pytorch/api_accuracy_checker/common/config.py +22 -20
msprobe/pytorch/api_accuracy_checker/common/utils.py +72 -13
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +41 -11
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +23 -14
msprobe/pytorch/api_accuracy_checker/compare/compare.py +45 -32
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +12 -11
msprobe/pytorch/api_accuracy_checker/compare/compare_input.py +14 -12
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +14 -12
msprobe/pytorch/api_accuracy_checker/precision_standard/absolute_threshold.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/accumulative_error_compare.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/base_standard.py +21 -19
msprobe/pytorch/api_accuracy_checker/precision_standard/benchmark_compare.py +14 -13
msprobe/pytorch/api_accuracy_checker/precision_standard/binary_consistency.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_config.py +60 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_register.py +27 -16
msprobe/pytorch/api_accuracy_checker/precision_standard/thousandth_standard.py +13 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/ulp_compare.py +39 -18
msprobe/pytorch/bench_functions/__init__.py +12 -11
msprobe/pytorch/bench_functions/apply_adam.py +12 -11
msprobe/pytorch/bench_functions/apply_adam_w.py +12 -11
msprobe/pytorch/bench_functions/confusion_transpose.py +12 -11
msprobe/pytorch/bench_functions/fast_gelu.py +12 -11
msprobe/pytorch/bench_functions/group_norm_silu.py +12 -11
msprobe/pytorch/bench_functions/layer_norm_eval.py +12 -11
msprobe/pytorch/bench_functions/linear.py +12 -11
msprobe/pytorch/bench_functions/matmul_backward.py +12 -11
msprobe/pytorch/bench_functions/mish.py +12 -11
msprobe/pytorch/bench_functions/moe_gating_top_k_softmax.py +12 -11
msprobe/pytorch/bench_functions/npu_fusion_attention.py +12 -11
msprobe/pytorch/bench_functions/rms_norm.py +12 -11
msprobe/pytorch/bench_functions/rotary_mul.py +12 -11
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +12 -11
msprobe/pytorch/bench_functions/sort_v2.py +12 -11
msprobe/pytorch/bench_functions/swiglu.py +12 -11
msprobe/pytorch/common/__init__.py +12 -11
msprobe/pytorch/common/log.py +12 -11
msprobe/pytorch/common/parse_json.py +12 -11
msprobe/pytorch/common/utils.py +52 -19
msprobe/pytorch/compare/distributed_compare.py +13 -13
msprobe/pytorch/compare/match.py +12 -11
msprobe/pytorch/compare/pt_compare.py +14 -20
msprobe/pytorch/compare/pt_diff_analyze.py +12 -11
msprobe/pytorch/compare/utils.py +12 -11
msprobe/pytorch/{hook_module → dump/api_dump}/api_register.py +18 -16
msprobe/pytorch/{hook_module → dump/api_dump}/hook_module.py +14 -13
msprobe/pytorch/{hook_module → dump/api_dump}/pt_hook_manager.py +68 -23
msprobe/pytorch/{hook_module → dump/api_dump}/register_optimizer_hook.py +13 -11
msprobe/pytorch/{hook_module → dump/api_dump}/script_wrapper.py +17 -14
msprobe/pytorch/{hook_module → dump/api_dump}/utils.py +12 -11
msprobe/pytorch/{debugger → dump/debugger}/debugger_config.py +23 -38
msprobe/pytorch/dump/debugger/precision_debugger.py +130 -0
msprobe/pytorch/{function_factory.py → dump/function_factory.py} +12 -11
msprobe/pytorch/dump/module_dump/hook_wrapper.py +17 -13
msprobe/pytorch/dump/module_dump/module_dump.py +16 -15
msprobe/pytorch/dump/module_dump/{module_processer.py → module_processor.py} +54 -42
msprobe/pytorch/dump/pt_config.py +128 -0
msprobe/pytorch/{pytorch_service.py → dump/pytorch_service.py} +22 -21
msprobe/pytorch/monitor/csv2tb.py +13 -11
msprobe/pytorch/monitor/data_writers.py +13 -11
msprobe/pytorch/monitor/distributed/wrap_distributed.py +13 -11
msprobe/pytorch/monitor/features.py +12 -11
msprobe/pytorch/monitor/module_hook.py +67 -59
msprobe/pytorch/monitor/module_metric.py +13 -11
msprobe/pytorch/monitor/optimizer_collect.py +37 -35
msprobe/pytorch/monitor/utils.py +13 -11
msprobe/pytorch/monitor/visualizer.py +12 -11
msprobe/pytorch/torchair_dump/__init__.py +17 -0
msprobe/pytorch/torchair_dump/torchair_dump.py +114 -0
msprobe/scripts/atb/config_example.json +10 -0
msprobe/scripts/atb/load_atb_probe.sh +101 -0
msprobe/scripts/atb/unload_atb_probe.sh +27 -0
msprobe/scripts/build_msaccucmp.sh +186 -0
msprobe/scripts/conf/help.info +6 -0
msprobe/scripts/conf/version.info +3 -0
msprobe/scripts/run_script/common.sh +538 -0
msprobe/scripts/run_script/main_msaccucmp.sh +232 -0
msprobe/visualization/__init__.py +12 -11
msprobe/visualization/builder/__init__.py +12 -11
msprobe/visualization/builder/graph_builder.py +45 -30
msprobe/visualization/builder/graph_merger.py +53 -32
msprobe/visualization/builder/msprobe_adapter.py +34 -44
msprobe/visualization/compare/__init__.py +12 -11
msprobe/visualization/compare/graph_comparator.py +63 -51
msprobe/visualization/compare/mode_adapter.py +28 -113
msprobe/visualization/db_utils.py +133 -22
msprobe/visualization/graph/__init__.py +12 -11
msprobe/visualization/graph/base_node.py +15 -27
msprobe/visualization/graph/distributed_analyzer.py +97 -40
msprobe/visualization/graph/graph.py +14 -16
msprobe/visualization/graph/node_colors.py +34 -31
msprobe/visualization/graph/node_op.py +12 -11
msprobe/visualization/graph_service.py +580 -205
msprobe/visualization/utils.py +278 -31
tb_graph_ascend/secure_build.py +175 -0
tb_graph_ascend/server/__init__.py +15 -0
tb_graph_ascend/server/app/__init__.py +15 -0
tb_graph_ascend/server/app/model/__init__.py +15 -0
tb_graph_ascend/server/app/model/hierarchy.py +348 -0
tb_graph_ascend/server/app/model/layout_hierarchy_model.py +69 -0
tb_graph_ascend/server/app/model/match_nodes_model.py +573 -0
tb_graph_ascend/server/app/repositories/__init__.py +15 -0
tb_graph_ascend/server/app/repositories/graph_repo_base.py +32 -0
tb_graph_ascend/server/app/repositories/graph_repo_db.py +879 -0
tb_graph_ascend/server/app/repositories/graph_repo_vis.py +83 -0
tb_graph_ascend/server/app/service/__init__.py +18 -0
tb_graph_ascend/server/app/service/graph_service_base.py +158 -0
tb_graph_ascend/server/app/service/graph_service_db.py +438 -0
tb_graph_ascend/server/app/service/graph_service_factory.py +54 -0
tb_graph_ascend/server/app/service/graph_service_vis.py +480 -0
tb_graph_ascend/server/app/utils/__init__.py +15 -0
tb_graph_ascend/server/app/utils/constant.py +80 -0
tb_graph_ascend/server/app/utils/file_check_wrapper.py +46 -0
tb_graph_ascend/server/app/utils/global_state.py +95 -0
tb_graph_ascend/server/app/utils/graph_utils.py +661 -0
tb_graph_ascend/server/app/utils/i18n.py +153 -0
tb_graph_ascend/server/app/utils/request_method.py +46 -0
tb_graph_ascend/server/app/views/__init__.py +15 -0
tb_graph_ascend/server/app/views/graph_views.py +304 -0
tb_graph_ascend/server/plugin.py +108 -0
tb_graph_ascend/server/static/index.html +9250 -0
tb_graph_ascend/server/static/index.js +21 -0
tb_graph_ascend/setup.py +57 -0
mindstudio_probe-8.3.2.dist-info/LICENSE +0 -201
mindstudio_probe-8.3.2.dist-info/RECORD +0 -491
mindstudio_probe-8.3.2.dist-info/entry_points.txt +0 -2
mindstudio_probe-8.3.2.dist-info/top_level.txt +0 -1
msprobe/CMakeLists.txt +0 -5
msprobe/README.md +0 -203
msprobe/core/advisor/advisor.py +0 -129
msprobe/core/advisor/advisor_const.py +0 -58
msprobe/core/advisor/advisor_result.py +0 -58
msprobe/core/compare/find_first/data_processor.py +0 -35
msprobe/core/compare/highlight.py +0 -390
msprobe/core/data_dump/data_collector.py +0 -356
msprobe/core/grad_probe/constant.py +0 -90
msprobe/core/grad_probe/grad_compare.py +0 -187
msprobe/core/grad_probe/utils.py +0 -105
msprobe/core/kernel_dump/kernel_config.py +0 -33
msprobe/docs/01.installation.md +0 -250
msprobe/docs/02.config_introduction.md +0 -221
msprobe/docs/03.config_examples.md +0 -281
msprobe/docs/04.kernel_dump_PyTorch.md +0 -73
msprobe/docs/05.data_dump_PyTorch.md +0 -518
msprobe/docs/06.data_dump_MindSpore.md +0 -618
msprobe/docs/07.accuracy_checker_PyTorch.md +0 -310
msprobe/docs/09.accuracy_checker_MindSpore.md +0 -120
msprobe/docs/10.accuracy_compare_PyTorch.md +0 -637
msprobe/docs/11.accuracy_compare_MindSpore.md +0 -769
msprobe/docs/12.overflow_check_PyTorch.md +0 -82
msprobe/docs/13.overflow_check_MindSpore.md +0 -33
msprobe/docs/14.data_parse_PyTorch.md +0 -282
msprobe/docs/15.free_benchmarking_PyTorch.md +0 -169
msprobe/docs/16.free_benchmarking_MindSpore.md +0 -159
msprobe/docs/17.grad_probe.md +0 -205
msprobe/docs/18.online_dispatch.md +0 -89
msprobe/docs/19.monitor.md +0 -753
msprobe/docs/20.monitor_performance_baseline.md +0 -52
msprobe/docs/21.visualization_PyTorch.md +0 -519
msprobe/docs/22.visualization_MindSpore.md +0 -515
msprobe/docs/23.generate_operator_PyTorch.md +0 -107
msprobe/docs/24.code_mapping_Mindspore.md +0 -29
msprobe/docs/25.tool_function_introduction.md +0 -29
msprobe/docs/26.data_dump_PyTorch_baseline.md +0 -48
msprobe/docs/27.dump_json_instruction.md +0 -795
msprobe/docs/28.debugger_save_instruction.md +0 -288
msprobe/docs/28.kernel_dump_MindSpore.md +0 -69
msprobe/docs/29.data_dump_MSAdapter.md +0 -235
msprobe/docs/30.overflow_check_MSAdapter.md +0 -31
msprobe/docs/31.config_check.md +0 -107
msprobe/docs/32.ckpt_compare.md +0 -69
msprobe/docs/33.generate_operator_MindSpore.md +0 -181
msprobe/docs/34.RL_collect.md +0 -101
msprobe/docs/35.nan_analyze.md +0 -73
msprobe/docs/36.calculation_result_change.md +0 -75
msprobe/docs/FAQ.md +0 -232
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +0 -146
msprobe/docs/accuracy_checker_MindSpore/accuracy_checker_MindSpore_baseline.md +0 -14
msprobe/docs/data_dump_MindSpore/data_dump_MindSpore_baseline.md +0 -33
msprobe/docs/data_dump_MindSpore/dynamic_graph_quick_start_example.md +0 -217
msprobe/docs/img/BLOOM-7B_1.png +0 -0
msprobe/docs/img/BLOOM-7B_2.png +0 -0
msprobe/docs/img/BLOOM-7B_3.png +0 -0
msprobe/docs/img/BLOOM-7B_4.png +0 -0
msprobe/docs/img/GPT-3_1.png +0 -0
msprobe/docs/img/GPT-3_2.png +0 -0
msprobe/docs/img/GPT-3_3.png +0 -0
msprobe/docs/img/GPT-3_4.png +0 -0
msprobe/docs/img/GPT-3_5.png +0 -0
msprobe/docs/img/GPT-3_6.png +0 -0
msprobe/docs/img/GPT-3_7.png +0 -0
msprobe/docs/img/GPT-3_8.png +0 -0
msprobe/docs/img/YOLOV5S_1.png +0 -0
msprobe/docs/img/YOLOV5S_2.png +0 -0
msprobe/docs/img/accuracy_checking_details.png +0 -0
msprobe/docs/img/accuracy_checking_result.png +0 -0
msprobe/docs/img/api_precision_compare_details.png +0 -0
msprobe/docs/img/api_precision_compare_result.png +0 -0
msprobe/docs/img/auto_analyze_log.png +0 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/compare_result_pkl.png +0 -0
msprobe/docs/img/compare_result_pkl_md5.png.png +0 -0
msprobe/docs/img/cpu_info.png +0 -0
msprobe/docs/img/free_benchmark.png +0 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/grad_probe_image-1.png +0 -0
msprobe/docs/img/grad_probe_image-2.png +0 -0
msprobe/docs/img/grad_probe_image-3.png +0 -0
msprobe/docs/img/grad_probe_image-4.png +0 -0
msprobe/docs/img/grad_probe_image.png +0 -0
msprobe/docs/img/merge_result.png +0 -0
msprobe/docs/img/module_compare.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/docs/img/monitor/step_count_per_record.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/docs/img/save_compare_result_sample.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_ms.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_pt.png +0 -0
msprobe/docs/img/visualization/proxy.png +0 -0
msprobe/docs/img/visualization/tensorboard_1.png +0 -0
msprobe/docs/img/visualization/tensorboard_2.png +0 -0
msprobe/docs/img/visualization/vis_browser_1.png +0 -0
msprobe/docs/img/visualization/vis_browser_2.png +0 -0
msprobe/docs/img/visualization/vis_match_info.png +0 -0
msprobe/docs/img/visualization/vis_precision_info.png +0 -0
msprobe/docs/img/visualization/vis_search_info.png +0 -0
msprobe/docs/img/visualization/vis_show_info.png +0 -0
msprobe/docs/img/visualization/vis_showcase.png +0 -0
msprobe/docs/img/visualization/vis_unmatch_info.png +0 -0
msprobe/docs/visualization/GPTModel.png +0 -0
msprobe/docs/visualization/ParallelMLP.png +0 -0
msprobe/docs/visualization/layer_mapping_example.md +0 -132
msprobe/docs/visualization/mapping.png +0 -0
msprobe/docs/visualization/mapping1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/3.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/4.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/5.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/6.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/7.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory-qwen25vl.txt +0 -59
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed-mm-qwen25vl.txt +0 -80
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactory_mapping.md +0 -330
msprobe/docs/visualization/module_name.png +0 -0
msprobe/docs/visualization/module_name1.png +0 -0
msprobe/docs/visualization/no_mapping.png +0 -0
msprobe/docs/visualization/no_mapping1.png +0 -0
msprobe/docs/visualization/no_mapping_analyze.png +0 -0
msprobe/docs/visualization/top_layer.png +0 -0
msprobe/mindspore/api_accuracy_checker/generate_op_script/op_generator.py +0 -460
msprobe/mindspore/api_accuracy_checker/generate_op_script/operator_replication.template +0 -2081
msprobe/mindspore/code_mapping/bind.py +0 -283
msprobe/mindspore/code_mapping/cmd_parser.py +0 -40
msprobe/mindspore/code_mapping/graph.py +0 -49
msprobe/mindspore/code_mapping/graph_parser.py +0 -211
msprobe/mindspore/code_mapping/main.py +0 -24
msprobe/mindspore/code_mapping/processor.py +0 -34
msprobe/mindspore/dym_loader/hook_dynamic_loader.cpp +0 -111
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +0 -52
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +0 -257
msprobe/mindspore/free_benchmark/common/config.py +0 -27
msprobe/mindspore/free_benchmark/common/handler_params.py +0 -31
msprobe/mindspore/free_benchmark/common/utils.py +0 -100
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -638
msprobe/mindspore/free_benchmark/handler/base_handler.py +0 -105
msprobe/mindspore/free_benchmark/handler/check_handler.py +0 -55
msprobe/mindspore/free_benchmark/handler/fix_handler.py +0 -51
msprobe/mindspore/free_benchmark/handler/handler_factory.py +0 -36
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +0 -82
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +0 -45
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +0 -78
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +0 -77
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +0 -56
msprobe/mindspore/free_benchmark/perturbation/no_change.py +0 -27
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +0 -46
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +0 -51
msprobe/mindspore/grad_probe/global_context.py +0 -127
msprobe/mindspore/grad_probe/grad_analyzer.py +0 -260
msprobe/mindspore/grad_probe/grad_monitor.py +0 -42
msprobe/mindspore/grad_probe/grad_stat_csv.py +0 -161
msprobe/mindspore/grad_probe/hook.py +0 -115
msprobe/mindspore/grad_probe/utils.py +0 -43
msprobe/mindspore/mindtorch/__init__.py +0 -18
msprobe/mindspore/ms_config.py +0 -153
msprobe/mindspore/task_handler_factory.py +0 -44
msprobe/nan_analyze/__init__.py +0 -14
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +0 -9
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +0 -480
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +0 -567
msprobe/pytorch/debugger/precision_debugger.py +0 -181
msprobe/pytorch/free_benchmark/__init__.py +0 -23
msprobe/pytorch/free_benchmark/common/constant.py +0 -85
msprobe/pytorch/free_benchmark/common/counter.py +0 -87
msprobe/pytorch/free_benchmark/common/enums.py +0 -80
msprobe/pytorch/free_benchmark/common/params.py +0 -152
msprobe/pytorch/free_benchmark/common/utils.py +0 -143
msprobe/pytorch/free_benchmark/compare/grad_saver.py +0 -215
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +0 -121
msprobe/pytorch/free_benchmark/main.py +0 -123
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +0 -28
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +0 -56
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +0 -107
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +0 -121
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +0 -89
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +0 -87
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +0 -43
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +0 -60
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +0 -34
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +0 -252
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +0 -54
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +0 -40
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +0 -45
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +0 -181
msprobe/pytorch/grad_probe/__init__.py +0 -0
msprobe/pytorch/grad_probe/grad_monitor.py +0 -108
msprobe/pytorch/grad_probe/grad_stat_csv.py +0 -160
msprobe/pytorch/hook_module/__init__.py +0 -16
msprobe/pytorch/hook_module/wrap_aten.py +0 -111
msprobe/pytorch/online_dispatch/__init__.py +0 -19
msprobe/pytorch/online_dispatch/compare.py +0 -224
msprobe/pytorch/online_dispatch/dispatch.py +0 -332
msprobe/pytorch/online_dispatch/dump_compare.py +0 -179
msprobe/pytorch/online_dispatch/single_compare.py +0 -412
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +0 -58
msprobe/pytorch/online_dispatch/utils.py +0 -158
msprobe/pytorch/parse_tool/__init__.py +0 -0
msprobe/pytorch/parse_tool/cli.py +0 -31
msprobe/pytorch/parse_tool/lib/__init__.py +0 -0
msprobe/pytorch/parse_tool/lib/compare.py +0 -253
msprobe/pytorch/parse_tool/lib/config.py +0 -50
msprobe/pytorch/parse_tool/lib/file_desc.py +0 -45
msprobe/pytorch/parse_tool/lib/interactive_cli.py +0 -97
msprobe/pytorch/parse_tool/lib/parse_exception.py +0 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +0 -161
msprobe/pytorch/parse_tool/lib/utils.py +0 -299
msprobe/pytorch/parse_tool/lib/visualization.py +0 -85
msprobe/pytorch/pt_config.py +0 -299
/msprobe/core/{grad_probe → dump}/__init__.py +0 -0
/msprobe/{mindspore/code_mapping → core/dump/api_dump}/__init__.py +0 -0
/msprobe/{mindspore/debugger → core/dump/data_dump}/__init__.py +0 -0
/msprobe/{mindspore/exception_dump → core/dump/data_dump/data_processor}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark → core/dump/debugger}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark/common → core/dump/kernel_dump}/__init__.py +0 -0
/msprobe/mindspore/{free_benchmark/handler → dump/debugger}/__init__.py +0 -0
/msprobe/mindspore/{grad_probe → dump/dump_processor}/__init__.py +0 -0
/msprobe/mindspore/{overflow_check → dump/exception_dump}/__init__.py +0 -0
/msprobe/mindspore/{mindtorch → dump/mindtorch}/mindtorch_adaptor.py +0 -0
/msprobe/{pytorch/api_accuracy_checker/run_ut → mindspore/dump/overflow_check}/__init__.py +0 -0
/msprobe/{pytorch/debugger → mindspore/monitor}/__init__.py +0 -0
/msprobe/{pytorch/free_benchmark/common → msaccucmp}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/.keep +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers → api_accuracy_checker/acc_check}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/torch_ut_setting.json +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers/npu → dump/api_dump}/__init__.py +0 -0
/msprobe/pytorch/{hook_module → dump/api_dump}/support_wrap_ops.yaml +0 -0
/msprobe/pytorch/{free_benchmark/result_handlers → dump/debugger}/__init__.py +0 -0

msprobe/msaccucmp/vector_cmp/fusion_manager/compare_npu_vs_npu.py ADDED Viewed

@@ -0,0 +1,339 @@
+# coding=utf-8
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
+#
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
+#
+#          http://license.coscl.org.cn/MulanPSL2
+#
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
+"""
+Function:
+NpuVsNpuComparison class. This class mainly involves the compare function.
+"""
+import numpy as np
+from msprobe.msaccucmp.cmp_utils import utils
+from msprobe.msaccucmp.cmp_utils import common
+from msprobe.msaccucmp.cmp_utils import log
+from msprobe.msaccucmp.cmp_utils.constant.const_manager import ConstManager
+from msprobe.msaccucmp.dump_parse.dump import CompareData
+from msprobe.msaccucmp.algorithm_manager.algorithm_manager import AlgorithmManager
+from msprobe.msaccucmp.vector_cmp.fusion_manager.fusion_op import FusionOp
+from msprobe.msaccucmp.vector_cmp.fusion_manager.fusion_op import Tensor
+from msprobe.msaccucmp.vector_cmp.fusion_manager import compare_result
+from msprobe.msaccucmp.cmp_utils.constant.compare_error import CompareError
+from msprobe.msaccucmp.overflow.overflow_detection import OverflowDetection
+from msprobe.msaccucmp.dump_parse.ffts_parser import FFTSParser
+from msprobe.msaccucmp.dump_parse import dump_utils
+from msprobe.msaccucmp.conversion.tensor_conversion import ConvertSingleTensorFormat
+class NpuVsNpuComparison:
+    """
+    The class for npu vs npu comparison
+    """
+    def __init__(self: any, compare_data: CompareData, fusion_op_list: list, algorithm_manager: AlgorithmManager,
+                 overflow_detection: bool = False) -> None:
+        """
+        Store the comparison inputs and create the tensor format converter.
+
+        :param compare_data: comparison context; this class reads its left_dump_info,
+            right_dump_info and dump_version attributes
+        :param fusion_op_list: fusion ops for one operator; must be non-empty because element 0
+            supplies op_name. compare() treats element 0 as "my output" and element 1 as ground truth
+        :param algorithm_manager: runs the comparison algorithms and builds NaN results
+        :param overflow_detection: when True, overflow detection is run on each my-output tensor
+        """
+        self.compare_data = compare_data
+        self.fusion_op_list = fusion_op_list
+        self.algorithm_manager = algorithm_manager
+        self.op_name = fusion_op_list[0].op_name
+        self.overflow_detection = overflow_detection
+        self.enable_padding_restore = True # reserved switch controlling whether padding restoration is enabled
+        self._tensor_converter = ConvertSingleTensorFormat()
+    def check_tensor_valid(self: any, my_output_tensor_list: any, ground_truth_tensor_list: any,
+                           tensor_type: str) -> (int, str):
+        """
+        check tensor valid
+        """
+        # check the length is same
+        if len(my_output_tensor_list) != len(ground_truth_tensor_list):
+            message = log.print_not_match_error(
+                self.op_name, 'number of %s' % tensor_type, str(len(my_output_tensor_list)),
+                str(len(ground_truth_tensor_list)))
+            return CompareError.MSACCUCMP_INVALID_DUMP_DATA_ERROR, message
+        if len(my_output_tensor_list) != 0:
+            # check each tensor format and shape valid
+            return self._check_op_data_valid(my_output_tensor_list, ground_truth_tensor_list, tensor_type)
+        message = '[%s] There is no %s. Skip the %s:%s.' % (self.op_name, tensor_type, self.op_name, tensor_type)
+        log.print_info_log(message)
+        return CompareError.MSACCUCMP_INVALID_DUMP_DATA_ERROR, message
+    def _restore_tensor_data_if_needed(self, tensor: Tensor):
+        """
+        根据开关决定是否对 tensor 做格式转换 + 按 original_shape 切掉 padding。
+        """
+        if not self._tensor_converter:
+            return tensor.data
+        try:
+            # ConvertSingleTensorFormat.__call__ 返回的是 np.ndarray
+            restored = self._tensor_converter(tensor)
+        except CompareError as ee:
+            # 出错时回退到原始数据，保证比对流程不中断
+            log.print_error_log(ee)
+            return tensor.data
+        except Exception as ee:  # 兜底
+            log.print_error_log(ee)
+            return tensor.data
+        return restored
+    def compare(self: any) -> (int, bool, list):
+        """
+        Compare for npu vs npu by op_name
+
+        fusion_op_list[0] is loaded as "my output" and fusion_op_list[1] as the ground truth.
+        When fusion_op_list holds a single entry, the result of _make_one_dump_file_result
+        is returned instead.
+        :return ret: return code; MSACCUCMP_NONE_ERROR as soon as inputs or outputs passed validation
+        :return dump_match: True, at least one operator match;False, no operator match
+        :return result: the compare result by the fusion op list
+        """
+        single_op_cmp_result = compare_result.SingleOpCmpResult()
+        if len(self.fusion_op_list) == 1:
+            return self._make_one_dump_file_result()
+        # get my output and ground truth tensor
+        error_msg = []
+        try:
+            my_output_dump_data = self._get_dump_data(
+                self.fusion_op_list[0], self.compare_data.left_dump_info.path,
+                self.compare_data.left_dump_info.op_name_to_task_mode_map, ConstManager.LEFT_TYPE)
+        except CompareError as error:
+            # loading the my-output dump failed: report the op with the error code and no tensor results
+            error_msg.append(error.message)
+            fusion_op_result = compare_result.FusionOpComResult(self.algorithm_manager)
+            _result = fusion_op_result.get_result(self.fusion_op_list[0], None, error_msg)
+            result_info = utils.ResultInfo(
+                self.fusion_op_list[0].op_name, True, _result.result_list, error.code,
+                [], _result.input_result_list, _result.output_result_list, _result.is_ffts,
+                {}, True)
+            single_op_cmp_result.update_attr(result_info)
+            return error.code, True, [single_op_cmp_result]
+        # NOTE(review): unlike the my-output load above, a CompareError raised here is not caught
+        # and propagates to the caller - confirm this asymmetry is intended.
+        ground_truth_dump_data = self._get_dump_data(
+            self.fusion_op_list[1], self.compare_data.right_dump_info.path,
+            self.compare_data.right_dump_info.op_name_to_task_mode_map, ConstManager.RIGHT_TYPE)
+        compare_vector_result = []
+        # check npu input data valid
+        input_ret, input_error_msg = self.check_tensor_valid(
+            my_output_dump_data.data.input_data, ground_truth_dump_data.data.input_data, ConstManager.INPUT)
+        if input_ret == CompareError.MSACCUCMP_NONE_ERROR:
+            # compare input
+            compare_vector_result += self._compare_by_tensor(my_output_dump_data, ground_truth_dump_data,
+                                                             ConstManager.INPUT)
+        # check npu output data valid
+        output_ret, output_error_msg = self.check_tensor_valid(
+            my_output_dump_data.data.output_data, ground_truth_dump_data.data.output_data, ConstManager.OUTPUT)
+        if output_ret == CompareError.MSACCUCMP_NONE_ERROR:
+            # compare output
+            compare_vector_result += self._compare_by_tensor(my_output_dump_data, ground_truth_dump_data,
+                                                             ConstManager.OUTPUT)
+        # NOTE(review): only the my-output side's ffts_file_check flag is inspected here.
+        if not my_output_dump_data.data.ffts_file_check:
+            msg = "This is a FFTS+ mode dump data, The number of files does not match the number of thread"
+            error_msg.append(msg)
+        # if no input and output, result is NaN
+        if input_ret != CompareError.MSACCUCMP_NONE_ERROR and output_ret != CompareError.MSACCUCMP_NONE_ERROR:
+            error_msg.append(input_error_msg)
+            error_msg.append(output_error_msg)
+            compare_vector_result = None
+        else:
+            # at least one of input/output was comparable, so the op as a whole reports success
+            output_ret = CompareError.MSACCUCMP_NONE_ERROR
+        # NOTE(review): overflow_detection is not forwarded to FusionOpComResult here, whereas
+        # _make_one_dump_file_result passes it - confirm whether that difference is intended.
+        fusion_op_result = compare_result.FusionOpComResult(self.algorithm_manager)
+        _result = fusion_op_result.get_result(self.fusion_op_list[0], compare_vector_result, error_msg)
+        result_info = utils.ResultInfo(
+            my_output_dump_data.name, True, _result.result_list, output_ret,
+            [], _result.input_result_list, _result.output_result_list, _result.is_ffts,
+            {}, True)
+        single_op_cmp_result.update_attr(result_info)
+        return output_ret, True, [single_op_cmp_result]
+    def _make_one_dump_file_result(self: any) -> (int, bool, list):
+        error_msg = []
+        # if only left or right has dump file, the result is NaN
+        single_op_cmp_result = compare_result.SingleOpCmpResult()
+        if self.fusion_op_list[0].op_type == ConstManager.LEFT_TYPE:
+            message = '[%s] There is no the ground truth dump file for the op "%s".' % (self.op_name, self.op_name)
+            log.print_warn_log(message)
+            error_msg.append(message)
+        elif self.fusion_op_list[0].op_type == ConstManager.RIGHT_TYPE:
+            message = '[%s] There is no the my output dump file for the op "%s".' % (self.op_name, self.op_name)
+            log.print_warn_log(message)
+            error_msg.append(message)
+        fusion_op_result = compare_result.FusionOpComResult(self.algorithm_manager,
+                                                            overflow_detection=self.overflow_detection)
+        _result = fusion_op_result.get_result(self.fusion_op_list[0], None, error_msg, no_dump_file=True)
+        result_info = utils.ResultInfo(
+            self.fusion_op_list[0].op_name, False, _result.result_list,
+            CompareError.MSACCUCMP_NO_DUMP_FILE_ERROR,
+            self.fusion_op_list[0].input_list, _result.input_result_list,
+            _result.output_result_list, _result.is_ffts, {}, True)
+        single_op_cmp_result.update_attr(result_info)
+        return CompareError.MSACCUCMP_NO_DUMP_FILE_ERROR, False, [single_op_cmp_result]
+    def _get_dump_data(self: any, fusion_op: FusionOp, dump_path: str,
+                       op_name_to_task_mode_map, dump_type: str) -> Tensor:
+        """
+        get dump data by fusion op output_desc
+        """
+        dump_file_list = fusion_op.output_desc
+        if not dump_file_list:
+            raise CompareError(CompareError.MSACCUCMP_NO_DUMP_FILE_ERROR)
+        dump_data_list = [dump_utils.parse_dump_file(dump_file_path, self.compare_data.dump_version)
+                          for dump_file_path in dump_file_list]
+        dump_mode = op_name_to_task_mode_map.get(self.op_name)
+        if dump_mode == ConstManager.AUTOMATIC_MODE or dump_mode == ConstManager.MANUAL_MODE:
+            ffts_parser = FFTSParser(dump_file_list, dump_data_list)
+            dump_file_path, dump_data = ffts_parser.parse_ffts
+            log.print_info_log(
+                'The "%s" in the path "%s" is FFTS+ dump data. After process the output data, the file path is "%s".'
+                % (fusion_op.op_name, dump_path, dump_file_path))
+        else:
+            dump_file_path = dump_file_list[-1]
+            dump_data = dump_data_list[-1]
+        log.print_info_log('[%s] [%s] %s' % (fusion_op.op_name, dump_type, dump_file_path))
+        if dump_data.op_name and dump_data.attr:
+            fusion_op.op_name = dump_data.op_name
+        tensor = Tensor(fusion_op.op_name, 0, '', [])
+        tensor.set_path(dump_file_path)
+        tensor.set_data(dump_data)
+        return tensor
+    def _check_op_data_valid(self: any, my_output_list: any, ground_truth_list: any, tensor_type: str) -> (int, str):
+        """
+        check format and shape of each tensor valid
+        """
+        message = ""
+        tensor_id_prefix = "%s:%s" % (self.op_name, tensor_type)
+        for index, (my_output_tensor, ground_truth_tensor) in enumerate(zip(my_output_list, ground_truth_list)):
+            tensor_id = '%s:%d' % (tensor_id_prefix, index)
+            # check format valid
+            if my_output_tensor.tensor_format != ground_truth_tensor.tensor_format:
+                message = log.print_not_match_error(
+                    self.op_name, 'format',
+                    common.get_format_string(my_output_tensor.tensor_format),
+                    common.get_format_string(ground_truth_tensor.tensor_format), tensor_id)
+                return CompareError.MSACCUCMP_INVALID_DUMP_DATA_ERROR, message
+            # check the length of shape is the same
+            if len(my_output_tensor.shape) != len(ground_truth_tensor.shape):
+                message = log.print_not_match_error(
+                    self.op_name, 'shape',
+                    utils.convert_shape_to_string(my_output_tensor.shape),
+                    utils.convert_shape_to_string(ground_truth_tensor.shape), tensor_id)
+                return CompareError.MSACCUCMP_INVALID_DUMP_DATA_ERROR, message
+            # check each dim in shape is the same
+            for my_output_dim, ground_truth_dim in zip(my_output_tensor.shape, ground_truth_tensor.shape):
+                if my_output_dim != ground_truth_dim:
+                    message = log.print_not_match_error(
+                        self.op_name, 'shape',
+                        utils.convert_shape_to_string(my_output_tensor.shape),
+                        utils.convert_shape_to_string(ground_truth_tensor.shape), tensor_id)
+                    return CompareError.MSACCUCMP_INVALID_DUMP_DATA_ERROR, message
+        return CompareError.MSACCUCMP_NONE_ERROR, message
+    def _compare_by_one_tensor(self: any, my_output_dump_data: Tensor, ground_truth_dump_data: Tensor,
+                               my_output_tensor: any, ground_truth_tensor: any) -> (list, list):
+        error_msg = []
+        tensor_id = f"{self.op_name}_TENSOR"
+        # 1. deserialize output data to array
+        if my_output_tensor and ground_truth_tensor:
+            if self.enable_padding_restore:
+                restored_left = self._restore_tensor_data_if_needed(my_output_tensor)
+                restored_right = self._restore_tensor_data_if_needed(ground_truth_tensor)
+                # 强制 numpy flatten，避免后端 compare 出现 numpy bool 错误
+                my_output_data_array = np.asarray(restored_left).astype(np.float32).flatten()
+                ground_truth_data_array = np.asarray(restored_right).astype(np.float32).flatten()
+                # 若长度不一致，直接报 warning，方便定位问题
+                if my_output_data_array.shape != ground_truth_data_array.shape:
+                    message = f"[{tensor_id}] Shape mismatch after restore: " \
+                              f"{my_output_data_array.shape} vs {ground_truth_data_array.shape}"
+                    log.print_warn_log(message)
+                    raise CompareError(CompareError.MSACCUCMP_INVALID_SHAPE_ERROR, message)
+            else:
+                my_output_data_array = my_output_tensor.data.flatten()
+                ground_truth_data_array = ground_truth_tensor.data.flatten()
+        else:
+            return self.algorithm_manager.make_nan_result(), error_msg
+        try:
+            # 2. compare by support algorithm
+            algorithm_result, error_msg = self.algorithm_manager.compare(
+                my_output_data_array, ground_truth_data_array,
+                {'my_output_dump_file': my_output_dump_data.path,
+                 'ground_truth_dump_file': ground_truth_dump_data.path,
+                 'shape_type': utils.get_shape_type(my_output_tensor.shape)})
+        except CompareError as compare_error:
+            if isinstance(compare_error, CompareError):
+                error_msg.append(compare_error.message)
+            algorithm_result = self.algorithm_manager.make_nan_result()
+        return algorithm_result, error_msg
+    def _compare_by_tensor(self: any, my_output_dump_data: Tensor, ground_truth_dump_data: Tensor,
+                           tensor_type: str) -> list:
+        tensor_result_list = []
+        if tensor_type == ConstManager.INPUT:
+            my_output_tensor_list = my_output_dump_data.data.input_data
+            ground_truth_tensor_list = ground_truth_dump_data.data.input_data
+            is_input = True
+        else:
+            my_output_tensor_list = my_output_dump_data.data.output_data
+            ground_truth_tensor_list = ground_truth_dump_data.data.output_data
+            is_input = False
+        # compare each tensor
+        for index, (my_output_tensor, ground_truth_tensor) in enumerate(
+                zip(my_output_tensor_list, ground_truth_tensor_list)):
+            tensor_id = '%s:%s:%d' % (my_output_dump_data.name, tensor_type, index)
+            log.print_info_log('[%s] compare %s %s for %s.'
+                               % (self.fusion_op_list[0].op_name,
+                                  common.get_format_string(my_output_tensor.tensor_format),
+                                  utils.convert_shape_to_string(my_output_tensor.shape),
+                                  tensor_id))
+            algorithm_result, error_msg = self._compare_by_one_tensor(my_output_dump_data, ground_truth_dump_data,
+                                                                      my_output_tensor, ground_truth_tensor)
+            # Check whether the current input/output data overflows
+            overflow_result = ''
+            if self.overflow_detection:
+                overflow_result = OverflowDetection.process_model_overflow_detection(my_output_dump_data.name,
+                                                                                     index, is_input, my_output_tensor)
+            my_output_tensor_dtype = utils.get_data_type(my_output_tensor.data_type)
+            ground_truth_tensor_dtype = utils.get_data_type(ground_truth_tensor.data_type)
+            my_output_tensor_address = utils.get_address_from_tensor(my_output_tensor)
+            ground_truth_tensor_address = utils.get_address_from_tensor(ground_truth_tensor)
+            op_type = dump_utils.get_op_type_from_file_name(my_output_dump_data.path)
+            # 3. merge result
+            tensor_info = {
+                "tensor_id": tensor_id,
+                "shape": my_output_tensor.shape,
+                "op_type": op_type,
+                "my_output_dtype": my_output_tensor_dtype,
+                "ground_truth_dtype": ground_truth_tensor_dtype,
+                "my_output_address": my_output_tensor_address,
+                "ground_truth_address": ground_truth_tensor_address
+            }
+            tensor_result_list.append(
+                compare_result.TensorResult(
+                    tensor_info, [algorithm_result, overflow_result], error_msg, my_output_tensor.is_ffts))
+        return tensor_result_list

msprobe/msaccucmp/vector_cmp/fusion_manager/compare_result.py ADDED Viewed

@@ -0,0 +1,326 @@
+# coding=utf-8
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
+#
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
+#
+#          http://license.coscl.org.cn/MulanPSL2
+#
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
+"""
+Function:
+This file defines the FusionOpComResult class. It mainly involves the get_result function.
+"""
+import collections
+from msprobe.msaccucmp.vector_cmp.fusion_manager import fusion_rule_parser
+from msprobe.msaccucmp.cmp_utils import log
+from msprobe.msaccucmp.cmp_utils.constant.const_manager import ConstManager
+from msprobe.msaccucmp.vector_cmp.range_manager.range_manager import RangeManager
+from msprobe.msaccucmp.algorithm_manager.algorithm_manager import AlgorithmManager
+from msprobe.msaccucmp.vector_cmp.fusion_manager.fusion_op import FusionOp
+from msprobe.msaccucmp.cmp_utils.constant.compare_error import CompareError
+class TensorResult:
+    """
+    The class for tensor compare result
+    """
+    def __init__(self: any, tensor_info: dict, result: list, error_msg: list, is_ffts: bool) -> None:
+        self.tensor_info = tensor_info
+        self.algorithm_result = result[0]
+        self.error_msg = error_msg
+        self.overflow_result = result[1]
+        self.is_ffts = is_ffts
+    def get_result(self: any) -> list:
+        """
+        Get tensor result list
+        :return [tensor_id, shape, algorithm_result, error_msg]
+        """
+        shape_str = '[%s]' % ",".join(map(str, self.tensor_info.get("shape", ConstManager.NAN)))
+        if self.overflow_result:
+            result = [shape_str] + [self.overflow_result] + self.algorithm_result + [",".join(self.error_msg)]
+        else:
+            result = [shape_str] + self.algorithm_result + [",".join(self.error_msg)]
+        if self.tensor_info.get("tensor_id"):
+            result = [self.tensor_info.get("tensor_id")] + result
+        return result
+    def get_algorithm_result(self: any) -> list:
+        """
+        Get algorithm result
+        """
+        return self.algorithm_result
+    def get_my_output_dtype(self):
+        return self.tensor_info.get("my_output_dtype", ConstManager.NAN)
+    def get_ground_truth_dtype(self):
+        return self.tensor_info.get("ground_truth_dtype", ConstManager.NAN)
+    def get_my_output_address(self):
+        return self.tensor_info.get("my_output_address", ConstManager.NAN)
+    def get_ground_truth_address(self):
+        return self.tensor_info.get("ground_truth_address", ConstManager.NAN)
+    def get_op_type(self):
+        return self.tensor_info.get("op_type", ConstManager.NAN)
+class PytorchOpInfo:
+    """
+    The class for pytorch op info
+    """
+    def __init__(self: any, index: int, op_name: str, my_dump_path: str, ground_truth_dump_path: str) -> None:
+        self.index = index
+        self.op_name = op_name
+        self.my_dump_path = my_dump_path
+        self.ground_truth_dump_path = ground_truth_dump_path
+    def get_result(self: any) -> list:
+        """
+        Get op info result
+        :return [index, op_name, my_dump_path, ground_truth_dump_path]
+        """
+        return [str(self.index), self.op_name, self.my_dump_path, self.ground_truth_dump_path]
+    def get_op_name(self: any) -> str:
+        """
+        Get op name
+        """
+        return self.op_name
+class FusionOpComResult:
+    """
+    The class for fusion op compare result
+    """
+    def __init__(self: any, algorithm_manager: AlgorithmManager, ground_truth_to_my_output_map: any = None,
+                 overflow_detection: bool = False, dump_is_cpu_or_gpu_data: list = None) -> None:
+        self.algorithm_manager = algorithm_manager
+        self.ground_truth_to_my_output_map = ground_truth_to_my_output_map
+        self.overflow_detection = overflow_detection
+        self.is_ground_truth_gpu_or_cpu = dump_is_cpu_or_gpu_data[0] if dump_is_cpu_or_gpu_data else False
+        self.is_my_dump_gpu_or_cpu = dump_is_cpu_or_gpu_data[1] if dump_is_cpu_or_gpu_data else False
+    @staticmethod
+    def _make_ops_without_map(fusion_op: FusionOp, no_dump_file: bool) -> (str, str):
+        my_output_op = fusion_op.op_name
+        ground_truth_op = fusion_op.op_name
+        # if only left or right has dump file
+        if fusion_op.op_type in [ConstManager.LEFT_TYPE, ConstManager.RIGHT_TYPE]:
+            if no_dump_file:
+                if fusion_op.op_type == ConstManager.LEFT_TYPE:
+                    ground_truth_op = '*'
+                elif fusion_op.op_type == ConstManager.RIGHT_TYPE:
+                    my_output_op = '*'
+        else:
+            ground_truth_op = ','.join(fusion_op.attr.original_op_names)
+            if ground_truth_op == '':
+                ground_truth_op = '*'
+        return my_output_op, ground_truth_op
+    @staticmethod
+    def _process_input_and_output(result, input_result_list, output_result_list):
+        if ConstManager.INPUT_PATTERN in result[ConstManager.TENSOR_INDEX]:
+            input_result_list.append(result)
+        elif ConstManager.OUTPUT_PATTERN in result[ConstManager.TENSOR_INDEX]:
+            output_result_list.append(result)
+        return input_result_list, output_result_list
+    def get_result(self: any, fusion_op: FusionOp, tensor_result: any, error_msg: list,
+                   no_dump_file: bool = False) -> any:
+        """
+        Get fusion op compare result list
+        :param fusion_op: the fusion op
+        :param tensor_result: the tensor result list
+        :param error_msg: error message
+        :param no_dump_file: the result no dump file
+        :return [op_id, my_output_op, ground_truth_op, tensor_id, shape, algorithm_result, error_msg]
+        """
+        result_list = []
+        input_result_list = []
+        output_result_list = []
+        is_ffts = False
+        my_output_op, ground_truth_op = self._make_my_output_op_and_ground_truth_op(fusion_op, no_dump_file)
+        if tensor_result:
+            for item in tensor_result:
+                current_tensor_info = [
+                    str(fusion_op.op_id), item.get_op_type(),
+                    my_output_op, str(item.get_my_output_dtype()),
+                    str(item.get_my_output_address()), ground_truth_op,
+                    str(item.get_ground_truth_dtype()), str(item.get_ground_truth_address())
+                ]
+                self._pre_handle_result(current_tensor_info)
+                result = current_tensor_info + item.get_result()
+                if item.is_ffts:
+                    is_ffts = True
+                    input_result_list, output_result_list = \
+                        self._process_input_and_output(result, input_result_list, output_result_list)
+                RangeManager.adjust_data(result, fusion_op.attr.get_op_sequence())
+                log.print_info_log('[{}] Result: {}'.format(fusion_op.op_name, " ".join(result)))
+                result_list.append(result)
+        else:
+            current_tensor_info = [
+                str(fusion_op.op_id), fusion_op.get_real_op_type(),
+                my_output_op, ConstManager.NAN, ConstManager.NAN,
+                ground_truth_op, ConstManager.NAN, ConstManager.NAN,
+                ConstManager.NAN, ConstManager.NAN
+            ]
+            self._pre_handle_result(current_tensor_info)
+            if self.overflow_detection:
+                # using 'NaN' as an overflow detection for 'no tensor_result'
+                # and insert it after the column 'Shape'.
+                result = current_tensor_info + ['NaN'] + self.algorithm_manager.make_nan_result() \
+                         + [",".join(error_msg)]
+            else:
+                result = current_tensor_info + self.algorithm_manager.make_nan_result() + [",".join(error_msg)]
+            RangeManager.adjust_data(result, fusion_op.attr.get_op_sequence())
+            log.print_info_log('[{}] Result: {}'.format(fusion_op.op_name, " ".join(result)))
+            result_list.append(result)
+        Result = collections.namedtuple("Result", ["result_list", "input_result_list", "output_result_list", "is_ffts"])
+        result = Result(result_list, input_result_list, output_result_list, is_ffts)
+        return result
+    def get_pytorch_result(self: any, op_info: PytorchOpInfo, tensor_result: any, error_msg: list) -> list:
+        """
+        Get fusion op compare result list
+        :param op_info: the pytorch op info
+        :param tensor_result: the tensor result list
+        :param error_msg: error message
+        :return [op_id, my_output_op, ground_truth_op, tensor_id, shape, algorithm_result, error_msg]
+        """
+        result_list = []
+        if tensor_result:
+            for item in tensor_result:
+                result = op_info.get_result() + [item.get_my_output_dtype()] + item.get_result()
+                log.print_info_log('[%s:%d] Result: %s' % (op_info.op_name, op_info.index, " ".join(result)))
+                result_list.append(result)
+        else:
+            result = op_info.get_result() + [ConstManager.NAN] + [ConstManager.NAN] + \
+                     self.algorithm_manager.make_nan_result() + [",".join(error_msg)]
+            log.print_info_log('[%s:%d] Result: %s' % (op_info.op_name, op_info.index, " ".join(result)))
+            result_list.append(result)
+        return result_list
+    def _make_my_output_op_and_ground_truth_op(self: any, fusion_op: FusionOp, no_dump_file: bool) -> (str, str):
+        if self.ground_truth_to_my_output_map:
+            my_output_op, ground_truth_op = fusion_rule_parser. \
+                make_left_and_right_string(self.ground_truth_to_my_output_map)
+        else:
+            my_output_op, ground_truth_op = self._make_ops_without_map(fusion_op, no_dump_file)
+        return my_output_op, ground_truth_op
+    def _pre_handle_result(self: any, current_tensor_info: list) -> None:
+        """
+        if dump data is not NPU data, the result will be popped.
+        the index of my dump data address is 3, the index of ground truth data address is 6.
+        args: result list
+        """
+        if self.is_ground_truth_gpu_or_cpu:
+            # op id is inserted as index in header, so address index should plus one.
+            current_tensor_info.pop(ConstManager.GROUND_TRUTH_ADDRESS_INDEX + 1)
+        if self.is_my_dump_gpu_or_cpu:
+            current_tensor_info.pop(ConstManager.MY_OUTPUT_ADDRESS_INDEX + 1)
+def get_result_title(algorithm_manager: AlgorithmManager, op_header: list, overflow_detection: bool = False) -> list:
+    """
+    Get result title
+    :param algorithm_manager: the algorithm manager
+    :param op_header: the op header
+    :param overflow_detection: whether to display overflow info
+    :return  [Index, op_header, shape, algorithm_result, error_msg]
+    """
+    header = ['Index'] + op_header + ['Shape'] + algorithm_manager.get_result_title() + ["CompareFailReason"]
+    # add 'OverFlow' after 'Shape'.
+    if overflow_detection:
+        header.insert(header.index('Shape') + 1, 'OverFlow')
+    RangeManager.adjust_header(header)
+    return header
+class SingleOpCmpResult:
+    """
+    The class for single op result
+    """
+    def __init__(self: any) -> None:
+        self.op_name = ""
+        self.dump_match = False
+        self.result_list = None
+        self.ret = 0
+        self.input_list = None
+        self.input_result_list = None
+        self.output_result_list = None
+        self.is_ffts = False
+        self.op_name_origin_output_index_map = None
+        self.npu_vs_npu = False
+    @staticmethod
+    def get_pre_op_output(op_name: str, index: int, result_mapping: dict) -> list:
+        pre_op_result = result_mapping.get(op_name)
+        if pre_op_result:
+            output_result = pre_op_result.output_result_list[index]
+        else:
+            output_result = None
+            message = "The result of '%s' is not in result mapping" % op_name
+            log.print_warn_log(message)
+        return output_result
+    def update_attr(self: any, result_info: collections.namedtuple) -> None:
+        self.op_name = result_info.op_name
+        self.dump_match = result_info.dump_match
+        self.result_list = result_info.result_list
+        self.ret = result_info.ret
+        self.input_list = result_info.input_list
+        self.input_result_list = result_info.input_result_list
+        self.output_result_list = result_info.output_result_list
+        self.is_ffts = result_info.is_ffts
+        self.op_name_origin_output_index_map = result_info.op_name_origin_output_index_map
+        self.npu_vs_npu = result_info.npu_vs_npu
+    def check_result_list_valid(self: any) -> None:
+        if len(self.result_list) < len(self.input_result_list):
+            message = "The length of input result list is greater than result list, '%s'" % self.op_name
+            log.print_error_log(message)
+            raise CompareError(CompareError.MSACCUCMP_INVALID_INPUT_MAPPING)
+    def find_pre_op(self: any, result_mapping: dict) -> None:
+        """
+        Replace the input of the current operator with the previous output result
+        """
+        self.check_result_list_valid()
+        for index, input_result in enumerate(self.input_result_list):
+            if len(input_result) <= ConstManager.TENSOR_INDEX:
+                log.print_warn_log(f"Broken result, id {index}, skip")
+                continue
+            tensor_id = input_result[ConstManager.TENSOR_INDEX]
+            pre_op = self.op_name_origin_output_index_map.get(tensor_id)
+            if not pre_op or len(pre_op) < 2:
+                message = "The tensor index '%s' is invalid, no input mapping information" % tensor_id
+                log.print_error_log(message)
+                raise CompareError(CompareError.MSACCUCMP_INVALID_INPUT_MAPPING)
+            pre_op_name = pre_op[0]
+            pre_op_index = pre_op[1]
+            output_result = self.get_pre_op_output(pre_op_name, pre_op_index, result_mapping)
+            if not output_result:
+                continue
+            origin_result = self.result_list[index][:ConstManager.TENSOR_INDEX + 1]
+            self.result_list[index] = origin_result + output_result[ConstManager.TENSOR_INDEX + 1:]

mindstudio-probe 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

mindstudio-probe 8.3.2py3-none-any.whl → 26.0.0a1py3-none-any.whl