PyPI - mindstudio-probe - Versions diffs - 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl - Mend

mindstudio-probe 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (689) hide show

{mindstudio_probe-8.3.2.dist-info → mindstudio_probe-26.0.0a1.dist-info}/METADATA +26 -14
mindstudio_probe-26.0.0a1.dist-info/RECORD +498 -0
{mindstudio_probe-8.3.2.dist-info → mindstudio_probe-26.0.0a1.dist-info}/WHEEL +1 -1
mindstudio_probe-26.0.0a1.dist-info/entry_points.txt +5 -0
mindstudio_probe-26.0.0a1.dist-info/licenses/LICENSE +124 -0
mindstudio_probe-26.0.0a1.dist-info/top_level.txt +2 -0
msprobe/__init__.py +12 -13
msprobe/config.json +9 -31
msprobe/core/__init__.py +12 -11
msprobe/core/acc_check/acc_check_cli.py +145 -0
msprobe/core/common/const.py +97 -38
msprobe/core/common/db_manager.py +133 -12
msprobe/core/common/decorator.py +12 -11
msprobe/core/common/exceptions.py +12 -11
msprobe/core/common/file_utils.py +101 -25
msprobe/core/common/framework_adapter.py +36 -25
msprobe/core/common/global_lock.py +12 -11
msprobe/core/common/inplace_op_checker.py +12 -11
msprobe/core/common/log.py +22 -11
msprobe/core/common/megatron_utils.py +566 -11
msprobe/core/common/parallel_state.py +12 -11
msprobe/core/common/runtime.py +12 -11
msprobe/core/common/utils.py +41 -41
msprobe/core/compare/acc_compare.py +361 -104
msprobe/core/compare/atb_data_compare.py +422 -0
msprobe/core/compare/auto_compare.py +134 -0
msprobe/core/compare/check.py +14 -17
msprobe/core/compare/compare_cli.py +72 -149
msprobe/core/compare/config.py +12 -13
msprobe/core/compare/diff_analyze/first_diff_analyze.py +28 -15
msprobe/core/compare/diff_analyze/ignore_op_list.yaml +3 -0
msprobe/core/compare/find_first/analyzer.py +18 -18
msprobe/core/compare/find_first/graph.py +12 -11
msprobe/core/compare/find_first/utils.py +13 -12
msprobe/core/compare/indicator_analysis/__init__.py +15 -0
msprobe/core/compare/indicator_analysis/algorithm.py +363 -0
msprobe/core/compare/indicator_analysis/api_data.py +141 -0
msprobe/core/compare/indicator_analysis/calculator.py +181 -0
msprobe/core/compare/indicator_analysis/utils.py +116 -0
msprobe/core/compare/layer_mapping/__init__.py +12 -11
msprobe/core/compare/layer_mapping/data_scope_parser.py +20 -11
msprobe/core/compare/layer_mapping/layer_mapping.py +14 -13
msprobe/core/compare/layer_mapping/postprocess_pass.py +13 -11
msprobe/core/compare/merge_result/merge_result.py +12 -11
msprobe/core/compare/merge_result/merge_result_cli.py +12 -11
msprobe/core/compare/merge_result/utils.py +12 -11
msprobe/core/compare/multiprocessing_compute.py +13 -14
msprobe/core/compare/npy_compare.py +13 -11
msprobe/core/compare/offline_data_compare.py +160 -0
msprobe/core/compare/stats_diff_calc.py +39 -0
msprobe/core/compare/torchair_acc_cmp.py +764 -0
msprobe/core/compare/torchair_cmp_utils.py +338 -0
msprobe/core/compare/utils.py +140 -49
msprobe/core/config_check/__init__.py +12 -11
msprobe/core/config_check/checkers/__init__.py +12 -11
msprobe/core/config_check/checkers/base_checker.py +15 -14
msprobe/core/config_check/checkers/dataset_checker.py +13 -12
msprobe/core/config_check/checkers/env_args_checker.py +13 -12
msprobe/core/config_check/checkers/hyperparameter_checker.py +16 -15
msprobe/core/config_check/checkers/pip_checker.py +15 -15
msprobe/core/config_check/checkers/random_checker.py +13 -12
msprobe/core/config_check/checkers/weights_checker.py +14 -12
msprobe/core/config_check/ckpt_compare/ckpt_comparator.py +13 -17
msprobe/core/config_check/ckpt_compare/megatron_loader.py +13 -12
msprobe/core/config_check/ckpt_compare/metrics.py +12 -11
msprobe/core/config_check/config_check_cli.py +18 -17
msprobe/core/config_check/config_checker.py +16 -14
msprobe/core/config_check/resource/dependency.yaml +15 -12
msprobe/core/config_check/resource/env.yaml +12 -11
msprobe/core/config_check/utils/hyperparameter_parser.py +12 -11
msprobe/core/config_check/utils/utils.py +12 -11
msprobe/core/{data_dump → dump/api_dump}/api_registry.py +12 -11
msprobe/core/{common_config.py → dump/common_config.py} +13 -24
msprobe/core/dump/data_dump/data_collector.py +257 -0
msprobe/core/{data_dump → dump/data_dump}/data_processor/base.py +45 -36
msprobe/core/{data_dump → dump/data_dump}/data_processor/factory.py +33 -25
msprobe/core/{data_dump → dump/data_dump}/data_processor/mindspore_processor.py +37 -113
msprobe/core/{data_dump → dump/data_dump}/data_processor/pytorch_processor.py +364 -131
msprobe/core/{data_dump → dump/data_dump}/json_writer.py +24 -31
msprobe/core/{data_dump → dump/data_dump}/scope.py +12 -13
msprobe/core/{debugger → dump/debugger}/precision_debugger.py +15 -23
msprobe/core/dump/dump2db/db_utils.py +215 -0
msprobe/core/dump/dump2db/dump2db.py +409 -0
msprobe/core/{hook_manager.py → dump/hook_manager.py} +38 -87
msprobe/core/dump/kernel_dump/kernel_config.py +34 -0
msprobe/core/{service.py → dump/service.py} +43 -27
msprobe/core/install_deps/install_deps.py +51 -0
msprobe/core/monitor/anomaly_processor.py +13 -11
msprobe/core/monitor/csv2db.py +73 -93
msprobe/core/monitor/db_utils.py +140 -205
msprobe/core/monitor/utils.py +18 -17
msprobe/core/monitor_v2/__init__.py +20 -0
msprobe/core/monitor_v2/base.py +83 -0
msprobe/core/monitor_v2/cc.py +287 -0
msprobe/core/monitor_v2/factory.py +81 -0
msprobe/core/monitor_v2/module.py +201 -0
msprobe/core/monitor_v2/optimizer.py +245 -0
msprobe/core/monitor_v2/param.py +154 -0
msprobe/core/monitor_v2/trainer.py +326 -0
msprobe/core/monitor_v2/utils.py +122 -0
msprobe/core/monitor_v2/weight_grad.py +419 -0
msprobe/core/monitor_v2/writer.py +162 -0
msprobe/core/overflow_check/abnormal_scene.py +12 -11
msprobe/core/overflow_check/api_info.py +12 -11
msprobe/core/overflow_check/checker.py +12 -11
msprobe/core/overflow_check/filter.py +13 -11
msprobe/core/overflow_check/level.py +12 -11
msprobe/core/overflow_check/utils.py +12 -11
msprobe/core/single_save/single_comparator.py +12 -11
msprobe/core/single_save/single_saver.py +12 -11
msprobe/infer/__init__.py +16 -0
msprobe/infer/offline/__init__.py +16 -0
msprobe/infer/offline/compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/args_adapter.py +46 -0
msprobe/infer/offline/compare/msquickcmp/atc/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/atc/atc_utils.py +98 -0
msprobe/infer/offline/compare/msquickcmp/cmp_process.py +328 -0
msprobe/infer/offline/compare/msquickcmp/common/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/common/args_check.py +112 -0
msprobe/infer/offline/compare/msquickcmp/common/convert.py +74 -0
msprobe/infer/offline/compare/msquickcmp/common/dump_data.py +121 -0
msprobe/infer/offline/compare/msquickcmp/common/dynamic_argument_bean.py +39 -0
msprobe/infer/offline/compare/msquickcmp/common/utils.py +669 -0
msprobe/infer/offline/compare/msquickcmp/config.ini +6 -0
msprobe/infer/offline/compare/msquickcmp/dump/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/dump/args_adapter.py +50 -0
msprobe/infer/offline/compare/msquickcmp/dump/dump_process.py +91 -0
msprobe/infer/offline/compare/msquickcmp/install_aclruntime_aisbench.sh +180 -0
msprobe/infer/offline/compare/msquickcmp/main.py +199 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/net_compare.py +277 -0
msprobe/infer/offline/compare/msquickcmp/npu/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/npu/npu_dump_data.py +558 -0
msprobe/infer/offline/compare/msquickcmp/npu/om_parser.py +416 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/onnx_dump_data.py +374 -0
msprobe/infer/utils/__init__.py +15 -0
msprobe/infer/utils/acc_cmp.py +94 -0
msprobe/infer/utils/check/__init__.py +37 -0
msprobe/infer/utils/check/args_checker.py +35 -0
msprobe/infer/utils/check/checker.py +227 -0
msprobe/infer/utils/check/dict_checker.py +78 -0
msprobe/infer/utils/check/func_wrapper.py +96 -0
msprobe/infer/utils/check/list_checker.py +56 -0
msprobe/infer/utils/check/number_checker.py +64 -0
msprobe/infer/utils/check/obj_checker.py +41 -0
msprobe/infer/utils/check/path_checker.py +249 -0
msprobe/infer/utils/check/rule.py +126 -0
msprobe/infer/utils/check/string_checker.py +66 -0
msprobe/infer/utils/cmp_algorithm.py +261 -0
msprobe/infer/utils/constants.py +112 -0
msprobe/infer/utils/file_open_check.py +337 -0
msprobe/infer/utils/util.py +177 -0
msprobe/mindspore/__init__.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_info.py +12 -11
msprobe/mindspore/api_accuracy_checker/api_runner.py +12 -11
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/flash_attention_score.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/fusion_operator.py +12 -11
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +12 -11
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +15 -14
msprobe/mindspore/api_accuracy_checker/compute_element.py +12 -11
msprobe/mindspore/api_accuracy_checker/data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/main.py +12 -11
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +14 -12
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/torch_mindtorch_importer.py +12 -11
msprobe/mindspore/api_accuracy_checker/type_mapping.py +12 -11
msprobe/mindspore/api_accuracy_checker/utils.py +12 -11
msprobe/mindspore/common/const.py +15 -74
msprobe/mindspore/common/log.py +12 -11
msprobe/mindspore/common/utils.py +30 -15
msprobe/mindspore/compare/common_dir_compare.py +21 -23
msprobe/mindspore/compare/distributed_compare.py +18 -16
msprobe/mindspore/compare/ms_compare.py +14 -14
msprobe/mindspore/compare/ms_graph_compare.py +26 -20
msprobe/mindspore/compare/utils.py +14 -12
msprobe/mindspore/{cell_processor.py → dump/cell_processor.py} +15 -14
msprobe/mindspore/{debugger → dump/debugger}/debugger_config.py +12 -30
msprobe/mindspore/{debugger → dump/debugger}/precision_debugger.py +43 -45
msprobe/mindspore/dump/{cell_dump_process.py → dump_processor/cell_dump_process.py} +31 -17
msprobe/mindspore/dump/{cell_dump_with_insert_gradient.py → dump_processor/cell_dump_with_insert_gradient.py} +18 -14
msprobe/mindspore/dump/{dump_tool_factory.py → dump_processor/dump_tool_factory.py} +16 -15
msprobe/mindspore/dump/{graph_mode_cell_dump.py → dump_processor/graph_mode_cell_dump.py} +16 -15
msprobe/mindspore/dump/{graph_tensor_dump.py → dump_processor/graph_tensor_dump.py} +134 -133
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/api_register.py +15 -14
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/hook_cell.py +12 -11
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/ms_hook_manager.py +47 -20
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/primitive_hooks.py +14 -13
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/support_wrap_ops.yaml +13 -11
msprobe/mindspore/dump/{jit_dump.py → dump_processor/jit_dump.py} +14 -13
msprobe/mindspore/dump/{kernel_graph_dump.py → dump_processor/kernel_graph_dump.py} +13 -12
msprobe/mindspore/dump/{kernel_kbyk_dump.py → dump_processor/kernel_kbyk_dump.py} +13 -12
msprobe/mindspore/{exception_dump → dump/exception_dump}/exception_dump_tool_factory.py +14 -13
msprobe/mindspore/{exception_dump → dump/exception_dump}/kernel_graph_exception_dump.py +13 -12
msprobe/mindspore/{mindspore_service.py → dump/mindspore_service.py} +18 -17
msprobe/mindspore/dump/mindtorch/__init__.py +19 -0
msprobe/mindspore/dump/ms_config.py +105 -0
msprobe/mindspore/{overflow_check → dump/overflow_check}/kernel_graph_overflow_check.py +13 -12
msprobe/mindspore/{overflow_check → dump/overflow_check}/overflow_check_tool_factory.py +14 -13
msprobe/mindspore/dump/task_handler_factory.py +43 -0
msprobe/mindspore/monitor/common_func.py +12 -11
msprobe/mindspore/monitor/data_writers.py +12 -11
msprobe/mindspore/monitor/distributed/wrap_distributed.py +93 -39
msprobe/mindspore/monitor/features.py +12 -11
msprobe/mindspore/monitor/module_hook.py +19 -22
msprobe/mindspore/monitor/optimizer_collect.py +29 -25
msprobe/mindspore/monitor/utils.py +13 -11
msprobe/msaccucmp/advisor/__init__.py +16 -0
msprobe/msaccucmp/advisor/advisor_const.py +65 -0
msprobe/msaccucmp/advisor/advisor_result.py +73 -0
msprobe/msaccucmp/advisor/compare_advisor.py +99 -0
msprobe/msaccucmp/advisor/input_advisor.py +66 -0
msprobe/msaccucmp/advisor/node_advisor.py +68 -0
msprobe/msaccucmp/advisor/overflow_advisor.py +58 -0
msprobe/msaccucmp/algorithm_manager/__init__.py +16 -0
msprobe/msaccucmp/algorithm_manager/algorithm_manager.py +464 -0
msprobe/msaccucmp/algorithm_manager/algorithm_parameter.py +42 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_AccumulatedRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_CosineSimilarity.py +58 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_KullbackLeiblerDivergence.py +84 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RelativeEuclideanDistance.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RootMeanSquareError.py +40 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_StandardDeviation.py +47 -0
msprobe/msaccucmp/cmp_utils/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/common.py +113 -0
msprobe/msaccucmp/cmp_utils/constant/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/constant/compare_error.py +81 -0
msprobe/msaccucmp/cmp_utils/constant/const_manager.py +530 -0
msprobe/msaccucmp/cmp_utils/file_utils.py +497 -0
msprobe/msaccucmp/cmp_utils/log.py +257 -0
msprobe/msaccucmp/cmp_utils/multi_process/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/multi_process/multi_convert_process.py +140 -0
msprobe/msaccucmp/cmp_utils/multi_process/progress.py +78 -0
msprobe/msaccucmp/cmp_utils/path_check.py +274 -0
msprobe/msaccucmp/cmp_utils/reg_manager.py +98 -0
msprobe/msaccucmp/cmp_utils/tlv_parse.py +279 -0
msprobe/msaccucmp/cmp_utils/utils.py +356 -0
msprobe/msaccucmp/cmp_utils/utils_type.py +63 -0
msprobe/msaccucmp/compare_vector.py +48 -0
msprobe/msaccucmp/conversion/__init__.py +16 -0
msprobe/msaccucmp/conversion/data_conversion.py +277 -0
msprobe/msaccucmp/conversion/dtype_conversion.py +99 -0
msprobe/msaccucmp/conversion/shape_format_conversion.py +477 -0
msprobe/msaccucmp/conversion/tensor_conversion.py +369 -0
msprobe/msaccucmp/dump_data_conversion.py +46 -0
msprobe/msaccucmp/dump_parse/__init__.py +16 -0
msprobe/msaccucmp/dump_parse/big_dump_data.py +317 -0
msprobe/msaccucmp/dump_parse/dump.py +423 -0
msprobe/msaccucmp/dump_parse/dump_data_object.py +322 -0
msprobe/msaccucmp/dump_parse/dump_data_parser.py +436 -0
msprobe/msaccucmp/dump_parse/dump_utils.py +246 -0
msprobe/msaccucmp/dump_parse/ffts_parser.py +137 -0
msprobe/msaccucmp/dump_parse/mapping.py +62 -0
msprobe/msaccucmp/dump_parse/nano_dump_data.py +392 -0
msprobe/msaccucmp/dump_parse/proto_dump_data.py +308 -0
msprobe/msaccucmp/dump_parser.py +90 -0
msprobe/msaccucmp/format_manager/__init__.py +16 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NCHW.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_ND.py +52 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NHWC.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_HWCN.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_NCHW.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_FRACTAL_Z.py +89 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_HWCN.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NCHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NHWC.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_NCDHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_ND.py +44 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_HWCN.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/format_manager.py +307 -0
msprobe/msaccucmp/inplace_layer_process.py +186 -0
msprobe/msaccucmp/msaccucmp.py +532 -0
msprobe/msaccucmp/mscmp_advisor.py +128 -0
msprobe/msaccucmp/overflow/__init__.py +16 -0
msprobe/msaccucmp/overflow/overflow_analyse.py +305 -0
msprobe/msaccucmp/overflow/overflow_detection.py +143 -0
msprobe/msaccucmp/pytorch_cmp/__init__.py +16 -0
msprobe/msaccucmp/pytorch_cmp/compare_pytorch.py +389 -0
msprobe/msaccucmp/pytorch_cmp/hdf5_parser.py +377 -0
msprobe/msaccucmp/pytorch_cmp/pytorch_dump_data.py +461 -0
msprobe/msaccucmp/shape_conversion.py +41 -0
msprobe/msaccucmp/vector_cmp/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/batch_compare.py +197 -0
msprobe/msaccucmp/vector_cmp/compare_detail/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/compare_detail/compare_detail.py +245 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail.py +182 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail_writer.py +580 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_fusion_op.py +588 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_npu_vs_npu.py +339 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_result.py +326 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_rule.py +156 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_op.py +204 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_rule_parser.py +635 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/quant_filter.py +187 -0
msprobe/msaccucmp/vector_cmp/range_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_manager.py +100 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_mode.py +94 -0
msprobe/msaccucmp/vector_cmp/range_manager/select_mode.py +86 -0
msprobe/msaccucmp/vector_cmp/vector_comparison.py +535 -0
msprobe/msprobe.py +101 -130
msprobe/overflow_check/__init__.py +15 -0
msprobe/{nan_analyze → overflow_check}/analyzer.py +38 -27
msprobe/{nan_analyze → overflow_check}/graph.py +30 -27
msprobe/{nan_analyze → overflow_check}/utils.py +15 -14
msprobe/pytorch/__init__.py +20 -14
msprobe/pytorch/aclgraph_dump/__init__.py +45 -0
msprobe/pytorch/aclgraph_dump/_meta.py +26 -0
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut.py → acc_check/acc_check.py} +50 -45
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut_utils.py → acc_check/acc_check_utils.py} +201 -30
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/data_generate.py +56 -16
msprobe/pytorch/api_accuracy_checker/{run_ut/multi_run_ut.py → acc_check/multi_acc_check.py} +32 -47
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/run_overflow_check.py +19 -18
msprobe/pytorch/api_accuracy_checker/common/config.py +22 -20
msprobe/pytorch/api_accuracy_checker/common/utils.py +72 -13
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +41 -11
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +23 -14
msprobe/pytorch/api_accuracy_checker/compare/compare.py +45 -32
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +12 -11
msprobe/pytorch/api_accuracy_checker/compare/compare_input.py +14 -12
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +14 -12
msprobe/pytorch/api_accuracy_checker/precision_standard/absolute_threshold.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/accumulative_error_compare.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/base_standard.py +21 -19
msprobe/pytorch/api_accuracy_checker/precision_standard/benchmark_compare.py +14 -13
msprobe/pytorch/api_accuracy_checker/precision_standard/binary_consistency.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_config.py +60 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_register.py +27 -16
msprobe/pytorch/api_accuracy_checker/precision_standard/thousandth_standard.py +13 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/ulp_compare.py +39 -18
msprobe/pytorch/bench_functions/__init__.py +12 -11
msprobe/pytorch/bench_functions/apply_adam.py +12 -11
msprobe/pytorch/bench_functions/apply_adam_w.py +12 -11
msprobe/pytorch/bench_functions/confusion_transpose.py +12 -11
msprobe/pytorch/bench_functions/fast_gelu.py +12 -11
msprobe/pytorch/bench_functions/group_norm_silu.py +12 -11
msprobe/pytorch/bench_functions/layer_norm_eval.py +12 -11
msprobe/pytorch/bench_functions/linear.py +12 -11
msprobe/pytorch/bench_functions/matmul_backward.py +12 -11
msprobe/pytorch/bench_functions/mish.py +12 -11
msprobe/pytorch/bench_functions/moe_gating_top_k_softmax.py +12 -11
msprobe/pytorch/bench_functions/npu_fusion_attention.py +12 -11
msprobe/pytorch/bench_functions/rms_norm.py +12 -11
msprobe/pytorch/bench_functions/rotary_mul.py +12 -11
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +12 -11
msprobe/pytorch/bench_functions/sort_v2.py +12 -11
msprobe/pytorch/bench_functions/swiglu.py +12 -11
msprobe/pytorch/common/__init__.py +12 -11
msprobe/pytorch/common/log.py +12 -11
msprobe/pytorch/common/parse_json.py +12 -11
msprobe/pytorch/common/utils.py +52 -19
msprobe/pytorch/compare/distributed_compare.py +13 -13
msprobe/pytorch/compare/match.py +12 -11
msprobe/pytorch/compare/pt_compare.py +14 -20
msprobe/pytorch/compare/pt_diff_analyze.py +12 -11
msprobe/pytorch/compare/utils.py +12 -11
msprobe/pytorch/{hook_module → dump/api_dump}/api_register.py +18 -16
msprobe/pytorch/{hook_module → dump/api_dump}/hook_module.py +14 -13
msprobe/pytorch/{hook_module → dump/api_dump}/pt_hook_manager.py +68 -23
msprobe/pytorch/{hook_module → dump/api_dump}/register_optimizer_hook.py +13 -11
msprobe/pytorch/{hook_module → dump/api_dump}/script_wrapper.py +17 -14
msprobe/pytorch/{hook_module → dump/api_dump}/utils.py +12 -11
msprobe/pytorch/{debugger → dump/debugger}/debugger_config.py +23 -38
msprobe/pytorch/dump/debugger/precision_debugger.py +130 -0
msprobe/pytorch/{function_factory.py → dump/function_factory.py} +12 -11
msprobe/pytorch/dump/module_dump/hook_wrapper.py +17 -13
msprobe/pytorch/dump/module_dump/module_dump.py +16 -15
msprobe/pytorch/dump/module_dump/{module_processer.py → module_processor.py} +54 -42
msprobe/pytorch/dump/pt_config.py +128 -0
msprobe/pytorch/{pytorch_service.py → dump/pytorch_service.py} +22 -21
msprobe/pytorch/monitor/csv2tb.py +13 -11
msprobe/pytorch/monitor/data_writers.py +13 -11
msprobe/pytorch/monitor/distributed/wrap_distributed.py +13 -11
msprobe/pytorch/monitor/features.py +12 -11
msprobe/pytorch/monitor/module_hook.py +67 -59
msprobe/pytorch/monitor/module_metric.py +13 -11
msprobe/pytorch/monitor/optimizer_collect.py +37 -35
msprobe/pytorch/monitor/utils.py +13 -11
msprobe/pytorch/monitor/visualizer.py +12 -11
msprobe/pytorch/torchair_dump/__init__.py +17 -0
msprobe/pytorch/torchair_dump/torchair_dump.py +114 -0
msprobe/scripts/atb/config_example.json +10 -0
msprobe/scripts/atb/load_atb_probe.sh +101 -0
msprobe/scripts/atb/unload_atb_probe.sh +27 -0
msprobe/scripts/build_msaccucmp.sh +186 -0
msprobe/scripts/conf/help.info +6 -0
msprobe/scripts/conf/version.info +3 -0
msprobe/scripts/run_script/common.sh +538 -0
msprobe/scripts/run_script/main_msaccucmp.sh +232 -0
msprobe/visualization/__init__.py +12 -11
msprobe/visualization/builder/__init__.py +12 -11
msprobe/visualization/builder/graph_builder.py +45 -30
msprobe/visualization/builder/graph_merger.py +53 -32
msprobe/visualization/builder/msprobe_adapter.py +34 -44
msprobe/visualization/compare/__init__.py +12 -11
msprobe/visualization/compare/graph_comparator.py +63 -51
msprobe/visualization/compare/mode_adapter.py +28 -113
msprobe/visualization/db_utils.py +133 -22
msprobe/visualization/graph/__init__.py +12 -11
msprobe/visualization/graph/base_node.py +15 -27
msprobe/visualization/graph/distributed_analyzer.py +97 -40
msprobe/visualization/graph/graph.py +14 -16
msprobe/visualization/graph/node_colors.py +34 -31
msprobe/visualization/graph/node_op.py +12 -11
msprobe/visualization/graph_service.py +580 -205
msprobe/visualization/utils.py +278 -31
tb_graph_ascend/secure_build.py +175 -0
tb_graph_ascend/server/__init__.py +15 -0
tb_graph_ascend/server/app/__init__.py +15 -0
tb_graph_ascend/server/app/model/__init__.py +15 -0
tb_graph_ascend/server/app/model/hierarchy.py +348 -0
tb_graph_ascend/server/app/model/layout_hierarchy_model.py +69 -0
tb_graph_ascend/server/app/model/match_nodes_model.py +573 -0
tb_graph_ascend/server/app/repositories/__init__.py +15 -0
tb_graph_ascend/server/app/repositories/graph_repo_base.py +32 -0
tb_graph_ascend/server/app/repositories/graph_repo_db.py +879 -0
tb_graph_ascend/server/app/repositories/graph_repo_vis.py +83 -0
tb_graph_ascend/server/app/service/__init__.py +18 -0
tb_graph_ascend/server/app/service/graph_service_base.py +158 -0
tb_graph_ascend/server/app/service/graph_service_db.py +438 -0
tb_graph_ascend/server/app/service/graph_service_factory.py +54 -0
tb_graph_ascend/server/app/service/graph_service_vis.py +480 -0
tb_graph_ascend/server/app/utils/__init__.py +15 -0
tb_graph_ascend/server/app/utils/constant.py +80 -0
tb_graph_ascend/server/app/utils/file_check_wrapper.py +46 -0
tb_graph_ascend/server/app/utils/global_state.py +95 -0
tb_graph_ascend/server/app/utils/graph_utils.py +661 -0
tb_graph_ascend/server/app/utils/i18n.py +153 -0
tb_graph_ascend/server/app/utils/request_method.py +46 -0
tb_graph_ascend/server/app/views/__init__.py +15 -0
tb_graph_ascend/server/app/views/graph_views.py +304 -0
tb_graph_ascend/server/plugin.py +108 -0
tb_graph_ascend/server/static/index.html +9250 -0
tb_graph_ascend/server/static/index.js +21 -0
tb_graph_ascend/setup.py +57 -0
mindstudio_probe-8.3.2.dist-info/LICENSE +0 -201
mindstudio_probe-8.3.2.dist-info/RECORD +0 -491
mindstudio_probe-8.3.2.dist-info/entry_points.txt +0 -2
mindstudio_probe-8.3.2.dist-info/top_level.txt +0 -1
msprobe/CMakeLists.txt +0 -5
msprobe/README.md +0 -203
msprobe/core/advisor/advisor.py +0 -129
msprobe/core/advisor/advisor_const.py +0 -58
msprobe/core/advisor/advisor_result.py +0 -58
msprobe/core/compare/find_first/data_processor.py +0 -35
msprobe/core/compare/highlight.py +0 -390
msprobe/core/data_dump/data_collector.py +0 -356
msprobe/core/grad_probe/constant.py +0 -90
msprobe/core/grad_probe/grad_compare.py +0 -187
msprobe/core/grad_probe/utils.py +0 -105
msprobe/core/kernel_dump/kernel_config.py +0 -33
msprobe/docs/01.installation.md +0 -250
msprobe/docs/02.config_introduction.md +0 -221
msprobe/docs/03.config_examples.md +0 -281
msprobe/docs/04.kernel_dump_PyTorch.md +0 -73
msprobe/docs/05.data_dump_PyTorch.md +0 -518
msprobe/docs/06.data_dump_MindSpore.md +0 -618
msprobe/docs/07.accuracy_checker_PyTorch.md +0 -310
msprobe/docs/09.accuracy_checker_MindSpore.md +0 -120
msprobe/docs/10.accuracy_compare_PyTorch.md +0 -637
msprobe/docs/11.accuracy_compare_MindSpore.md +0 -769
msprobe/docs/12.overflow_check_PyTorch.md +0 -82
msprobe/docs/13.overflow_check_MindSpore.md +0 -33
msprobe/docs/14.data_parse_PyTorch.md +0 -282
msprobe/docs/15.free_benchmarking_PyTorch.md +0 -169
msprobe/docs/16.free_benchmarking_MindSpore.md +0 -159
msprobe/docs/17.grad_probe.md +0 -205
msprobe/docs/18.online_dispatch.md +0 -89
msprobe/docs/19.monitor.md +0 -753
msprobe/docs/20.monitor_performance_baseline.md +0 -52
msprobe/docs/21.visualization_PyTorch.md +0 -519
msprobe/docs/22.visualization_MindSpore.md +0 -515
msprobe/docs/23.generate_operator_PyTorch.md +0 -107
msprobe/docs/24.code_mapping_Mindspore.md +0 -29
msprobe/docs/25.tool_function_introduction.md +0 -29
msprobe/docs/26.data_dump_PyTorch_baseline.md +0 -48
msprobe/docs/27.dump_json_instruction.md +0 -795
msprobe/docs/28.debugger_save_instruction.md +0 -288
msprobe/docs/28.kernel_dump_MindSpore.md +0 -69
msprobe/docs/29.data_dump_MSAdapter.md +0 -235
msprobe/docs/30.overflow_check_MSAdapter.md +0 -31
msprobe/docs/31.config_check.md +0 -107
msprobe/docs/32.ckpt_compare.md +0 -69
msprobe/docs/33.generate_operator_MindSpore.md +0 -181
msprobe/docs/34.RL_collect.md +0 -101
msprobe/docs/35.nan_analyze.md +0 -73
msprobe/docs/36.calculation_result_change.md +0 -75
msprobe/docs/FAQ.md +0 -232
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +0 -146
msprobe/docs/accuracy_checker_MindSpore/accuracy_checker_MindSpore_baseline.md +0 -14
msprobe/docs/data_dump_MindSpore/data_dump_MindSpore_baseline.md +0 -33
msprobe/docs/data_dump_MindSpore/dynamic_graph_quick_start_example.md +0 -217
msprobe/docs/img/BLOOM-7B_1.png +0 -0
msprobe/docs/img/BLOOM-7B_2.png +0 -0
msprobe/docs/img/BLOOM-7B_3.png +0 -0
msprobe/docs/img/BLOOM-7B_4.png +0 -0
msprobe/docs/img/GPT-3_1.png +0 -0
msprobe/docs/img/GPT-3_2.png +0 -0
msprobe/docs/img/GPT-3_3.png +0 -0
msprobe/docs/img/GPT-3_4.png +0 -0
msprobe/docs/img/GPT-3_5.png +0 -0
msprobe/docs/img/GPT-3_6.png +0 -0
msprobe/docs/img/GPT-3_7.png +0 -0
msprobe/docs/img/GPT-3_8.png +0 -0
msprobe/docs/img/YOLOV5S_1.png +0 -0
msprobe/docs/img/YOLOV5S_2.png +0 -0
msprobe/docs/img/accuracy_checking_details.png +0 -0
msprobe/docs/img/accuracy_checking_result.png +0 -0
msprobe/docs/img/api_precision_compare_details.png +0 -0
msprobe/docs/img/api_precision_compare_result.png +0 -0
msprobe/docs/img/auto_analyze_log.png +0 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/compare_result_pkl.png +0 -0
msprobe/docs/img/compare_result_pkl_md5.png.png +0 -0
msprobe/docs/img/cpu_info.png +0 -0
msprobe/docs/img/free_benchmark.png +0 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/grad_probe_image-1.png +0 -0
msprobe/docs/img/grad_probe_image-2.png +0 -0
msprobe/docs/img/grad_probe_image-3.png +0 -0
msprobe/docs/img/grad_probe_image-4.png +0 -0
msprobe/docs/img/grad_probe_image.png +0 -0
msprobe/docs/img/merge_result.png +0 -0
msprobe/docs/img/module_compare.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/docs/img/monitor/step_count_per_record.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/docs/img/save_compare_result_sample.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_ms.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_pt.png +0 -0
msprobe/docs/img/visualization/proxy.png +0 -0
msprobe/docs/img/visualization/tensorboard_1.png +0 -0
msprobe/docs/img/visualization/tensorboard_2.png +0 -0
msprobe/docs/img/visualization/vis_browser_1.png +0 -0
msprobe/docs/img/visualization/vis_browser_2.png +0 -0
msprobe/docs/img/visualization/vis_match_info.png +0 -0
msprobe/docs/img/visualization/vis_precision_info.png +0 -0
msprobe/docs/img/visualization/vis_search_info.png +0 -0
msprobe/docs/img/visualization/vis_show_info.png +0 -0
msprobe/docs/img/visualization/vis_showcase.png +0 -0
msprobe/docs/img/visualization/vis_unmatch_info.png +0 -0
msprobe/docs/visualization/GPTModel.png +0 -0
msprobe/docs/visualization/ParallelMLP.png +0 -0
msprobe/docs/visualization/layer_mapping_example.md +0 -132
msprobe/docs/visualization/mapping.png +0 -0
msprobe/docs/visualization/mapping1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/3.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/4.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/5.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/6.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/7.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory-qwen25vl.txt +0 -59
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed-mm-qwen25vl.txt +0 -80
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactory_mapping.md +0 -330
msprobe/docs/visualization/module_name.png +0 -0
msprobe/docs/visualization/module_name1.png +0 -0
msprobe/docs/visualization/no_mapping.png +0 -0
msprobe/docs/visualization/no_mapping1.png +0 -0
msprobe/docs/visualization/no_mapping_analyze.png +0 -0
msprobe/docs/visualization/top_layer.png +0 -0
msprobe/mindspore/api_accuracy_checker/generate_op_script/op_generator.py +0 -460
msprobe/mindspore/api_accuracy_checker/generate_op_script/operator_replication.template +0 -2081
msprobe/mindspore/code_mapping/bind.py +0 -283
msprobe/mindspore/code_mapping/cmd_parser.py +0 -40
msprobe/mindspore/code_mapping/graph.py +0 -49
msprobe/mindspore/code_mapping/graph_parser.py +0 -211
msprobe/mindspore/code_mapping/main.py +0 -24
msprobe/mindspore/code_mapping/processor.py +0 -34
msprobe/mindspore/dym_loader/hook_dynamic_loader.cpp +0 -111
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +0 -52
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +0 -257
msprobe/mindspore/free_benchmark/common/config.py +0 -27
msprobe/mindspore/free_benchmark/common/handler_params.py +0 -31
msprobe/mindspore/free_benchmark/common/utils.py +0 -100
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -638
msprobe/mindspore/free_benchmark/handler/base_handler.py +0 -105
msprobe/mindspore/free_benchmark/handler/check_handler.py +0 -55
msprobe/mindspore/free_benchmark/handler/fix_handler.py +0 -51
msprobe/mindspore/free_benchmark/handler/handler_factory.py +0 -36
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +0 -82
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +0 -45
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +0 -78
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +0 -77
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +0 -56
msprobe/mindspore/free_benchmark/perturbation/no_change.py +0 -27
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +0 -46
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +0 -51
msprobe/mindspore/grad_probe/global_context.py +0 -127
msprobe/mindspore/grad_probe/grad_analyzer.py +0 -260
msprobe/mindspore/grad_probe/grad_monitor.py +0 -42
msprobe/mindspore/grad_probe/grad_stat_csv.py +0 -161
msprobe/mindspore/grad_probe/hook.py +0 -115
msprobe/mindspore/grad_probe/utils.py +0 -43
msprobe/mindspore/mindtorch/__init__.py +0 -18
msprobe/mindspore/ms_config.py +0 -153
msprobe/mindspore/task_handler_factory.py +0 -44
msprobe/nan_analyze/__init__.py +0 -14
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +0 -9
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +0 -480
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +0 -567
msprobe/pytorch/debugger/precision_debugger.py +0 -181
msprobe/pytorch/free_benchmark/__init__.py +0 -23
msprobe/pytorch/free_benchmark/common/constant.py +0 -85
msprobe/pytorch/free_benchmark/common/counter.py +0 -87
msprobe/pytorch/free_benchmark/common/enums.py +0 -80
msprobe/pytorch/free_benchmark/common/params.py +0 -152
msprobe/pytorch/free_benchmark/common/utils.py +0 -143
msprobe/pytorch/free_benchmark/compare/grad_saver.py +0 -215
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +0 -121
msprobe/pytorch/free_benchmark/main.py +0 -123
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +0 -28
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +0 -56
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +0 -107
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +0 -121
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +0 -89
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +0 -87
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +0 -43
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +0 -60
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +0 -34
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +0 -252
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +0 -54
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +0 -40
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +0 -45
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +0 -181
msprobe/pytorch/grad_probe/__init__.py +0 -0
msprobe/pytorch/grad_probe/grad_monitor.py +0 -108
msprobe/pytorch/grad_probe/grad_stat_csv.py +0 -160
msprobe/pytorch/hook_module/__init__.py +0 -16
msprobe/pytorch/hook_module/wrap_aten.py +0 -111
msprobe/pytorch/online_dispatch/__init__.py +0 -19
msprobe/pytorch/online_dispatch/compare.py +0 -224
msprobe/pytorch/online_dispatch/dispatch.py +0 -332
msprobe/pytorch/online_dispatch/dump_compare.py +0 -179
msprobe/pytorch/online_dispatch/single_compare.py +0 -412
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +0 -58
msprobe/pytorch/online_dispatch/utils.py +0 -158
msprobe/pytorch/parse_tool/__init__.py +0 -0
msprobe/pytorch/parse_tool/cli.py +0 -31
msprobe/pytorch/parse_tool/lib/__init__.py +0 -0
msprobe/pytorch/parse_tool/lib/compare.py +0 -253
msprobe/pytorch/parse_tool/lib/config.py +0 -50
msprobe/pytorch/parse_tool/lib/file_desc.py +0 -45
msprobe/pytorch/parse_tool/lib/interactive_cli.py +0 -97
msprobe/pytorch/parse_tool/lib/parse_exception.py +0 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +0 -161
msprobe/pytorch/parse_tool/lib/utils.py +0 -299
msprobe/pytorch/parse_tool/lib/visualization.py +0 -85
msprobe/pytorch/pt_config.py +0 -299
/msprobe/core/{grad_probe → dump}/__init__.py +0 -0
/msprobe/{mindspore/code_mapping → core/dump/api_dump}/__init__.py +0 -0
/msprobe/{mindspore/debugger → core/dump/data_dump}/__init__.py +0 -0
/msprobe/{mindspore/exception_dump → core/dump/data_dump/data_processor}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark → core/dump/debugger}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark/common → core/dump/kernel_dump}/__init__.py +0 -0
/msprobe/mindspore/{free_benchmark/handler → dump/debugger}/__init__.py +0 -0
/msprobe/mindspore/{grad_probe → dump/dump_processor}/__init__.py +0 -0
/msprobe/mindspore/{overflow_check → dump/exception_dump}/__init__.py +0 -0
/msprobe/mindspore/{mindtorch → dump/mindtorch}/mindtorch_adaptor.py +0 -0
/msprobe/{pytorch/api_accuracy_checker/run_ut → mindspore/dump/overflow_check}/__init__.py +0 -0
/msprobe/{pytorch/debugger → mindspore/monitor}/__init__.py +0 -0
/msprobe/{pytorch/free_benchmark/common → msaccucmp}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/.keep +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers → api_accuracy_checker/acc_check}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/torch_ut_setting.json +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers/npu → dump/api_dump}/__init__.py +0 -0
/msprobe/pytorch/{hook_module → dump/api_dump}/support_wrap_ops.yaml +0 -0
/msprobe/pytorch/{free_benchmark/result_handlers → dump/debugger}/__init__.py +0 -0

msprobe/visualization/graph_service.py CHANGED Viewed

@@ -1,36 +1,43 @@
-# Copyright (c) 2024-2025, Huawei Technologies Co., Ltd.
-# All rights reserved.
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
 #
-# Licensed under the Apache License, Version 2.0  (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
 #
-# http://www.apache.org/licenses/LICENSE-2.0
+#          http://license.coscl.org.cn/MulanPSL2
 #
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
 import os
 import time
+import threading
 from copy import deepcopy
-from multiprocessing import cpu_count, Pool
+from dataclasses import dataclass
+from multiprocessing import cpu_count, Pool, Manager
+from typing import Callable, Optional
+from tqdm import tqdm
 from msprobe.core.common.file_utils import (check_file_type, create_directory, FileChecker,
                                             check_file_or_directory_path, load_json)
 from msprobe.core.common.const import FileCheckConst, Const
 from msprobe.core.common.utils import CompareException, get_dump_mode
 from msprobe.visualization.compare.graph_comparator import GraphComparator
 from msprobe.visualization.utils import GraphConst, check_directory_content, SerializableArgs, load_parallel_param, \
-    sort_rank_number_strings, check_whether_parallel_merge, validate_parallel_param, get_step_or_rank_int
+    sort_rank_number_strings, validate_parallel_param, get_step_or_rank_int, \
+    monitor_progress, ProgressInfo, calculate_list, get_log_msg_wrapper
 from msprobe.visualization.builder.graph_builder import GraphBuilder, GraphExportConfig, GraphInfo, BuildGraphTaskInfo
-from msprobe.core.common.log import logger
+from msprobe.core.common.log import logger, BaseLogger
 from msprobe.visualization.graph.node_colors import NodeColors
 from msprobe.core.compare.layer_mapping import generate_api_mapping_by_layer_mapping
 from msprobe.core.compare.utils import check_and_return_dir_contents
 from msprobe.core.common.utils import detect_framework_by_dump_json
-from msprobe.visualization.graph.distributed_analyzer import DistributedAnalyzer
+from msprobe.visualization.graph.distributed_analyzer import distributed_analyse
 from msprobe.visualization.builder.graph_merger import GraphMerger
 from msprobe.visualization.db_utils import post_process_db
@@ -39,12 +46,12 @@ build_output_db_name = f'build_{current_time}.vis.db'
 compare_output_db_name = f'compare_{current_time}.vis.db'
-def _compare_graph(graph_n: GraphInfo, graph_b: GraphInfo, input_param, args):
+def _compare_graph(graph_n: GraphInfo, graph_b: GraphInfo, input_param, args, pbar_info=None):
     dump_path_param = {
-        'npu_json_path': graph_n.data_path,
-        'bench_json_path': graph_b.data_path,
-        'stack_json_path': graph_n.stack_path,
-        'is_print_compare_log': input_param.get("is_print_compare_log", True)
+        'npu_path': graph_n.data_path,
+        'bench_path': graph_b.data_path,
+        'stack_path': graph_n.stack_path,
+        'is_print_compare_log': input_param.get("is_print_compare_log", False)
     }
     mapping_dict = {}
     if args.layer_mapping:
@@ -61,19 +68,19 @@ def _compare_graph(graph_n: GraphInfo, graph_b: GraphInfo, input_param, args):
         raise CompareException(CompareException.CROSS_FRAME_ERROR)
     graph_comparator = GraphComparator([graph_n.graph, graph_b.graph], dump_path_param, args, is_cross_framework,
-                                       mapping_dict=mapping_dict)
+                                       mapping_dict=mapping_dict, pbar_info=pbar_info)
     graph_comparator.compare()
     return graph_comparator
-def _compare_graph_result(input_param, args):
+def _compare_graph_result(input_param, args, pbar_info=None):
     logger.info('Start building model graphs...')
     # 对两个数据进行构图
-    graph_n = _build_graph_info(input_param.get('npu_path'), args)
-    graph_b = _build_graph_info(input_param.get('bench_path'), args)
+    graph_n = _build_graph_info(input_param.get('npu_path'), args, pbar_info=pbar_info)
+    graph_b = _build_graph_info(input_param.get('bench_path'), args, pbar_info=pbar_info)
     logger.info('Model graphs built successfully, start comparing graphs...')
     # 基于graph、stack和data进行比较
-    graph_comparator = _compare_graph(graph_n, graph_b, input_param, args)
+    graph_comparator = _compare_graph(graph_n, graph_b, input_param, args, pbar_info=pbar_info)
     # 增加micro step标记
     micro_steps = graph_n.graph.paging_by_micro_step(graph_b.graph)
     # 开启溢出检测
@@ -84,7 +91,7 @@ def _compare_graph_result(input_param, args):
     return CompareGraphResult(graph_n.graph, graph_b.graph, graph_comparator, micro_steps)
-def _export_compare_graph_result(args, result):
+def _export_compare_graph_result(args, result, pbar_info=None):
     graphs = [result.graph_n, result.graph_b]
     graph_comparator = result.graph_comparator
     micro_steps = result.micro_steps
@@ -97,7 +104,7 @@ def _export_compare_graph_result(args, result):
                                       args.step_list if hasattr(args, 'step_list') else [0],
                                       args.rank_list if hasattr(args, 'rank_list') else [0])
     try:
-        GraphBuilder.to_db(output_db_path, export_config)
+        GraphBuilder.to_db(output_db_path, export_config, pbar_info=pbar_info)
         logger.info(f'Exporting compare graph result successfully, the result file is saved in {output_db_path}')
         return ''
     except RuntimeError as e:
@@ -105,7 +112,7 @@ def _export_compare_graph_result(args, result):
         return compare_output_db_name
-def _build_graph_info(dump_path, args, graph=None):
+def _build_graph_info(dump_path, args, graph=None, pbar_info=None):
     construct_path = FileChecker(os.path.join(dump_path, GraphConst.CONSTRUCT_FILE), FileCheckConst.FILE,
                                  FileCheckConst.READ_ABLE).common_check()
     data_path = FileChecker(os.path.join(dump_path, GraphConst.DUMP_FILE), FileCheckConst.FILE,
@@ -113,13 +120,13 @@ def _build_graph_info(dump_path, args, graph=None):
     stack_path = FileChecker(os.path.join(dump_path, GraphConst.STACK_FILE), FileCheckConst.FILE,
                              FileCheckConst.READ_ABLE).common_check()
     if not graph:
-        graph = GraphBuilder.build(construct_path, data_path, stack_path)
+        graph = GraphBuilder.build(construct_path, data_path, stack_path, pbar_info=pbar_info)
     return GraphInfo(graph, construct_path, data_path, stack_path)
-def _build_graph_result(dump_path, args):
+def _build_graph_result(dump_path, args, pbar_info=None):
     logger.info('Start building model graphs...')
-    graph = _build_graph_info(dump_path, args).graph
+    graph = _build_graph_info(dump_path, args, pbar_info=pbar_info).graph
     # 增加micro step标记
     micro_steps = graph.paging_by_micro_step()
     # 开启溢出检测
@@ -128,30 +135,39 @@ def _build_graph_result(dump_path, args):
     return BuildGraphResult(graph, micro_steps)
-def _run_build_graph_compare(input_param, args, nr, br):
+def _run_build_graph_compare(input_param, args, nr, br, pbar_info=None):
     logger.info(f'Start building graph for {nr}...')
-    graph_n = _build_graph_info(input_param.get('npu_path'), args)
-    graph_b = _build_graph_info(input_param.get('bench_path'), args)
+    graph_n = _build_graph_info(input_param.get('npu_path'), args, pbar_info=pbar_info)
+    graph_b = _build_graph_info(input_param.get('bench_path'), args, pbar_info=pbar_info)
     logger.info(f'Building graph for {nr} finished.')
     return BuildGraphTaskInfo(graph_n, graph_b, nr, br, current_time)
-def _run_build_graph_single(dump_ranks_path, rank, step, args):
+def _run_build_graph_single(dump_ranks_path, rank, step, args, pbar_info=None):
     logger.info(f'Start building graph for {rank}...')
     dump_path = os.path.join(dump_ranks_path, rank)
-    result = _build_graph_result(dump_path, args)
+    result = _build_graph_result(dump_path, args, pbar_info=pbar_info)
     if rank != Const.RANK:
         result.rank = get_step_or_rank_int(rank, True)
     logger.info(f'Building graph for step: {step}, rank: {rank} finished.')
     return result
-def _run_graph_compare(graph_task_info, input_param, args):
+def _run_build_graph_and_export(dump_ranks_path, rank, step, args, pbar_info=None):
+    result = _run_build_graph_single(dump_ranks_path, rank, step, args, pbar_info)
+    if step is not None:
+        result.step = get_step_or_rank_int(step)
+    create_directory(args.output_path)
+    return _export_build_graph_result(args, result, pbar_info)
+def _run_graph_compare(graph_task_info, input_param, args, pbar_info=None):
     logger.info(f'Start comparing data for {graph_task_info.npu_rank}...')
     graph_n = graph_task_info.graph_info_n
     graph_b = graph_task_info.graph_info_b
     nr = graph_task_info.npu_rank
-    graph_comparator = _compare_graph(graph_n, graph_b, input_param, args)
+    graph_comparator = _compare_graph(graph_n, graph_b, input_param, args, pbar_info=pbar_info)
     micro_steps = graph_n.graph.paging_by_micro_step(graph_b.graph)
     # 开启溢出检测
     if args.overflow_check:
@@ -164,7 +180,7 @@ def _run_graph_compare(graph_task_info, input_param, args):
     return graph_result
-def _export_build_graph_result(args, result):
+def _export_build_graph_result(args, result, pbar_info=None):
     out_path = args.output_path
     graph = result.graph
     micro_steps = result.micro_steps
@@ -175,7 +191,7 @@ def _export_build_graph_result(args, result):
                                step=result.step, rank_list=args.rank_list if hasattr(args, 'rank_list') else [0],
                                step_list=args.step_list if hasattr(args, 'step_list') else [0])
     try:
-        GraphBuilder.to_db(output_db_path, config)
+        GraphBuilder.to_db(output_db_path, config, pbar_info=pbar_info)
         logger.info(f'Model graph exported successfully, the result file is saved in {output_db_path}')
         return None
     except RuntimeError as e:
@@ -189,57 +205,30 @@ def is_real_data_compare(input_param, npu_ranks, bench_ranks):
     has_real_data = False
     for nr, br in zip(npu_ranks, bench_ranks):
         dump_path_param = {
-            'npu_json_path': FileChecker(os.path.join(dump_rank_n, nr, GraphConst.DUMP_FILE), FileCheckConst.FILE,
-                                         FileCheckConst.READ_ABLE).common_check(),
-            'bench_json_path': FileChecker(os.path.join(dump_rank_b, br, GraphConst.DUMP_FILE), FileCheckConst.FILE,
-                                           FileCheckConst.READ_ABLE).common_check()
+            'npu_path': FileChecker(os.path.join(dump_rank_n, nr, GraphConst.DUMP_FILE), FileCheckConst.FILE,
+                                    FileCheckConst.READ_ABLE).common_check(),
+            'bench_path': FileChecker(os.path.join(dump_rank_b, br, GraphConst.DUMP_FILE), FileCheckConst.FILE,
+                                      FileCheckConst.READ_ABLE).common_check()
         }
         has_real_data |= get_dump_mode(dump_path_param) == Const.ALL
     return has_real_data
-def _mp_compare(input_param, serializable_args, nr, br):
-    graph_task_info = _run_build_graph_compare(input_param, serializable_args, nr, br)
-    return _run_graph_compare(graph_task_info, input_param, serializable_args)
-def _compare_graph_ranks(input_param, args, step=None):
-    with Pool(processes=max(int((cpu_count() + 1) // 4), 1)) as pool:
-        def err_call(err):
-            logger.error(f'Error occurred while comparing graph ranks: {err}')
-            try:
-                pool.close()
-            except OSError as e:
-                logger.error(f'Error occurred while terminating the pool: {e}')
-        serializable_args = SerializableArgs(args)
-        # 暂存所有rank的graph，用于匹配rank间的分布式节点
-        compare_graph_results = _get_compare_graph_results(input_param, serializable_args, step, pool, err_call)
+def _mp_compare(input_param, serializable_args, nr, br, pbar_info=None):
+    graph_task_info = _run_build_graph_compare(input_param, serializable_args, nr, br, pbar_info=pbar_info)
+    return _run_graph_compare(graph_task_info, input_param, serializable_args, pbar_info=pbar_info)
-        serializable_args.rank_list = [result.rank for result in compare_graph_results]
-        # 匹配rank间的分布式节点
-        if len(compare_graph_results) > 1:
-            DistributedAnalyzer({obj.rank: obj.graph_n for obj in compare_graph_results},
-                                args.overflow_check).distributed_match()
-            DistributedAnalyzer({obj.rank: obj.graph_b for obj in compare_graph_results},
-                                args.overflow_check).distributed_match()
+def _mp_compare_and_export(input_param, args, rank, step, pbar_info=None):
+    graph_result = _mp_compare(input_param, args, rank, rank, pbar_info=pbar_info)
+    if step is not None:
+        graph_result.step = get_step_or_rank_int(step)
+    create_directory(args.output_path)
-        export_res_task_list = []
-        create_directory(args.output_path)
-        for result in compare_graph_results:
-            export_res_task_list.append(pool.apply_async(_export_compare_graph_result,
-                                                         args=(serializable_args, result),
-                                                         error_callback=err_call))
-        export_res_list = [res.get() for res in export_res_task_list]
-        if any(export_res_list):
-            failed_names = list(filter(lambda x: x, export_res_list))
-            logger.error(f'Unable to export compare graph results: {", ".join(failed_names)}.')
-        else:
-            logger.info('Successfully exported compare graph results.')
+    return _export_compare_graph_result(args, graph_result, pbar_info=pbar_info)
-def _get_compare_graph_results(input_param, serializable_args, step, pool, err_call):
+def _compare_graph_ranks(input_param, args, step=None, pbar_info=None):
     dump_rank_n = input_param.get('npu_path')
     dump_rank_b = input_param.get('bench_path')
     npu_ranks = sort_rank_number_strings(check_and_return_dir_contents(dump_rank_n, Const.RANK))
@@ -251,64 +240,86 @@ def _get_compare_graph_results(input_param, serializable_args, step, pool, err_c
             raise CompareException(CompareException.INVALID_PATH_ERROR)
         npu_ranks = intersection_ranks
         bench_ranks = intersection_ranks
-    compare_graph_results = []
-    if is_real_data_compare(input_param, npu_ranks, bench_ranks):
-        mp_task_dict = {}
-        for nr, br in zip(npu_ranks, bench_ranks):
-            input_param['npu_path'] = os.path.join(dump_rank_n, nr)
-            input_param['bench_path'] = os.path.join(dump_rank_b, br)
-            build_key = f'{step}_{nr}' if step else f'{nr}'
-            input_param_copy = deepcopy(input_param)
-            mp_task_dict[build_key] = pool.apply_async(_run_build_graph_compare,
-                                                       args=(input_param_copy, serializable_args, nr, br),
-                                                       error_callback=err_call)
-        mp_res_dict = {k: v.get() for k, v in mp_task_dict.items()}
-        for mp_res in mp_res_dict.values():
-            compare_graph_results.append(_run_graph_compare(mp_res, input_param, serializable_args))
-    else:
-        compare_graph_tasks = []
-        for nr, br in zip(npu_ranks, bench_ranks):
-            input_param['npu_path'] = os.path.join(dump_rank_n, nr)
-            input_param['bench_path'] = os.path.join(dump_rank_b, br)
-            input_param_copy = deepcopy(input_param)
-            compare_graph_tasks.append(pool.apply_async(_mp_compare,
-                                                        args=(input_param_copy, serializable_args, nr, br),
-                                                        error_callback=err_call))
-        compare_graph_results = [task.get() for task in compare_graph_tasks]
-    if step is not None:
-        for result in compare_graph_results:
-            result.step = get_step_or_rank_int(step)
-    return compare_graph_results
+    args.rank_list = [get_step_or_rank_int(rank, True) for rank in npu_ranks]
+    serializable_args = SerializableArgs(args)
+    with Pool(processes=max(int((cpu_count() + 1) // 4), 1)) as pool:
+        def err_call(err):
+            logger.error(f'Error occurred while comparing graph ranks: {err}')
-def _compare_graph_steps(input_param, args):
-    dump_step_n = input_param.get('npu_path')
-    dump_step_b = input_param.get('bench_path')
+        if is_real_data_compare(input_param, npu_ranks, bench_ranks):
+            # 真实数据模式，考虑到tensor比对过程会使用进程池启用多进程，为了避免嵌套进程池，graph比对使用串行
+            compare_graph_results = []
+            mp_task_dict = {}
+            for nr, br in zip(npu_ranks, bench_ranks):
+                input_param['npu_path'] = os.path.join(dump_rank_n, nr)
+                input_param['bench_path'] = os.path.join(dump_rank_b, br)
+                build_key = f'{step}_{nr}' if step else f'{nr}'
+                input_param_copy = deepcopy(input_param)
+                pbar_info_copy = PbarInfo.update_task_id(pbar_info, nr)
+                mp_task_dict[build_key] = pool.apply_async(_run_build_graph_compare,
+                                                           args=(input_param_copy, serializable_args, nr, br,
+                                                                 pbar_info_copy),
+                                                           error_callback=err_call)
+            mp_res_dict = {k: v.get() for k, v in mp_task_dict.items()}
+            for build_key, mp_res in mp_res_dict.items():
+                if pbar_info:
+                    if Const.REPLACEMENT_CHARACTER in build_key:
+                        build_key = build_key.split(Const.REPLACEMENT_CHARACTER)[-1]
+                    pbar_info.task_id = build_key
+                compare_graph_results.append(_run_graph_compare(mp_res, input_param, serializable_args, pbar_info))
+            if step is not None:
+                for result in compare_graph_results:
+                    result.step = get_step_or_rank_int(step)
+            export_res_task_list = []
+            create_directory(args.output_path)
+            for result in compare_graph_results:
+                export_res_task_list.append(pool.apply_async(_export_compare_graph_result,
+                                                             args=(serializable_args, result),
+                                                             error_callback=err_call))
+            export_res_list = [res.get() for res in export_res_task_list]
+        else:
+            compare_graph_tasks = []
+            for nr, br in zip(npu_ranks, bench_ranks):
+                input_param['npu_path'] = os.path.join(dump_rank_n, nr)
+                input_param['bench_path'] = os.path.join(dump_rank_b, br)
+                input_param_copy = deepcopy(input_param)
+                pbar_info_copy = PbarInfo.update_task_id(pbar_info, nr)
+                compare_graph_tasks.append(pool.apply_async(_mp_compare_and_export,
+                                                            args=(input_param_copy, serializable_args, nr, step,
+                                                                  pbar_info_copy),
+                                                            error_callback=err_call))
+            export_res_list = [res.get() for res in compare_graph_tasks]
+        if any(export_res_list):
+            failed_names = list(filter(lambda x: x, export_res_list))
+            logger.error(f'Unable to export compare graph results: {", ".join(failed_names)}.')
+        else:
+            logger.info('Successfully exported compare graph results.')
-    npu_steps = check_and_return_dir_contents(dump_step_n, Const.STEP)
-    bench_steps = check_and_return_dir_contents(dump_step_b, Const.STEP)
-    if npu_steps != bench_steps:
-        intersection_steps = sort_rank_number_strings(list(set(npu_steps) & set(bench_steps)))
+def _compare_graph_steps(input_param, args, pbar_info=None):
+    dump_step_n = input_param.get('npu_path')
+    dump_step_b = input_param.get('bench_path')
-        if not intersection_steps:
-            logger.error('The steps in the two runs are completely different. Unable to match the steps.')
-            raise CompareException(CompareException.INVALID_PATH_ERROR)
-        npu_steps = intersection_steps
+    npu_steps = calculate_list(dump_step_n, dump_step_b, Const.STEP)
     args.step_list = sorted([get_step_or_rank_int(step) for step in npu_steps])
-    for folder_step in npu_steps:
+    for i, folder_step in enumerate(npu_steps):
         logger.info(f'Start processing data for {folder_step}...')
         input_param['npu_path'] = os.path.join(dump_step_n, folder_step)
         input_param['bench_path'] = os.path.join(dump_step_b, folder_step)
-        _compare_graph_ranks(input_param, args, step=folder_step) if not args.parallel_merge \
-            else _compare_graph_ranks_parallel(input_param, args, step=folder_step)
+        if pbar_info:
+            pbar_info.step = i
+        _compare_graph_ranks(input_param, args, step=folder_step, pbar_info=pbar_info) if not args.parallel_merge \
+            else _compare_graph_ranks_parallel(input_param, args, step=folder_step, pbar_info=pbar_info)
-def _build_graph_ranks(dump_ranks_path, args, step=None):
+def _build_graph_ranks_parallel(args, step=None, pbar_info=None):
+    dump_ranks_path = os.path.join(args.target_path, step) if step is not None else args.target_path
     ranks = sort_rank_number_strings(check_and_return_dir_contents(dump_ranks_path, Const.RANK))
     serializable_args = SerializableArgs(args)
     with Pool(processes=max(int((cpu_count() + 1) // 4), 1)) as pool:
@@ -320,10 +331,13 @@ def _build_graph_ranks(dump_ranks_path, args, step=None):
                 logger.error(f'Error occurred while terminating the pool: {e}')
         build_graph_tasks = []
+        if pbar_info and pbar_info.step:
+            PbarInfo.reset_progress_and_current_stage(pbar_info, ranks)
         for rank in ranks:
+            pbar_info_copy = PbarInfo.update_task_id(pbar_info, rank)
             build_graph_tasks.append(pool.apply_async(_run_build_graph_single,
-                                                      args=(dump_ranks_path, rank, step, serializable_args),
-                                                      error_callback=err_call))
+                                                      args=(dump_ranks_path, rank, step, serializable_args,
+                                                            pbar_info_copy), error_callback=err_call))
         build_graph_results = [task.get() for task in build_graph_tasks]
         if step is not None:
@@ -332,18 +346,19 @@ def _build_graph_ranks(dump_ranks_path, args, step=None):
         if args.parallel_params:
             validate_parallel_param(args.parallel_params[0], dump_ranks_path)
-            build_graph_results = GraphMerger(build_graph_results, args.parallel_params[0]).merge_graph()
-        if len(build_graph_results) > 1 and not args.parallel_merge:
-            DistributedAnalyzer({obj.rank: obj.graph for obj in build_graph_results},
-                                args.overflow_check).distributed_match()
+            build_graph_results = GraphMerger(build_graph_results, args.parallel_params[0],
+                                              pbar_info=pbar_info).merge_graph()
+            if pbar_info:
+                PbarInfo.del_progress_dict_item(pbar_info, ranks,
+                                                [f'{Const.RANK}{result.rank}' for result in build_graph_results])
         create_directory(args.output_path)
         export_build_graph_tasks = []
         serializable_args.rank_list = [result.rank for result in build_graph_results]
         for result in build_graph_results:
+            pbar_info_copy = PbarInfo.update_task_id(pbar_info, f'{Const.RANK}{result.rank}')
             export_build_graph_tasks.append(pool.apply_async(_export_build_graph_result,
-                                                             args=(serializable_args, result),
+                                                             args=(serializable_args, result, pbar_info_copy),
                                                              error_callback=err_call))
         export_build_graph_result = [task.get() for task in export_build_graph_tasks]
         if any(export_build_graph_result):
@@ -353,30 +368,55 @@ def _build_graph_ranks(dump_ranks_path, args, step=None):
             logger.info(f'Successfully exported build graph results.')
-def _build_graph_steps(dump_steps_path, args):
-    steps = sorted(check_and_return_dir_contents(dump_steps_path, Const.STEP))
+def _build_graph_ranks(args, step=None, pbar_info=None):
+    dump_ranks_path = os.path.join(args.target_path, step) if step is not None else args.target_path
+    ranks = sort_rank_number_strings(check_and_return_dir_contents(dump_ranks_path, Const.RANK))
+    args.rank_list = [get_step_or_rank_int(rank, True) for rank in ranks]
+    serializable_args = SerializableArgs(args)
+    with Pool(processes=max(int((cpu_count() + 1) // 4), 1)) as pool:
+        def err_call(err):
+            logger.error(f'Error occurred while comparing graph ranks: {err}')
+        tasks = []
+        for rank in ranks:
+            pbar_info_copy = PbarInfo.update_task_id(pbar_info, rank)
+            tasks.append(pool.apply_async(_run_build_graph_and_export,
+                                          args=(dump_ranks_path, rank, step, serializable_args, pbar_info_copy),
+                                          error_callback=err_call))
+        results = [task.get() for task in tasks]
+        if any(results):
+            failed_names = list(filter(lambda x: x, results))
+            logger.error(f'Unable to export build graph results: {failed_names}.')
+        else:
+            logger.info(f'Successfully exported build graph results.')
+def _build_graph_steps(args, pbar_info=None):
+    steps = sorted(check_and_return_dir_contents(args.target_path, Const.STEP))
     args.step_list = sorted([get_step_or_rank_int(step) for step in steps])
-    for step in steps:
+    for i, step in enumerate(steps):
         logger.info(f'Start processing data for {step}...')
-        dump_ranks_path = os.path.join(dump_steps_path, step)
-        _build_graph_ranks(dump_ranks_path, args, step)
+        if pbar_info:
+            pbar_info.step = i
+        _build_graph_ranks(args, step, pbar_info=pbar_info) if not args.parallel_merge \
+            else _build_graph_ranks_parallel(args, step, pbar_info=pbar_info)
-def _compare_and_export_graph(graph_task_info, input_param, args, step=None):
-    result = _run_graph_compare(graph_task_info, input_param, args)
+def _compare_and_export_graph(graph_task_info, input_param, args, step=None, pbar_info=None):
+    result = _run_graph_compare(graph_task_info, input_param, args, pbar_info=pbar_info)
     if step is not None:
         result.step = get_step_or_rank_int(step)
-    return _export_compare_graph_result(args, result)
+    return _export_compare_graph_result(args, result, pbar_info=pbar_info)
-def _compare_graph_ranks_parallel(input_param, args, step=None):
+def _compare_graph_ranks_parallel(input_param, args, step=None, pbar_info=None):
     args.fuzzy_match = True
     npu_path = input_param.get('npu_path')
     bench_path = input_param.get('bench_path')
     ranks_n = sort_rank_number_strings(check_and_return_dir_contents(npu_path, Const.RANK))
     ranks_b = sort_rank_number_strings(check_and_return_dir_contents(bench_path, Const.RANK))
-    parallel_params = load_parallel_param(input_param)
+    parallel_params = args.parallel_params
     if len(parallel_params) != 2:
         raise RuntimeError('Parallel params error in compare graph!')
     validate_parallel_param(parallel_params[0], npu_path)
@@ -394,24 +434,33 @@ def _compare_graph_ranks_parallel(input_param, args, step=None):
         # 1.并行构图
         build_graph_tasks_n = []
         build_graph_tasks_b = []
+        if pbar_info and pbar_info.step:
+            PbarInfo.reset_progress_and_current_stage(pbar_info, list(set(ranks_n) | set(ranks_b)))
         for rank in ranks_n:
+            pbar_info_copy = PbarInfo.update_task_id(pbar_info, rank)
             build_graph_tasks_n.append(pool.apply_async(_run_build_graph_single,
-                                                        args=(npu_path, rank, step, serializable_args),
+                                                        args=(npu_path, rank, step, serializable_args, pbar_info_copy),
                                                         error_callback=err_call))
         for rank in ranks_b:
+            pbar_info_copy = PbarInfo.update_task_id(pbar_info, rank)
             build_graph_tasks_b.append(pool.apply_async(_run_build_graph_single,
-                                                        args=(bench_path, rank, step, serializable_args),
-                                                        error_callback=err_call))
+                                                        args=(bench_path, rank, step, serializable_args,
+                                                              pbar_info_copy), error_callback=err_call))
         graph_results_n = [task.get() for task in build_graph_tasks_n]
         graph_results_b = [task.get() for task in build_graph_tasks_b]
         # 2.图合并
-        build_graph_results_n = GraphMerger(graph_results_n, parallel_params[0]).merge_graph()
-        build_graph_results_b = GraphMerger(graph_results_b, parallel_params[1], True).merge_graph()
+        build_graph_results_n = GraphMerger(graph_results_n, parallel_params[0], pbar_info=pbar_info).merge_graph()
+        build_graph_results_b = GraphMerger(graph_results_b, parallel_params[1], True,
+                                            pbar_info=pbar_info).merge_graph()
         if len(build_graph_results_n) != len(build_graph_results_b):
             raise RuntimeError(f'Parallel merge failed because the dp of npu: {len(build_graph_results_n)} '
                                f'is inconsistent with that of bench: {len(build_graph_results_b)}!')
         serializable_args.rank_list = [result.rank for result in build_graph_results_n]
+        if pbar_info:
+            PbarInfo.del_progress_dict_item(pbar_info, list(set(ranks_n) | set(ranks_b)),
+                                            [f'{Const.RANK}{result.rank}' for result in build_graph_results_n])
         # 3.并行图比对和输出
         export_res_task_list = []
         create_directory(args.output_path)
@@ -422,9 +471,10 @@ def _compare_graph_ranks_parallel(input_param, args, step=None):
                 _build_graph_info(os.path.join(npu_path, f'rank{graph_n.root.rank}'), args, graph_n),
                 _build_graph_info(os.path.join(bench_path, f'rank{graph_b.root.rank}'), args, graph_b),
                 f'rank{graph_n.root.rank}', f'rank{graph_b.root.rank}', current_time)
+            pbar_info_copy = PbarInfo.update_task_id(pbar_info, f'{Const.RANK}{result_n.rank}')
             export_res_task_list.append(pool.apply_async(_compare_and_export_graph,
-                                                         args=(graph_task_info, input_param, serializable_args, step),
-                                                         error_callback=err_call))
+                                                         args=(graph_task_info, input_param, serializable_args, step,
+                                                               pbar_info_copy), error_callback=err_call))
         export_res_list = [res.get() for res in export_res_task_list]
         if any(export_res_list):
             failed_names = list(filter(lambda x: x, export_res_list))
@@ -434,80 +484,336 @@ def _compare_graph_ranks_parallel(input_param, args, step=None):
 def _graph_service_parser(parser):
-    parser.add_argument("-i", "--input_path", dest="input_path", type=str,
-                        help="<Required> The compare input path, a dict json.", required=True)
+    # -------------------------- 基础必填参数 --------------------------
+    parser.add_argument("-tp", "--target_path", dest="target_path", type=str,
+                        help="<Required> The target path.", required=True)
     parser.add_argument("-o", "--output_path", dest="output_path", type=str,
-                        help="<Required> The compare task result out path.", required=True)
+                        help="<Required> The visualization task result out path.", required=True)
+    # -------------------------- 基础可选参数 --------------------------
+    parser.add_argument("-gp", "--golden_path", dest="golden_path", type=str,
+                        help="<Optional> The golden path.", required=False)
     parser.add_argument("-lm", "--layer_mapping", dest="layer_mapping", type=str, nargs='?', const=True,
                         help="<Optional> The layer mapping file path.", required=False)
     parser.add_argument("-oc", "--overflow_check", dest="overflow_check", action="store_true",
                         help="<Optional> whether open overflow_check for graph.", required=False)
-    parser.add_argument("-f", "--fuzzy_match", dest="fuzzy_match", action="store_true",
-                        help="<Optional> Whether to perform a fuzzy match on the api name.", required=False)
+    parser.add_argument("-fm", "--fuzzy_match", dest="fuzzy_match", action="store_true",
+                        help="<Optional> whether to perform a fuzzy match on the api name.", required=False)
+    parser.add_argument("-tensor_log", "--is_print_compare_log", dest="is_print_compare_log", action="store_true",
+                        help="<Optional> whether print tensor compare log for visualization task.", required=False)
+    parser.add_argument("-progress_log", "--is_print_progress_log", dest="is_print_progress_log", action="store_true",
+                        help="<Optional> whether print progress log for visualization task.", required=False)
+    # -------------------------- 不同并行切分策略合并可选参数 --------------------------
+    group_n = parser.add_argument_group("Parallel Parameters, "
+                                        "used for graph merging under different parallel partitioning strategies")
+    group_n.add_argument("--rank_size", type=int, nargs='+', help="<Optional> The rank size of dump path.",
+                         required=False)
+    group_n.add_argument("--tp", type=int, nargs='+',
+                         help="<Optional, but required if rank_size is not empty> The tp size of dump path.",
+                         required=False)
+    group_n.add_argument("--pp", type=int, nargs='+',
+                         help="<Optional, but required if rank_size is not empty> The pp size of dump path.",
+                         required=False)
+    group_n.add_argument("--vpp", type=int, nargs='+', default=[1], help="<Optional> The vpp size of dump path.",
+                         required=False)
+    group_n.add_argument("--order", type=str, nargs='+', default=['tp-cp-ep-dp-pp'],
+                         help="<Optional> The order of dump path.", required=False)
 def _graph_service_command(args):
-    input_param = load_json(args.input_path)
-    npu_path = input_param.get("npu_path")
-    bench_path = input_param.get("bench_path")
-    args.parallel_merge = check_whether_parallel_merge(input_param)
-    args.parallel_params = load_parallel_param(input_param) if args.parallel_merge else None
-    check_file_or_directory_path(npu_path, isdir=True)
-    if bench_path:
-        check_file_or_directory_path(bench_path, isdir=True)
-    if check_file_type(npu_path) == FileCheckConst.DIR and not bench_path:
-        content = check_directory_content(npu_path)
-        output_db_path = os.path.join(args.output_path, build_output_db_name)
-        if content == GraphConst.RANKS:
-            _build_graph_ranks(npu_path, args)
-        elif content == GraphConst.STEPS:
-            _build_graph_steps(npu_path, args)
+    try:
+        if args.is_print_progress_log:
+            # 往ProgressInfo中记录error日志，用于前端展示
+            BaseLogger.error = get_log_msg_wrapper(BaseLogger.error)
+        npu_path = args.target_path
+        bench_path = args.golden_path
+        ProgressInfo.print_progress_log = args.is_print_progress_log
+        args.parallel_merge = True if args.rank_size else False
+        args.parallel_params = load_parallel_param(args) if args.parallel_merge else None
+        check_file_or_directory_path(npu_path, isdir=True)
+        if bench_path:
+            check_file_or_directory_path(bench_path, isdir=True)
+        if check_file_type(npu_path) == FileCheckConst.DIR and not bench_path:
+            content = check_directory_content(npu_path)
+            if content == GraphConst.RANKS:
+                _build_graph_ranks_with_pbar(args)
+            elif content == GraphConst.STEPS:
+                _build_graph_steps_with_pbar(args)
+            else:
+                _build_graph_with_pbar(npu_path, args)
+        elif check_file_type(npu_path) == FileCheckConst.DIR and check_file_type(bench_path) == FileCheckConst.DIR:
+            content_n = check_directory_content(npu_path)
+            content_b = check_directory_content(bench_path)
+            if content_n != content_b:
+                raise ValueError('The directory structures of npu_path and bench_path are inconsistent.')
+            input_param = {
+                'npu_path': args.target_path,
+                'bench_path': args.golden_path,
+                'is_print_compare_log': args.is_print_compare_log
+            }
+            if content_n == GraphConst.RANKS:
+                _compare_graph_ranks_with_pbar(input_param, args)
+            elif content_n == GraphConst.STEPS:
+                _compare_graph_steps_with_pbar(input_param, args)
+            else:
+                _compare_graph_with_pbar(input_param, args)
         else:
-            result = _build_graph_result(npu_path, args)
-            create_directory(args.output_path)
-            file_name = _export_build_graph_result(args, result)
-            if file_name:
-                logger.error('Failed to export model build graph.')
-    elif check_file_type(npu_path) == FileCheckConst.DIR and check_file_type(bench_path) == FileCheckConst.DIR:
-        content_n = check_directory_content(npu_path)
-        content_b = check_directory_content(bench_path)
-        output_db_path = os.path.join(args.output_path, compare_output_db_name)
-        if content_n != content_b:
-            raise ValueError('The directory structures of npu_path and bench_path are inconsistent.')
-        if content_n == GraphConst.RANKS:
-            if args.parallel_merge:
-                _compare_graph_ranks_parallel(input_param, args)
+            logger.error("The npu_path or bench_path should be a folder.")
+            raise CompareException(CompareException.INVALID_COMPARE_MODE)
+    except KeyboardInterrupt:
+        logger.warning("Interrupted by user, terminating processes and cleaning up...")
+    except Exception as e:
+        logger.error(f"An unexpected error occurred: {e}")
+        raise e
+    finally:
+        ProgressInfo.update_process_running(False)
+@dataclass
+class ProgressConfig:
+    core_func: Callable
+    get_ranks: Callable
+    db_name: str
+    pbar_info_kwargs: dict = None
+    use_monitor_thread: bool = True
+    tqdm_total: Optional[int] = None
+def _run_with_progress(param, args, config: ProgressConfig):
+    """通用进度条处理"""
+    monitor_thread = None
+    pbar_info = None
+    ranks = None
+    try:
+        if config.use_monitor_thread:
+            manager = Manager()
+            progress_dict = manager.dict()
+            pbar_info = PbarInfo(progress_dict=progress_dict, **config.pbar_info_kwargs)
+            ranks = config.get_ranks(args)
+        else:
+            pbar_info = PbarInfo(**config.pbar_info_kwargs)
+        tqdm_args = {
+            "desc": GraphConst.PBAR_DESC_PREFIX,
+            "total": config.tqdm_total if config.tqdm_total is not None else pbar_info.total,
+            "bar_format": GraphConst.BAR_FORMAT
+        }
+        with tqdm(**tqdm_args) as pbar:
+            # 单进程场景直接更新pbar，多进程场景需要通过monitor thread从共享dict中获取进度更新pbar
+            if config.use_monitor_thread:
+                monitor_thread = threading.Thread(target=monitor_progress,
+                                                  args=(pbar_info, pbar, ranks, args.parallel_merge))
+                monitor_thread.start()
             else:
-                _compare_graph_ranks(input_param, args)
-        elif content_n == GraphConst.STEPS:
-            _compare_graph_steps(input_param, args)
+                pbar_info.pbar = pbar
+            if param:
+                config.core_func(param, args, pbar_info=pbar_info)
+            else:
+                config.core_func(args, pbar_info=pbar_info)
+            db_path = os.path.join(args.output_path, config.db_name)
+            post_process_db(db_path, pbar_info=pbar_info, is_parallel_merge=args.parallel_merge)
+            if not args.parallel_merge and config.use_monitor_thread:
+                distributed_analyse(db_path, args.overflow_check, pbar_info=pbar_info)
+            if config.use_monitor_thread and monitor_thread:
+                monitor_thread.join(timeout=5)
+    except KeyboardInterrupt:
+        logger.warning("Interrupted by user, terminating processes and cleaning up...")
+    except Exception as e:
+        logger.error(f"An unexpected error occurred: {e}")
+        raise e
+    finally:
+        ProgressInfo.update_process_running(False)
+        if config.use_monitor_thread and pbar_info:
+            pbar_info.stop_monitor = True
+def _build_graph_ranks_with_pbar(args):
+    def core_func(args, pbar_info):
+        if args.parallel_merge:
+            _build_graph_ranks_parallel(args, pbar_info=pbar_info)
         else:
-            result = _compare_graph_result(input_param, args)
-            create_directory(args.output_path)
-            file_name = _export_compare_graph_result(args, result)
-            if file_name:
-                logger.error('Failed to export model compare graph.')
-    else:
-        logger.error("The npu_path or bench_path should be a folder.")
-        raise CompareException(CompareException.INVALID_COMPARE_MODE)
-    # 所有数据输出db结束后，添加索引，修改权限
-    post_process_db(output_db_path)
+            _build_graph_ranks(args, pbar_info=pbar_info)
+    def get_ranks(args):
+        return check_and_return_dir_contents(args.target_path, Const.RANK)
-def _pt_graph_service_parser(parser):
-    _graph_service_parser(parser)
+    stage_total = _get_parallel_stage_total(args) if args.parallel_merge else GraphConst.BUILD_STAGES_TOTAL
+    _run_with_progress(
+        param=None,
+        args=args,
+        config=ProgressConfig(
+            core_func=core_func,
+            get_ranks=get_ranks,
+            pbar_info_kwargs={"stage_total": stage_total},
+            db_name=build_output_db_name,
+        )
+    )
-def _pt_graph_service_command(args):
-    _graph_service_command(args)
+def _build_graph_steps_with_pbar(args):
+    steps = check_and_return_dir_contents(args.target_path, Const.STEP)
-def _ms_graph_service_parser(parser):
-    _graph_service_parser(parser)
+    def get_ranks(args):
+        return check_and_return_dir_contents(os.path.join(args.target_path, steps[0]), Const.RANK)
+    stage_total = _get_parallel_stage_total(args, steps) if args.parallel_merge else GraphConst.BUILD_STAGES_TOTAL
-def _ms_graph_service_command(args):
-    _graph_service_command(args)
+    _run_with_progress(
+        param=None,
+        args=args,
+        config=ProgressConfig(
+            core_func=_build_graph_steps,
+            get_ranks=get_ranks,
+            pbar_info_kwargs={"step_total": len(steps), "stage_total": stage_total},
+            db_name=build_output_db_name,
+        )
+    )
+def _build_graph_with_pbar(npu_path, args):
+    def core_func(param, args, pbar_info):
+        result = _build_graph_result(param, args, pbar_info)
+        create_directory(args.output_path)
+        file_name = _export_build_graph_result(args, result, pbar_info)
+        if file_name:
+            logger.error('Failed to export model build graph.')
+    _run_with_progress(
+        param=npu_path,
+        args=args,
+        config=ProgressConfig(
+            core_func=core_func,
+            get_ranks=lambda x: None,
+            pbar_info_kwargs={},
+            db_name=build_output_db_name,
+            use_monitor_thread=False,
+            tqdm_total=GraphConst.PBAR_TOTAL
+        )
+    )
+def _compare_graph_ranks_with_pbar(input_param, args):
+    def core_func(param, args, pbar_info):
+        if args.parallel_merge:
+            _compare_graph_ranks_parallel(param, args, pbar_info=pbar_info)
+        else:
+            _compare_graph_ranks(param, args, pbar_info=pbar_info)
+    def get_ranks(args):
+        if args.parallel_merge:
+            return calculate_list(args.target_path, args.golden_path, mode=GraphConst.UNION)
+        return calculate_list(args.target_path, args.golden_path)
+    stage_total = _get_parallel_stage_total(args, is_compare=True) if args.parallel_merge \
+        else GraphConst.COMPARE_STAGES_TOTAL
+    _run_with_progress(
+        param=input_param,
+        args=args,
+        config=ProgressConfig(
+            core_func=core_func,
+            get_ranks=get_ranks,
+            pbar_info_kwargs={"stage_total": stage_total},
+            db_name=compare_output_db_name
+        )
+    )
+def _compare_graph_steps_with_pbar(input_param, args):
+    steps = calculate_list(args.target_path, args.golden_path, Const.STEP)
+    def get_ranks(args):
+        rank_path_t = os.path.join(args.target_path, steps[0])
+        rank_path_g = os.path.join(args.golden_path, steps[0])
+        if args.parallel_merge:
+            return calculate_list(rank_path_t, rank_path_g, mode=GraphConst.UNION)
+        return calculate_list(rank_path_t, rank_path_g)
+    stage_total = _get_parallel_stage_total(args, steps, is_compare=True) if args.parallel_merge \
+        else GraphConst.COMPARE_STAGES_TOTAL
+    _run_with_progress(
+        param=input_param,
+        args=args,
+        config=ProgressConfig(
+            core_func=_compare_graph_steps,
+            get_ranks=get_ranks,
+            pbar_info_kwargs={"stage_total": stage_total, "step_total": len(steps)},
+            db_name=compare_output_db_name
+        )
+    )
+def _compare_graph_with_pbar(input_param, args):
+    def core_func(param, args, pbar_info):
+        result = _compare_graph_result(param, args, pbar_info=pbar_info)
+        create_directory(args.output_path)
+        file_name = _export_compare_graph_result(args, result, pbar_info=pbar_info)
+        if file_name:
+            logger.error('Failed to export model compare graph.')
+    _run_with_progress(
+        param=input_param,
+        args=args,
+        config=ProgressConfig(
+            core_func=core_func,
+            get_ranks=lambda x: None,
+            pbar_info_kwargs={"pbar": None, "stage_total": GraphConst.COMPARE_STAGES_TOTAL},
+            db_name=compare_output_db_name,
+            use_monitor_thread=False,
+            tqdm_total=GraphConst.PBAR_TOTAL
+        )
+    )
+def _get_parallel_stage_total(args, steps=None, is_compare=False):
+    """
+    获取不同并行切分策略的任务阶段数
+    """
+    parallel_params = args.parallel_params
+    if not is_compare and (not parallel_params or len(parallel_params) != 1):
+        raise RuntimeError('Parallel params error in build graph!')
+    if is_compare and (not parallel_params or len(parallel_params) != 2):
+        raise RuntimeError('Parallel params error in compare graph!')
+    target_path = os.path.join(args.target_path, steps[0]) if steps else args.target_path
+    validate_parallel_param(parallel_params[0], target_path)
+    if is_compare:
+        golden_path = os.path.join(args.golden_path, steps[0]) if steps else args.golden_path
+        validate_parallel_param(parallel_params[1], golden_path, '[Bench]')
+    stage_count_map = {
+        "TPMerger": lambda param: param.rank_size // param.tp,
+        "PPMerger": lambda param: param.rank_size // param.pp,
+        "VPPMerger": lambda param: param.rank_size // param.pp,
+        "TPPPMerger": lambda param: param.rank_size // param.pp + param.rank_size // param.pp // param.tp,
+        "FullMerger": lambda param: param.rank_size // param.pp + param.rank_size // param.pp // param.tp,
+        "NoParallelMerger": 0
+    }
+    def _get_stage_count(parallel_param, merger_name: str) -> int:
+        rule = stage_count_map.get(merger_name, 0)
+        return rule(parallel_param) if callable(rule) else rule
+    merger_name_t = GraphMerger([], parallel_params[0]).strategy.__class__.__name__
+    stage_count_target = _get_stage_count(parallel_params[0], merger_name_t)
+    if is_compare:
+        merger_name_g = GraphMerger([], parallel_params[1]).strategy.__class__.__name__
+        stage_count_golden = _get_stage_count(parallel_params[1], merger_name_g)
+        return GraphConst.COMPARE_STAGES_TOTAL + stage_count_target + stage_count_golden
+    return GraphConst.BUILD_STAGES_TOTAL + stage_count_target
 class CompareGraphResult:
@@ -526,3 +832,72 @@ class BuildGraphResult:
         self.micro_steps = micro_steps
         self.rank = rank
         self.step = step
+class PbarInfo:
+    def __init__(self, pbar=None, progress_dict=None, task_id=None, step=0, step_total=1,
+                 stage_total=GraphConst.BUILD_STAGES_TOTAL):
+        self.pbar = pbar
+        self.progress_dict = progress_dict
+        self.task_id = task_id
+        self.step = step
+        self.step_total = step_total
+        self.total = GraphConst.PBAR_TOTAL * step_total
+        self.stage_total = stage_total * step_total  # 有几个阶段
+        self.current_stage_dict = Manager().dict()  # 当前阶段，进程共享
+        self.stage_progress = round(self.total / self.stage_total, 2)  # 每个阶段的最大进度
+        self.stop_monitor = False
+        self.wait_monitor = False
+        self.continue_monitor = True
+    def __deepcopy__(self, memo):
+        new_obj = PbarInfo()
+        new_obj.progress_dict = self.progress_dict
+        new_obj.task_id = self.task_id
+        new_obj.step = self.step
+        new_obj.step_total = self.step_total
+        new_obj.stage_total = self.stage_total
+        new_obj.current_stage_dict = self.current_stage_dict
+        new_obj.stage_progress = self.stage_progress
+        new_obj.total = self.total
+        new_obj.stop_monitor = self.stop_monitor
+        new_obj.wait_monitor = self.wait_monitor
+        new_obj.continue_monitor = self.continue_monitor
+        return new_obj
+    @staticmethod
+    def update_task_id(pbar_info, task_id):
+        """
+        在进程池中，实例作为入参，修改实例属性，需要深拷贝实例使修改生效
+        """
+        if pbar_info:
+            pbar_info.task_id = task_id
+            return deepcopy(pbar_info)
+        return pbar_info
+    @staticmethod
+    def del_progress_dict_item(pbar_info, origin_ranks, merged_ranks):
+        """
+        不同并行切分策略的图合并场景下，graph合并到一些rank中，剩余的rank作为task_id不再需要
+        """
+        diff_ranks = list(set(origin_ranks) - set(merged_ranks))
+        for rank in diff_ranks:
+            if rank in pbar_info.progress_dict:
+                del pbar_info.progress_dict[rank]
+    @staticmethod
+    def reset_progress_and_current_stage(pbar_info, task_ids):
+        """
+        不同并行切分策略的图合并场景下，每个step需要重置进度信息
+        """
+        for task_id in task_ids:
+            pbar_info.progress_dict[task_id] = GraphConst.PBAR_TOTAL * pbar_info.step
+            pbar_info.current_stage_dict[task_id] = pbar_info.stage_total // pbar_info.step_total * pbar_info.step
+    def set_continue_monitor(self, value: bool):
+        self.continue_monitor = value
+        self.wait_monitor = not value
+    def set_wait_monitor(self, value: bool):
+        self.wait_monitor = value
+        self.continue_monitor = not value

mindstudio-probe 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

mindstudio-probe 8.3.2__py3-none-any.whl → 26.0.0a1__py3-none-any.whl