PyPI - mindstudio-probe - Versions diffs - 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl - Mend

mindstudio-probe 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

This diff shows the content of publicly available package versions that have been released to one of the supported registries. It is provided for informational purposes only and reflects the changes between package versions as they appear in their respective public registries.

Files changed (689)

{mindstudio_probe-8.3.3.dist-info → mindstudio_probe-26.0.0a1.dist-info}/METADATA +26 -14
mindstudio_probe-26.0.0a1.dist-info/RECORD +498 -0
{mindstudio_probe-8.3.3.dist-info → mindstudio_probe-26.0.0a1.dist-info}/WHEEL +1 -1
mindstudio_probe-26.0.0a1.dist-info/entry_points.txt +5 -0
mindstudio_probe-26.0.0a1.dist-info/licenses/LICENSE +124 -0
mindstudio_probe-26.0.0a1.dist-info/top_level.txt +2 -0
msprobe/__init__.py +12 -13
msprobe/config.json +9 -31
msprobe/core/__init__.py +12 -11
msprobe/core/acc_check/acc_check_cli.py +145 -0
msprobe/core/common/const.py +97 -38
msprobe/core/common/db_manager.py +133 -12
msprobe/core/common/decorator.py +12 -11
msprobe/core/common/exceptions.py +12 -11
msprobe/core/common/file_utils.py +101 -25
msprobe/core/common/framework_adapter.py +36 -25
msprobe/core/common/global_lock.py +12 -11
msprobe/core/common/inplace_op_checker.py +12 -11
msprobe/core/common/log.py +22 -11
msprobe/core/common/megatron_utils.py +566 -11
msprobe/core/common/parallel_state.py +12 -11
msprobe/core/common/runtime.py +12 -11
msprobe/core/common/utils.py +41 -41
msprobe/core/compare/acc_compare.py +361 -104
msprobe/core/compare/atb_data_compare.py +422 -0
msprobe/core/compare/auto_compare.py +134 -0
msprobe/core/compare/check.py +14 -17
msprobe/core/compare/compare_cli.py +72 -149
msprobe/core/compare/config.py +12 -13
msprobe/core/compare/diff_analyze/first_diff_analyze.py +28 -15
msprobe/core/compare/diff_analyze/ignore_op_list.yaml +3 -0
msprobe/core/compare/find_first/analyzer.py +18 -18
msprobe/core/compare/find_first/graph.py +12 -11
msprobe/core/compare/find_first/utils.py +13 -12
msprobe/core/compare/indicator_analysis/__init__.py +15 -0
msprobe/core/compare/indicator_analysis/algorithm.py +363 -0
msprobe/core/compare/indicator_analysis/api_data.py +141 -0
msprobe/core/compare/indicator_analysis/calculator.py +181 -0
msprobe/core/compare/indicator_analysis/utils.py +116 -0
msprobe/core/compare/layer_mapping/__init__.py +12 -11
msprobe/core/compare/layer_mapping/data_scope_parser.py +20 -11
msprobe/core/compare/layer_mapping/layer_mapping.py +14 -13
msprobe/core/compare/layer_mapping/postprocess_pass.py +13 -11
msprobe/core/compare/merge_result/merge_result.py +12 -11
msprobe/core/compare/merge_result/merge_result_cli.py +12 -11
msprobe/core/compare/merge_result/utils.py +12 -11
msprobe/core/compare/multiprocessing_compute.py +13 -14
msprobe/core/compare/npy_compare.py +13 -11
msprobe/core/compare/offline_data_compare.py +160 -0
msprobe/core/compare/stats_diff_calc.py +39 -0
msprobe/core/compare/torchair_acc_cmp.py +764 -0
msprobe/core/compare/torchair_cmp_utils.py +338 -0
msprobe/core/compare/utils.py +140 -49
msprobe/core/config_check/__init__.py +12 -11
msprobe/core/config_check/checkers/__init__.py +12 -11
msprobe/core/config_check/checkers/base_checker.py +15 -14
msprobe/core/config_check/checkers/dataset_checker.py +13 -12
msprobe/core/config_check/checkers/env_args_checker.py +13 -12
msprobe/core/config_check/checkers/hyperparameter_checker.py +16 -15
msprobe/core/config_check/checkers/pip_checker.py +15 -15
msprobe/core/config_check/checkers/random_checker.py +13 -12
msprobe/core/config_check/checkers/weights_checker.py +14 -12
msprobe/core/config_check/ckpt_compare/ckpt_comparator.py +13 -17
msprobe/core/config_check/ckpt_compare/megatron_loader.py +13 -12
msprobe/core/config_check/ckpt_compare/metrics.py +12 -11
msprobe/core/config_check/config_check_cli.py +18 -17
msprobe/core/config_check/config_checker.py +16 -14
msprobe/core/config_check/resource/dependency.yaml +15 -12
msprobe/core/config_check/resource/env.yaml +12 -11
msprobe/core/config_check/utils/hyperparameter_parser.py +12 -11
msprobe/core/config_check/utils/utils.py +12 -11
msprobe/core/{data_dump → dump/api_dump}/api_registry.py +12 -11
msprobe/core/{common_config.py → dump/common_config.py} +13 -24
msprobe/core/dump/data_dump/data_collector.py +257 -0
msprobe/core/{data_dump → dump/data_dump}/data_processor/base.py +45 -36
msprobe/core/{data_dump → dump/data_dump}/data_processor/factory.py +33 -25
msprobe/core/{data_dump → dump/data_dump}/data_processor/mindspore_processor.py +37 -113
msprobe/core/{data_dump → dump/data_dump}/data_processor/pytorch_processor.py +364 -131
msprobe/core/{data_dump → dump/data_dump}/json_writer.py +24 -31
msprobe/core/{data_dump → dump/data_dump}/scope.py +12 -13
msprobe/core/{debugger → dump/debugger}/precision_debugger.py +15 -23
msprobe/core/dump/dump2db/db_utils.py +215 -0
msprobe/core/dump/dump2db/dump2db.py +409 -0
msprobe/core/{hook_manager.py → dump/hook_manager.py} +38 -87
msprobe/core/dump/kernel_dump/kernel_config.py +34 -0
msprobe/core/{service.py → dump/service.py} +43 -27
msprobe/core/install_deps/install_deps.py +51 -0
msprobe/core/monitor/anomaly_processor.py +13 -11
msprobe/core/monitor/csv2db.py +73 -93
msprobe/core/monitor/db_utils.py +140 -205
msprobe/core/monitor/utils.py +18 -17
msprobe/core/monitor_v2/__init__.py +20 -0
msprobe/core/monitor_v2/base.py +83 -0
msprobe/core/monitor_v2/cc.py +287 -0
msprobe/core/monitor_v2/factory.py +81 -0
msprobe/core/monitor_v2/module.py +201 -0
msprobe/core/monitor_v2/optimizer.py +245 -0
msprobe/core/monitor_v2/param.py +154 -0
msprobe/core/monitor_v2/trainer.py +326 -0
msprobe/core/monitor_v2/utils.py +122 -0
msprobe/core/monitor_v2/weight_grad.py +419 -0
msprobe/core/monitor_v2/writer.py +162 -0
msprobe/core/overflow_check/abnormal_scene.py +12 -11
msprobe/core/overflow_check/api_info.py +12 -11
msprobe/core/overflow_check/checker.py +12 -11
msprobe/core/overflow_check/filter.py +13 -11
msprobe/core/overflow_check/level.py +12 -11
msprobe/core/overflow_check/utils.py +12 -11
msprobe/core/single_save/single_comparator.py +12 -11
msprobe/core/single_save/single_saver.py +12 -11
msprobe/infer/__init__.py +16 -0
msprobe/infer/offline/__init__.py +16 -0
msprobe/infer/offline/compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/args_adapter.py +46 -0
msprobe/infer/offline/compare/msquickcmp/atc/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/atc/atc_utils.py +98 -0
msprobe/infer/offline/compare/msquickcmp/cmp_process.py +328 -0
msprobe/infer/offline/compare/msquickcmp/common/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/common/args_check.py +112 -0
msprobe/infer/offline/compare/msquickcmp/common/convert.py +74 -0
msprobe/infer/offline/compare/msquickcmp/common/dump_data.py +121 -0
msprobe/infer/offline/compare/msquickcmp/common/dynamic_argument_bean.py +39 -0
msprobe/infer/offline/compare/msquickcmp/common/utils.py +669 -0
msprobe/infer/offline/compare/msquickcmp/config.ini +6 -0
msprobe/infer/offline/compare/msquickcmp/dump/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/dump/args_adapter.py +50 -0
msprobe/infer/offline/compare/msquickcmp/dump/dump_process.py +91 -0
msprobe/infer/offline/compare/msquickcmp/install_aclruntime_aisbench.sh +180 -0
msprobe/infer/offline/compare/msquickcmp/main.py +199 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/net_compare.py +277 -0
msprobe/infer/offline/compare/msquickcmp/npu/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/npu/npu_dump_data.py +558 -0
msprobe/infer/offline/compare/msquickcmp/npu/om_parser.py +416 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/onnx_dump_data.py +374 -0
msprobe/infer/utils/__init__.py +15 -0
msprobe/infer/utils/acc_cmp.py +94 -0
msprobe/infer/utils/check/__init__.py +37 -0
msprobe/infer/utils/check/args_checker.py +35 -0
msprobe/infer/utils/check/checker.py +227 -0
msprobe/infer/utils/check/dict_checker.py +78 -0
msprobe/infer/utils/check/func_wrapper.py +96 -0
msprobe/infer/utils/check/list_checker.py +56 -0
msprobe/infer/utils/check/number_checker.py +64 -0
msprobe/infer/utils/check/obj_checker.py +41 -0
msprobe/infer/utils/check/path_checker.py +249 -0
msprobe/infer/utils/check/rule.py +126 -0
msprobe/infer/utils/check/string_checker.py +66 -0
msprobe/infer/utils/cmp_algorithm.py +261 -0
msprobe/infer/utils/constants.py +112 -0
msprobe/infer/utils/file_open_check.py +337 -0
msprobe/infer/utils/util.py +177 -0
msprobe/mindspore/__init__.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_info.py +12 -11
msprobe/mindspore/api_accuracy_checker/api_runner.py +12 -11
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/flash_attention_score.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/fusion_operator.py +12 -11
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +12 -11
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +15 -14
msprobe/mindspore/api_accuracy_checker/compute_element.py +12 -11
msprobe/mindspore/api_accuracy_checker/data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/main.py +12 -11
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +14 -12
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/torch_mindtorch_importer.py +12 -11
msprobe/mindspore/api_accuracy_checker/type_mapping.py +12 -11
msprobe/mindspore/api_accuracy_checker/utils.py +12 -11
msprobe/mindspore/common/const.py +15 -74
msprobe/mindspore/common/log.py +12 -11
msprobe/mindspore/common/utils.py +30 -15
msprobe/mindspore/compare/common_dir_compare.py +21 -23
msprobe/mindspore/compare/distributed_compare.py +18 -16
msprobe/mindspore/compare/ms_compare.py +14 -14
msprobe/mindspore/compare/ms_graph_compare.py +26 -20
msprobe/mindspore/compare/utils.py +14 -12
msprobe/mindspore/{cell_processor.py → dump/cell_processor.py} +15 -14
msprobe/mindspore/{debugger → dump/debugger}/debugger_config.py +12 -30
msprobe/mindspore/{debugger → dump/debugger}/precision_debugger.py +43 -45
msprobe/mindspore/dump/{cell_dump_process.py → dump_processor/cell_dump_process.py} +31 -17
msprobe/mindspore/dump/{cell_dump_with_insert_gradient.py → dump_processor/cell_dump_with_insert_gradient.py} +18 -14
msprobe/mindspore/dump/{dump_tool_factory.py → dump_processor/dump_tool_factory.py} +16 -15
msprobe/mindspore/dump/{graph_mode_cell_dump.py → dump_processor/graph_mode_cell_dump.py} +16 -15
msprobe/mindspore/dump/{graph_tensor_dump.py → dump_processor/graph_tensor_dump.py} +134 -133
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/api_register.py +15 -14
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/hook_cell.py +12 -11
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/ms_hook_manager.py +47 -20
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/primitive_hooks.py +14 -13
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/support_wrap_ops.yaml +13 -11
msprobe/mindspore/dump/{jit_dump.py → dump_processor/jit_dump.py} +14 -13
msprobe/mindspore/dump/{kernel_graph_dump.py → dump_processor/kernel_graph_dump.py} +13 -12
msprobe/mindspore/dump/{kernel_kbyk_dump.py → dump_processor/kernel_kbyk_dump.py} +13 -12
msprobe/mindspore/{exception_dump → dump/exception_dump}/exception_dump_tool_factory.py +14 -13
msprobe/mindspore/{exception_dump → dump/exception_dump}/kernel_graph_exception_dump.py +13 -12
msprobe/mindspore/{mindspore_service.py → dump/mindspore_service.py} +18 -17
msprobe/mindspore/dump/mindtorch/__init__.py +19 -0
msprobe/mindspore/dump/ms_config.py +105 -0
msprobe/mindspore/{overflow_check → dump/overflow_check}/kernel_graph_overflow_check.py +13 -12
msprobe/mindspore/{overflow_check → dump/overflow_check}/overflow_check_tool_factory.py +14 -13
msprobe/mindspore/dump/task_handler_factory.py +43 -0
msprobe/mindspore/monitor/common_func.py +12 -11
msprobe/mindspore/monitor/data_writers.py +12 -11
msprobe/mindspore/monitor/distributed/wrap_distributed.py +93 -39
msprobe/mindspore/monitor/features.py +12 -11
msprobe/mindspore/monitor/module_hook.py +19 -22
msprobe/mindspore/monitor/optimizer_collect.py +29 -25
msprobe/mindspore/monitor/utils.py +13 -11
msprobe/msaccucmp/advisor/__init__.py +16 -0
msprobe/msaccucmp/advisor/advisor_const.py +65 -0
msprobe/msaccucmp/advisor/advisor_result.py +73 -0
msprobe/msaccucmp/advisor/compare_advisor.py +99 -0
msprobe/msaccucmp/advisor/input_advisor.py +66 -0
msprobe/msaccucmp/advisor/node_advisor.py +68 -0
msprobe/msaccucmp/advisor/overflow_advisor.py +58 -0
msprobe/msaccucmp/algorithm_manager/__init__.py +16 -0
msprobe/msaccucmp/algorithm_manager/algorithm_manager.py +464 -0
msprobe/msaccucmp/algorithm_manager/algorithm_parameter.py +42 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_AccumulatedRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_CosineSimilarity.py +58 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_KullbackLeiblerDivergence.py +84 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RelativeEuclideanDistance.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RootMeanSquareError.py +40 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_StandardDeviation.py +47 -0
msprobe/msaccucmp/cmp_utils/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/common.py +113 -0
msprobe/msaccucmp/cmp_utils/constant/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/constant/compare_error.py +81 -0
msprobe/msaccucmp/cmp_utils/constant/const_manager.py +530 -0
msprobe/msaccucmp/cmp_utils/file_utils.py +497 -0
msprobe/msaccucmp/cmp_utils/log.py +257 -0
msprobe/msaccucmp/cmp_utils/multi_process/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/multi_process/multi_convert_process.py +140 -0
msprobe/msaccucmp/cmp_utils/multi_process/progress.py +78 -0
msprobe/msaccucmp/cmp_utils/path_check.py +274 -0
msprobe/msaccucmp/cmp_utils/reg_manager.py +98 -0
msprobe/msaccucmp/cmp_utils/tlv_parse.py +279 -0
msprobe/msaccucmp/cmp_utils/utils.py +356 -0
msprobe/msaccucmp/cmp_utils/utils_type.py +63 -0
msprobe/msaccucmp/compare_vector.py +48 -0
msprobe/msaccucmp/conversion/__init__.py +16 -0
msprobe/msaccucmp/conversion/data_conversion.py +277 -0
msprobe/msaccucmp/conversion/dtype_conversion.py +99 -0
msprobe/msaccucmp/conversion/shape_format_conversion.py +477 -0
msprobe/msaccucmp/conversion/tensor_conversion.py +369 -0
msprobe/msaccucmp/dump_data_conversion.py +46 -0
msprobe/msaccucmp/dump_parse/__init__.py +16 -0
msprobe/msaccucmp/dump_parse/big_dump_data.py +317 -0
msprobe/msaccucmp/dump_parse/dump.py +423 -0
msprobe/msaccucmp/dump_parse/dump_data_object.py +322 -0
msprobe/msaccucmp/dump_parse/dump_data_parser.py +436 -0
msprobe/msaccucmp/dump_parse/dump_utils.py +246 -0
msprobe/msaccucmp/dump_parse/ffts_parser.py +137 -0
msprobe/msaccucmp/dump_parse/mapping.py +62 -0
msprobe/msaccucmp/dump_parse/nano_dump_data.py +392 -0
msprobe/msaccucmp/dump_parse/proto_dump_data.py +308 -0
msprobe/msaccucmp/dump_parser.py +90 -0
msprobe/msaccucmp/format_manager/__init__.py +16 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NCHW.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_ND.py +52 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NHWC.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_HWCN.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_NCHW.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_FRACTAL_Z.py +89 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_HWCN.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NCHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NHWC.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_NCDHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_ND.py +44 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_HWCN.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/format_manager.py +307 -0
msprobe/msaccucmp/inplace_layer_process.py +186 -0
msprobe/msaccucmp/msaccucmp.py +532 -0
msprobe/msaccucmp/mscmp_advisor.py +128 -0
msprobe/msaccucmp/overflow/__init__.py +16 -0
msprobe/msaccucmp/overflow/overflow_analyse.py +305 -0
msprobe/msaccucmp/overflow/overflow_detection.py +143 -0
msprobe/msaccucmp/pytorch_cmp/__init__.py +16 -0
msprobe/msaccucmp/pytorch_cmp/compare_pytorch.py +389 -0
msprobe/msaccucmp/pytorch_cmp/hdf5_parser.py +377 -0
msprobe/msaccucmp/pytorch_cmp/pytorch_dump_data.py +461 -0
msprobe/msaccucmp/shape_conversion.py +41 -0
msprobe/msaccucmp/vector_cmp/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/batch_compare.py +197 -0
msprobe/msaccucmp/vector_cmp/compare_detail/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/compare_detail/compare_detail.py +245 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail.py +182 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail_writer.py +580 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_fusion_op.py +588 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_npu_vs_npu.py +339 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_result.py +326 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_rule.py +156 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_op.py +204 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_rule_parser.py +635 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/quant_filter.py +187 -0
msprobe/msaccucmp/vector_cmp/range_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_manager.py +100 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_mode.py +94 -0
msprobe/msaccucmp/vector_cmp/range_manager/select_mode.py +86 -0
msprobe/msaccucmp/vector_cmp/vector_comparison.py +535 -0
msprobe/msprobe.py +101 -130
msprobe/overflow_check/__init__.py +15 -0
msprobe/{nan_analyze → overflow_check}/analyzer.py +38 -27
msprobe/{nan_analyze → overflow_check}/graph.py +28 -27
msprobe/{nan_analyze → overflow_check}/utils.py +15 -14
msprobe/pytorch/__init__.py +20 -14
msprobe/pytorch/aclgraph_dump/__init__.py +45 -0
msprobe/pytorch/aclgraph_dump/_meta.py +26 -0
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut.py → acc_check/acc_check.py} +50 -45
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut_utils.py → acc_check/acc_check_utils.py} +201 -30
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/data_generate.py +56 -16
msprobe/pytorch/api_accuracy_checker/{run_ut/multi_run_ut.py → acc_check/multi_acc_check.py} +32 -47
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/run_overflow_check.py +19 -18
msprobe/pytorch/api_accuracy_checker/common/config.py +22 -20
msprobe/pytorch/api_accuracy_checker/common/utils.py +72 -13
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +41 -11
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +23 -14
msprobe/pytorch/api_accuracy_checker/compare/compare.py +45 -32
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +12 -11
msprobe/pytorch/api_accuracy_checker/compare/compare_input.py +14 -12
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +14 -12
msprobe/pytorch/api_accuracy_checker/precision_standard/absolute_threshold.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/accumulative_error_compare.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/base_standard.py +21 -19
msprobe/pytorch/api_accuracy_checker/precision_standard/benchmark_compare.py +14 -13
msprobe/pytorch/api_accuracy_checker/precision_standard/binary_consistency.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_config.py +60 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_register.py +27 -16
msprobe/pytorch/api_accuracy_checker/precision_standard/thousandth_standard.py +13 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/ulp_compare.py +39 -18
msprobe/pytorch/bench_functions/__init__.py +12 -11
msprobe/pytorch/bench_functions/apply_adam.py +12 -11
msprobe/pytorch/bench_functions/apply_adam_w.py +12 -11
msprobe/pytorch/bench_functions/confusion_transpose.py +12 -11
msprobe/pytorch/bench_functions/fast_gelu.py +12 -11
msprobe/pytorch/bench_functions/group_norm_silu.py +12 -11
msprobe/pytorch/bench_functions/layer_norm_eval.py +12 -11
msprobe/pytorch/bench_functions/linear.py +12 -11
msprobe/pytorch/bench_functions/matmul_backward.py +12 -11
msprobe/pytorch/bench_functions/mish.py +12 -11
msprobe/pytorch/bench_functions/moe_gating_top_k_softmax.py +12 -11
msprobe/pytorch/bench_functions/npu_fusion_attention.py +12 -11
msprobe/pytorch/bench_functions/rms_norm.py +12 -11
msprobe/pytorch/bench_functions/rotary_mul.py +12 -11
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +12 -11
msprobe/pytorch/bench_functions/sort_v2.py +12 -11
msprobe/pytorch/bench_functions/swiglu.py +12 -11
msprobe/pytorch/common/__init__.py +12 -11
msprobe/pytorch/common/log.py +12 -11
msprobe/pytorch/common/parse_json.py +12 -11
msprobe/pytorch/common/utils.py +52 -19
msprobe/pytorch/compare/distributed_compare.py +13 -13
msprobe/pytorch/compare/match.py +12 -11
msprobe/pytorch/compare/pt_compare.py +14 -20
msprobe/pytorch/compare/pt_diff_analyze.py +12 -11
msprobe/pytorch/compare/utils.py +12 -11
msprobe/pytorch/{hook_module → dump/api_dump}/api_register.py +18 -16
msprobe/pytorch/{hook_module → dump/api_dump}/hook_module.py +14 -13
msprobe/pytorch/{hook_module → dump/api_dump}/pt_hook_manager.py +68 -23
msprobe/pytorch/{hook_module → dump/api_dump}/register_optimizer_hook.py +13 -11
msprobe/pytorch/{hook_module → dump/api_dump}/script_wrapper.py +17 -14
msprobe/pytorch/{hook_module → dump/api_dump}/utils.py +12 -11
msprobe/pytorch/{debugger → dump/debugger}/debugger_config.py +23 -38
msprobe/pytorch/dump/debugger/precision_debugger.py +130 -0
msprobe/pytorch/{function_factory.py → dump/function_factory.py} +12 -11
msprobe/pytorch/dump/module_dump/hook_wrapper.py +17 -13
msprobe/pytorch/dump/module_dump/module_dump.py +16 -15
msprobe/pytorch/dump/module_dump/{module_processer.py → module_processor.py} +54 -42
msprobe/pytorch/dump/pt_config.py +128 -0
msprobe/pytorch/{pytorch_service.py → dump/pytorch_service.py} +22 -21
msprobe/pytorch/monitor/csv2tb.py +13 -11
msprobe/pytorch/monitor/data_writers.py +13 -11
msprobe/pytorch/monitor/distributed/wrap_distributed.py +13 -11
msprobe/pytorch/monitor/features.py +12 -11
msprobe/pytorch/monitor/module_hook.py +67 -59
msprobe/pytorch/monitor/module_metric.py +13 -11
msprobe/pytorch/monitor/optimizer_collect.py +37 -35
msprobe/pytorch/monitor/utils.py +13 -11
msprobe/pytorch/monitor/visualizer.py +12 -11
msprobe/pytorch/torchair_dump/__init__.py +17 -0
msprobe/pytorch/torchair_dump/torchair_dump.py +114 -0
msprobe/scripts/atb/config_example.json +10 -0
msprobe/scripts/atb/load_atb_probe.sh +101 -0
msprobe/scripts/atb/unload_atb_probe.sh +27 -0
msprobe/scripts/build_msaccucmp.sh +186 -0
msprobe/scripts/conf/help.info +6 -0
msprobe/scripts/conf/version.info +3 -0
msprobe/scripts/run_script/common.sh +538 -0
msprobe/scripts/run_script/main_msaccucmp.sh +232 -0
msprobe/visualization/__init__.py +12 -11
msprobe/visualization/builder/__init__.py +12 -11
msprobe/visualization/builder/graph_builder.py +45 -30
msprobe/visualization/builder/graph_merger.py +53 -32
msprobe/visualization/builder/msprobe_adapter.py +34 -44
msprobe/visualization/compare/__init__.py +12 -11
msprobe/visualization/compare/graph_comparator.py +63 -51
msprobe/visualization/compare/mode_adapter.py +28 -113
msprobe/visualization/db_utils.py +133 -22
msprobe/visualization/graph/__init__.py +12 -11
msprobe/visualization/graph/base_node.py +15 -27
msprobe/visualization/graph/distributed_analyzer.py +97 -40
msprobe/visualization/graph/graph.py +14 -16
msprobe/visualization/graph/node_colors.py +34 -31
msprobe/visualization/graph/node_op.py +12 -11
msprobe/visualization/graph_service.py +580 -205
msprobe/visualization/utils.py +278 -31
tb_graph_ascend/secure_build.py +175 -0
tb_graph_ascend/server/__init__.py +15 -0
tb_graph_ascend/server/app/__init__.py +15 -0
tb_graph_ascend/server/app/model/__init__.py +15 -0
tb_graph_ascend/server/app/model/hierarchy.py +348 -0
tb_graph_ascend/server/app/model/layout_hierarchy_model.py +69 -0
tb_graph_ascend/server/app/model/match_nodes_model.py +573 -0
tb_graph_ascend/server/app/repositories/__init__.py +15 -0
tb_graph_ascend/server/app/repositories/graph_repo_base.py +32 -0
tb_graph_ascend/server/app/repositories/graph_repo_db.py +879 -0
tb_graph_ascend/server/app/repositories/graph_repo_vis.py +83 -0
tb_graph_ascend/server/app/service/__init__.py +18 -0
tb_graph_ascend/server/app/service/graph_service_base.py +158 -0
tb_graph_ascend/server/app/service/graph_service_db.py +438 -0
tb_graph_ascend/server/app/service/graph_service_factory.py +54 -0
tb_graph_ascend/server/app/service/graph_service_vis.py +480 -0
tb_graph_ascend/server/app/utils/__init__.py +15 -0
tb_graph_ascend/server/app/utils/constant.py +80 -0
tb_graph_ascend/server/app/utils/file_check_wrapper.py +46 -0
tb_graph_ascend/server/app/utils/global_state.py +95 -0
tb_graph_ascend/server/app/utils/graph_utils.py +661 -0
tb_graph_ascend/server/app/utils/i18n.py +153 -0
tb_graph_ascend/server/app/utils/request_method.py +46 -0
tb_graph_ascend/server/app/views/__init__.py +15 -0
tb_graph_ascend/server/app/views/graph_views.py +304 -0
tb_graph_ascend/server/plugin.py +108 -0
tb_graph_ascend/server/static/index.html +9250 -0
tb_graph_ascend/server/static/index.js +21 -0
tb_graph_ascend/setup.py +57 -0
mindstudio_probe-8.3.3.dist-info/LICENSE +0 -201
mindstudio_probe-8.3.3.dist-info/RECORD +0 -491
mindstudio_probe-8.3.3.dist-info/entry_points.txt +0 -2
mindstudio_probe-8.3.3.dist-info/top_level.txt +0 -1
msprobe/CMakeLists.txt +0 -5
msprobe/README.md +0 -203
msprobe/core/advisor/advisor.py +0 -129
msprobe/core/advisor/advisor_const.py +0 -58
msprobe/core/advisor/advisor_result.py +0 -58
msprobe/core/compare/find_first/data_processor.py +0 -35
msprobe/core/compare/highlight.py +0 -390
msprobe/core/data_dump/data_collector.py +0 -356
msprobe/core/grad_probe/constant.py +0 -90
msprobe/core/grad_probe/grad_compare.py +0 -187
msprobe/core/grad_probe/utils.py +0 -105
msprobe/core/kernel_dump/kernel_config.py +0 -33
msprobe/docs/01.installation.md +0 -250
msprobe/docs/02.config_introduction.md +0 -221
msprobe/docs/03.config_examples.md +0 -281
msprobe/docs/04.kernel_dump_PyTorch.md +0 -73
msprobe/docs/05.data_dump_PyTorch.md +0 -518
msprobe/docs/06.data_dump_MindSpore.md +0 -618
msprobe/docs/07.accuracy_checker_PyTorch.md +0 -310
msprobe/docs/09.accuracy_checker_MindSpore.md +0 -120
msprobe/docs/10.accuracy_compare_PyTorch.md +0 -637
msprobe/docs/11.accuracy_compare_MindSpore.md +0 -769
msprobe/docs/12.overflow_check_PyTorch.md +0 -82
msprobe/docs/13.overflow_check_MindSpore.md +0 -33
msprobe/docs/14.data_parse_PyTorch.md +0 -282
msprobe/docs/15.free_benchmarking_PyTorch.md +0 -169
msprobe/docs/16.free_benchmarking_MindSpore.md +0 -159
msprobe/docs/17.grad_probe.md +0 -205
msprobe/docs/18.online_dispatch.md +0 -89
msprobe/docs/19.monitor.md +0 -753
msprobe/docs/20.monitor_performance_baseline.md +0 -52
msprobe/docs/21.visualization_PyTorch.md +0 -519
msprobe/docs/22.visualization_MindSpore.md +0 -515
msprobe/docs/23.generate_operator_PyTorch.md +0 -107
msprobe/docs/24.code_mapping_Mindspore.md +0 -29
msprobe/docs/25.tool_function_introduction.md +0 -29
msprobe/docs/26.data_dump_PyTorch_baseline.md +0 -48
msprobe/docs/27.dump_json_instruction.md +0 -795
msprobe/docs/28.debugger_save_instruction.md +0 -288
msprobe/docs/28.kernel_dump_MindSpore.md +0 -69
msprobe/docs/29.data_dump_MSAdapter.md +0 -235
msprobe/docs/30.overflow_check_MSAdapter.md +0 -31
msprobe/docs/31.config_check.md +0 -107
msprobe/docs/32.ckpt_compare.md +0 -69
msprobe/docs/33.generate_operator_MindSpore.md +0 -181
msprobe/docs/34.RL_collect.md +0 -101
msprobe/docs/35.nan_analyze.md +0 -73
msprobe/docs/36.calculation_result_change.md +0 -75
msprobe/docs/FAQ.md +0 -232
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +0 -146
msprobe/docs/accuracy_checker_MindSpore/accuracy_checker_MindSpore_baseline.md +0 -14
msprobe/docs/data_dump_MindSpore/data_dump_MindSpore_baseline.md +0 -33
msprobe/docs/data_dump_MindSpore/dynamic_graph_quick_start_example.md +0 -217
msprobe/docs/img/BLOOM-7B_1.png +0 -0
msprobe/docs/img/BLOOM-7B_2.png +0 -0
msprobe/docs/img/BLOOM-7B_3.png +0 -0
msprobe/docs/img/BLOOM-7B_4.png +0 -0
msprobe/docs/img/GPT-3_1.png +0 -0
msprobe/docs/img/GPT-3_2.png +0 -0
msprobe/docs/img/GPT-3_3.png +0 -0
msprobe/docs/img/GPT-3_4.png +0 -0
msprobe/docs/img/GPT-3_5.png +0 -0
msprobe/docs/img/GPT-3_6.png +0 -0
msprobe/docs/img/GPT-3_7.png +0 -0
msprobe/docs/img/GPT-3_8.png +0 -0
msprobe/docs/img/YOLOV5S_1.png +0 -0
msprobe/docs/img/YOLOV5S_2.png +0 -0
msprobe/docs/img/accuracy_checking_details.png +0 -0
msprobe/docs/img/accuracy_checking_result.png +0 -0
msprobe/docs/img/api_precision_compare_details.png +0 -0
msprobe/docs/img/api_precision_compare_result.png +0 -0
msprobe/docs/img/auto_analyze_log.png +0 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/compare_result_pkl.png +0 -0
msprobe/docs/img/compare_result_pkl_md5.png.png +0 -0
msprobe/docs/img/cpu_info.png +0 -0
msprobe/docs/img/free_benchmark.png +0 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/grad_probe_image-1.png +0 -0
msprobe/docs/img/grad_probe_image-2.png +0 -0
msprobe/docs/img/grad_probe_image-3.png +0 -0
msprobe/docs/img/grad_probe_image-4.png +0 -0
msprobe/docs/img/grad_probe_image.png +0 -0
msprobe/docs/img/merge_result.png +0 -0
msprobe/docs/img/module_compare.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/docs/img/monitor/step_count_per_record.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/docs/img/save_compare_result_sample.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_ms.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_pt.png +0 -0
msprobe/docs/img/visualization/proxy.png +0 -0
msprobe/docs/img/visualization/tensorboard_1.png +0 -0
msprobe/docs/img/visualization/tensorboard_2.png +0 -0
msprobe/docs/img/visualization/vis_browser_1.png +0 -0
msprobe/docs/img/visualization/vis_browser_2.png +0 -0
msprobe/docs/img/visualization/vis_match_info.png +0 -0
msprobe/docs/img/visualization/vis_precision_info.png +0 -0
msprobe/docs/img/visualization/vis_search_info.png +0 -0
msprobe/docs/img/visualization/vis_show_info.png +0 -0
msprobe/docs/img/visualization/vis_showcase.png +0 -0
msprobe/docs/img/visualization/vis_unmatch_info.png +0 -0
msprobe/docs/visualization/GPTModel.png +0 -0
msprobe/docs/visualization/ParallelMLP.png +0 -0
msprobe/docs/visualization/layer_mapping_example.md +0 -132
msprobe/docs/visualization/mapping.png +0 -0
msprobe/docs/visualization/mapping1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/3.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/4.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/5.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/6.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/7.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory-qwen25vl.txt +0 -59
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed-mm-qwen25vl.txt +0 -80
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactory_mapping.md +0 -330
msprobe/docs/visualization/module_name.png +0 -0
msprobe/docs/visualization/module_name1.png +0 -0
msprobe/docs/visualization/no_mapping.png +0 -0
msprobe/docs/visualization/no_mapping1.png +0 -0
msprobe/docs/visualization/no_mapping_analyze.png +0 -0
msprobe/docs/visualization/top_layer.png +0 -0
msprobe/mindspore/api_accuracy_checker/generate_op_script/op_generator.py +0 -460
msprobe/mindspore/api_accuracy_checker/generate_op_script/operator_replication.template +0 -2081
msprobe/mindspore/code_mapping/bind.py +0 -283
msprobe/mindspore/code_mapping/cmd_parser.py +0 -40
msprobe/mindspore/code_mapping/graph.py +0 -49
msprobe/mindspore/code_mapping/graph_parser.py +0 -211
msprobe/mindspore/code_mapping/main.py +0 -24
msprobe/mindspore/code_mapping/processor.py +0 -34
msprobe/mindspore/dym_loader/hook_dynamic_loader.cpp +0 -111
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +0 -52
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +0 -257
msprobe/mindspore/free_benchmark/common/config.py +0 -27
msprobe/mindspore/free_benchmark/common/handler_params.py +0 -31
msprobe/mindspore/free_benchmark/common/utils.py +0 -100
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -638
msprobe/mindspore/free_benchmark/handler/base_handler.py +0 -105
msprobe/mindspore/free_benchmark/handler/check_handler.py +0 -55
msprobe/mindspore/free_benchmark/handler/fix_handler.py +0 -51
msprobe/mindspore/free_benchmark/handler/handler_factory.py +0 -36
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +0 -82
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +0 -45
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +0 -78
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +0 -77
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +0 -56
msprobe/mindspore/free_benchmark/perturbation/no_change.py +0 -27
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +0 -46
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +0 -51
msprobe/mindspore/grad_probe/global_context.py +0 -127
msprobe/mindspore/grad_probe/grad_analyzer.py +0 -260
msprobe/mindspore/grad_probe/grad_monitor.py +0 -42
msprobe/mindspore/grad_probe/grad_stat_csv.py +0 -161
msprobe/mindspore/grad_probe/hook.py +0 -115
msprobe/mindspore/grad_probe/utils.py +0 -43
msprobe/mindspore/mindtorch/__init__.py +0 -18
msprobe/mindspore/ms_config.py +0 -153
msprobe/mindspore/task_handler_factory.py +0 -44
msprobe/nan_analyze/__init__.py +0 -14
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +0 -9
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +0 -480
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +0 -567
msprobe/pytorch/debugger/precision_debugger.py +0 -181
msprobe/pytorch/free_benchmark/__init__.py +0 -23
msprobe/pytorch/free_benchmark/common/constant.py +0 -85
msprobe/pytorch/free_benchmark/common/counter.py +0 -87
msprobe/pytorch/free_benchmark/common/enums.py +0 -80
msprobe/pytorch/free_benchmark/common/params.py +0 -152
msprobe/pytorch/free_benchmark/common/utils.py +0 -143
msprobe/pytorch/free_benchmark/compare/grad_saver.py +0 -215
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +0 -121
msprobe/pytorch/free_benchmark/main.py +0 -123
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +0 -28
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +0 -56
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +0 -107
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +0 -121
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +0 -89
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +0 -87
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +0 -43
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +0 -60
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +0 -34
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +0 -252
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +0 -54
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +0 -40
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +0 -45
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +0 -181
msprobe/pytorch/grad_probe/__init__.py +0 -0
msprobe/pytorch/grad_probe/grad_monitor.py +0 -108
msprobe/pytorch/grad_probe/grad_stat_csv.py +0 -160
msprobe/pytorch/hook_module/__init__.py +0 -16
msprobe/pytorch/hook_module/wrap_aten.py +0 -111
msprobe/pytorch/online_dispatch/__init__.py +0 -19
msprobe/pytorch/online_dispatch/compare.py +0 -224
msprobe/pytorch/online_dispatch/dispatch.py +0 -332
msprobe/pytorch/online_dispatch/dump_compare.py +0 -179
msprobe/pytorch/online_dispatch/single_compare.py +0 -412
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +0 -58
msprobe/pytorch/online_dispatch/utils.py +0 -158
msprobe/pytorch/parse_tool/__init__.py +0 -0
msprobe/pytorch/parse_tool/cli.py +0 -31
msprobe/pytorch/parse_tool/lib/__init__.py +0 -0
msprobe/pytorch/parse_tool/lib/compare.py +0 -253
msprobe/pytorch/parse_tool/lib/config.py +0 -50
msprobe/pytorch/parse_tool/lib/file_desc.py +0 -45
msprobe/pytorch/parse_tool/lib/interactive_cli.py +0 -97
msprobe/pytorch/parse_tool/lib/parse_exception.py +0 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +0 -161
msprobe/pytorch/parse_tool/lib/utils.py +0 -299
msprobe/pytorch/parse_tool/lib/visualization.py +0 -85
msprobe/pytorch/pt_config.py +0 -299
/msprobe/core/{grad_probe → dump}/__init__.py +0 -0
/msprobe/{mindspore/code_mapping → core/dump/api_dump}/__init__.py +0 -0
/msprobe/{mindspore/debugger → core/dump/data_dump}/__init__.py +0 -0
/msprobe/{mindspore/exception_dump → core/dump/data_dump/data_processor}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark → core/dump/debugger}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark/common → core/dump/kernel_dump}/__init__.py +0 -0
/msprobe/mindspore/{free_benchmark/handler → dump/debugger}/__init__.py +0 -0
/msprobe/mindspore/{grad_probe → dump/dump_processor}/__init__.py +0 -0
/msprobe/mindspore/{overflow_check → dump/exception_dump}/__init__.py +0 -0
/msprobe/mindspore/{mindtorch → dump/mindtorch}/mindtorch_adaptor.py +0 -0
/msprobe/{pytorch/api_accuracy_checker/run_ut → mindspore/dump/overflow_check}/__init__.py +0 -0
/msprobe/{pytorch/debugger → mindspore/monitor}/__init__.py +0 -0
/msprobe/{pytorch/free_benchmark/common → msaccucmp}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/.keep +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers → api_accuracy_checker/acc_check}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/torch_ut_setting.json +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers/npu → dump/api_dump}/__init__.py +0 -0
/msprobe/pytorch/{hook_module → dump/api_dump}/support_wrap_ops.yaml +0 -0
/msprobe/pytorch/{free_benchmark/result_handlers → dump/debugger}/__init__.py +0 -0

msprobe/core/compare/acc_compare.py CHANGED Viewed

@@ -1,17 +1,18 @@
-# Copyright (c) 2024-2025, Huawei Technologies Co., Ltd.
-# All rights reserved.
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
 #
-# Licensed under the Apache License, Version 2.0  (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
 #
-# http://www.apache.org/licenses/LICENSE-2.0
+#          http://license.coscl.org.cn/MulanPSL2
 #
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
 import os
 import re
@@ -22,7 +23,6 @@ import numpy as np
 import pandas as pd
 from tqdm import tqdm
-from msprobe.core.advisor.advisor import Advisor
 from msprobe.core.common.const import CompareConst, Const
 from msprobe.core.common.exceptions import FileCheckException
 from msprobe.core.common.file_utils import load_json, remove_path, create_directory, save_excel, save_json
@@ -31,21 +31,19 @@ from msprobe.core.common.utils import CompareException, add_time_with_xlsx, chec
     set_dump_path, get_dump_mode, check_compare_param, load_stack_json, get_file_type, add_time_with_json
 from msprobe.core.compare.check import check_dump_json_str, check_stack_json_str, cross_dtype_mapping, \
     check_configuration_param
-from msprobe.core.compare.utils import merge_tensor, print_compare_ends_info, read_op, set_stack_json_path, \
-    reorder_index
+from msprobe.core.compare.utils import print_compare_ends_info, read_op, set_stack_json_path, reorder_index
 from msprobe.core.compare.config import ModeConfig, MappingConfig, MappingDict
 from msprobe.core.compare.multiprocessing_compute import CompareRealData
-from msprobe.core.compare.highlight import HighLight
 from msprobe.core.compare.diff_analyze.first_diff_analyze import FirstDiffAnalyze
+from msprobe.core.compare.indicator_analysis.calculator import calculate_excel_result_df
+from msprobe.core.compare.stats_diff_calc import ValType, ALL_TYPES
 @dataclass
 class ComparisonConfig:
     dump_mode: str
     stack_mode: bool
-    auto_analyze: bool
     fuzzy_match: bool
-    highlight: bool
     data_mapping: dict
     suffix: str
     cell_mapping: dict
@@ -107,13 +105,16 @@ class Comparator:
         file_path = self.process_output_file(output_path, suffix, self.mode_config.compared_file_type)
         # initialize the compare result table and compare general data(name, dtype, shape, statistics/md5, etc.)
-        npu_json = input_param.get("npu_json_path")
-        bench_json = input_param.get("bench_json_path")
-        stack_json = input_param.get("stack_json_path")
+        npu_json = input_param.get("npu_path")
+        bench_json = input_param.get("bench_path")
+        stack_json = input_param.get("stack_path")
         parse_data = ParseData(self.mode_config, rank)  # load and parse json data
         npu_df, bench_df = parse_data.parse([npu_json, bench_json, stack_json])
+        logger.info("Matching APIs/Modules in progress...")
         result_df = self.compare_statistics(npu_df, bench_df)
-        if not result_df.values.tolist():
+        logger.info("APIs/Modules match done.")
+        if result_df.empty:
             logger.warning("Can`t match any op. No compare result file generated.")
             return
@@ -132,28 +133,21 @@ class Comparator:
         # compare real data
         if self.mode_config.dump_mode == Const.ALL:
+            logger.info("Compare real data in progress...")
             compare_real_data = CompareRealData(self.file_reader, self.mode_config, self.cross_frame)
             result_df = compare_real_data.do_multi_process(input_param, result_df)
+            logger.info("Compare real data done.")
-        # save result excel file
-        logger.info(f'Saving result excel file in progress. The file path is: {file_path}.')
-        if self.mode_config.highlight and len(result_df) <= CompareConst.MAX_EXCEL_LENGTH:
-            # highlight if not too long
-            highlight_dict = {"red_rows": set(), "yellow_rows": set(), "red_lines": [], "yellow_lines": []}
-            highlight = HighLight(self.mode_config, rank)
-            if self.mode_config.compared_file_type == Const.DUMP_JSON_FILE:
-                highlight.find_compare_result_error_rows(result_df, highlight_dict)
-            result_df.drop(columns=['state', 'api_origin_name'], inplace=True)  # 删除中间数据，两列不落盘
-            highlight.highlight_rows_xlsx(result_df, highlight_dict, file_path)
-        else:
-            # fallback to simple save without highlight
-            result_df.drop(columns=['state', 'api_origin_name'], inplace=True)  # 删除中间数据，两列不落盘
-            save_excel(file_path, result_df)
+        # calculate Indicators
+        logger.info("Calculating comparison indicators in progress...")
+        calculate_excel_result_df(result_df, self.mode_config.dump_mode)
+        result_df.drop(columns=['state', 'api_origin_name'], inplace=True)  # 删除中间数据，两列不落盘
+        logger.info("Comparison indicators calculation done.")
-        # output compare analysis suggestions
-        if self.mode_config.auto_analyze:
-            advisor = Advisor(result_df, output_path, suffix)
-            advisor.analysis()
+        # save result excel file
+        logger.info("Saving result excel file in progress...")
+        logger.info(f"The result excel file path is: {file_path}.")
+        save_excel(file_path, result_df)
         print_compare_ends_info()
@@ -164,6 +158,10 @@ class Comparator:
         # create new columns for compare op_name and shape
         # process npu_df's COMPARE_KEY whether same or different framework
         process_df = ProcessDf(self.mode_config, self.mapping_config, self.mapping_dict)
+        # 处理重计算对应的backward的序号。反向重计算序号调整属于精确匹配，与模糊匹配互斥。
+        if not self.mode_config.fuzzy_match:
+            npu_df = process_df.update_backward_call(npu_df)
+            bench_df = process_df.update_backward_call(bench_df)
         npu_df, bench_df = process_df.process_compare_key_and_shape(npu_df, bench_df)
         # match npu and bench, match_result contains both npu_info and bench_info
@@ -190,6 +188,33 @@ class ParseData:
         self.mode_config = mode_config
         self.rank = rank
+    @staticmethod
+    def get_direction_and_call_direction(data_name):
+        parts = data_name.split(Const.SEP)
+        if len(parts) < 2:
+            return None, None
+        last = parts[-1]
+        second_last = parts[-2]
+        # direction 判断
+        if Const.BACKWARD in (last, second_last):
+            direction = Const.BACKWARD
+        elif Const.FORWARD in (last, second_last):
+            direction = Const.FORWARD
+        else:
+            return None, None
+        # call_direction 永远取最后两个
+        call_direction = Const.SEP.join((second_last, last))
+        return direction, call_direction
+    @staticmethod
+    def get_op_no_number(data_name):
+        parts = data_name.split(Const.SEP)
+        return Const.SEP.join(parts[:-2]) if len(parts) > 2 else ''
     def parse(self, file_list):
         npu_json_path, bench_json_path, stack_json_path = file_list
         npu_json_data = load_json(npu_json_path)
@@ -202,7 +227,7 @@ class ParseData:
         return npu_df, bench_df
-    def gen_data_df(self, data_json, stack_json_data, device: str):
+    def init_result(self):
         result = {
             CompareConst.OP_NAME: [],
             Const.DTYPE: [],
@@ -211,57 +236,90 @@ class ParseData:
             Const.STACK_INFO: [],
             Const.STATE: [],
             Const.API_ORIGIN_NAME: [],
-            Const.REQ_GRAD: []
+            Const.REQ_GRAD: [],
+            Const.DIRECTION: [],  # 目前三种选择：'forward', 'backward', None
+            Const.CALL_DIRECTION: [],
+            Const.OP_NO_NUMBER: [],  # 删除调用序号
+            Const.BACKWARD_CALL_ORDER: [],  # 计算op反向调用顺序，初始化为0
+            Const.SUFFIX: []
         }
         if self.mode_config.dump_mode == Const.ALL:
             result[Const.DATA_NAME] = []
         elif self.mode_config.dump_mode == Const.MD5:
             result[Const.MD5] = []
+        return result
+    def create_progress_bar(self, api_nums: int, device: str):
+        desc = f'{device} API/Module Read Progress'
+        if self.rank:
+            desc = f'[{self.rank}]' + desc
+        return tqdm(total=api_nums, desc=desc, unit="api/module", ncols=100)
+    def gen_data_df(self, data_json, stack_json_data, device: str):
+        result = self.init_result()
+        op_backward_count = defaultdict(int)  # 记录backward调用次数，用于后续调用序更新
         apis_data = data_json.get('data', None)
         if not apis_data:
             logger.warning('No APIs found in dump.json.')
             return pd.DataFrame(result)
-        api_nums = len(apis_data)
-        default_bar_desc = f'{device} API/Module Read Progress'
-        bar_desc_add_rank = f'[{self.rank}]' + default_bar_desc if self.rank else default_bar_desc
-        progress_bar = tqdm(total=api_nums, desc=bar_desc_add_rank, unit="api/module", ncols=100)
+        progress_bar = self.create_progress_bar(len(apis_data), device)
         # 从json中循环解析API数据，遍历所有API
         for data_name in apis_data:
             check_op_str_pattern_valid(data_name)
             op_parsed_list = self.gen_merge_list(data_json, data_name, stack_json_data)
             if not op_parsed_list:
+                progress_bar.update(1)
+                continue
+            op_no_number = self.get_op_no_number(data_name)
+            if op_no_number == '':
+                progress_bar.update(1)
                 continue
+            direction, call_direction = self.get_direction_and_call_direction(data_name)
+            backward_call_order = op_backward_count.get(op_no_number, 0)
+            if direction == Const.BACKWARD:
+                op_backward_count[op_no_number] += 1
             reordered_index_list = reorder_index(op_parsed_list)
+            stack_info = op_parsed_list[-1].get('full_info') if self.mode_config.stack_mode else None
             for i, index in enumerate(reordered_index_list):
                 op_item = op_parsed_list[index]
+                summary_data = [
+                    str(op_item.get(key)) if op_item.get(key) is None else op_item.get(key)
+                    for key in Const.SUMMARY_METRICS_LIST
+                ]
+                full_op_name = op_item.get(Const.FULL_OP_NAME)
+                suffix = full_op_name.replace(data_name, '')
                 # common key
-                result[CompareConst.OP_NAME].append(op_item.get('full_op_name'))
+                result[CompareConst.OP_NAME].append(full_op_name)
                 result[Const.DTYPE].append(op_item.get(Const.DTYPE))
                 result[Const.SHAPE].append(op_item.get(Const.SHAPE))
                 result[Const.STATE].append(op_item.get(Const.STATE))
                 result[Const.REQ_GRAD].append(op_item.get(Const.REQ_GRAD))
                 result[Const.API_ORIGIN_NAME].append(data_name)
-                summary_data = [
-                    str(op_item.get(key)) if op_item.get(key) is None else op_item.get(key)
-                    for key in Const.SUMMARY_METRICS_LIST
-                ]
                 result[Const.SUMMARY].append(summary_data)
+                result[Const.DIRECTION].append(direction)
+                result[Const.CALL_DIRECTION].append(call_direction)
+                result[Const.OP_NO_NUMBER].append(op_no_number)
+                result[Const.BACKWARD_CALL_ORDER].append(backward_call_order)
+                result[Const.SUFFIX].append(suffix)
                 # dump_mode differ key
                 if self.mode_config.dump_mode == Const.MD5:
-                    result[Const.MD5].append(op_parsed_list[index].get(Const.MD5))
+                    result[Const.MD5].append(op_item.get(Const.MD5))
                 if self.mode_config.dump_mode == Const.ALL:
                     result[Const.DATA_NAME].append(op_item.get(Const.DATA_NAME))
                 # mode_config stack_mode addition key
-                if i == 0 and self.mode_config.stack_mode:
-                    result[Const.STACK_INFO].append(op_parsed_list[-1].get('full_info'))
-                else:
-                    result[Const.STACK_INFO].append(None)
+                result[Const.STACK_INFO].append(stack_info if i == 0 else None)
                 # mode_config first_diff_analyze addition key
                 if self.mode_config.first_diff_analyze:
@@ -307,10 +365,64 @@ class ProcessDf:
             raise CompareException(CompareException.INDEX_OUT_OF_BOUNDS_ERROR) from error
         return api_name
+    @staticmethod
+    def update_backward_call(cmp_df):
+        # ===============================
+        # Step 1: 拆 call_direction 的两部分
+        # ===============================
+        cd_parts = cmp_df[Const.CALL_DIRECTION].str.rsplit(Const.SEP, n=1, expand=True)
+        cd_parts.columns = ["cd_head", "cd_tail"]
+        head_is_digit = cd_parts["cd_head"].str.isdigit()
+        tail_is_digit = cd_parts["cd_tail"].str.isdigit()
+        is_backward = cmp_df[Const.DIRECTION] == Const.BACKWARD
+        # ===============================
+        # Step 2: 矢量化替换 backward_call_order
+        # ===============================
+        mask_head = is_backward & head_is_digit
+        mask_tail = is_backward & tail_is_digit
+        update_mask = mask_head | mask_tail
+        cd_parts.loc[mask_head, "cd_head"] = (
+            cmp_df.loc[mask_head, Const.BACKWARD_CALL_ORDER].astype(str)
+        )
+        cd_parts.loc[mask_tail, "cd_tail"] = (
+            cmp_df.loc[mask_tail, Const.BACKWARD_CALL_ORDER].astype(str)
+        )
+        # 只更新需要更新的 call_direction
+        cmp_df.loc[update_mask, Const.CALL_DIRECTION] = (
+                cd_parts.loc[update_mask, "cd_head"]
+                + Const.SEP
+                + cd_parts.loc[update_mask, "cd_tail"]
+        )
+        # ===============================
+        # Step 3: 初始化 + 局部更新 OP_NAME_UPDATE
+        # ===============================
+        # 默认保持原值
+        cmp_df[CompareConst.OP_NAME_UPDATE] = cmp_df[CompareConst.OP_NAME]
+        # 只更新命中的行
+        cmp_df.loc[update_mask, CompareConst.OP_NAME_UPDATE] = (
+                cmp_df.loc[update_mask, Const.OP_NO_NUMBER]
+                + Const.SEP
+                + cmp_df.loc[update_mask, Const.CALL_DIRECTION]
+                + cmp_df.loc[update_mask, Const.SUFFIX]
+        )
+        return cmp_df
     def process_compare_key_and_shape(self, npu_df, bench_df):
         npu_df = self.assign_npu_df_compare_key(npu_df, bench_df)
         npu_df[CompareConst.CMP_SHAPE] = npu_df[Const.SHAPE]
-        bench_df[CompareConst.CMP_KEY] = bench_df[CompareConst.OP_NAME]
+        bench_cmp_key = (
+            bench_df[CompareConst.OP_NAME_UPDATE]
+            if not self.mode_config.fuzzy_match
+            else bench_df[CompareConst.OP_NAME]
+        )
+        bench_df[CompareConst.CMP_KEY] = bench_cmp_key
         bench_df[CompareConst.CMP_SHAPE] = bench_df[Const.SHAPE]
         return npu_df, bench_df
@@ -336,7 +448,12 @@ class ProcessDf:
         elif self.mapping_config.data_mapping:
             npu_df[CompareConst.CMP_KEY] = npu_df[CompareConst.OP_NAME].apply(self.process_data_mapping)
         else:
-            npu_df[CompareConst.CMP_KEY] = npu_df[CompareConst.OP_NAME]
+            cmp_key = (
+                npu_df[CompareConst.OP_NAME_UPDATE]
+                if not self.mode_config.fuzzy_match
+                else npu_df[CompareConst.OP_NAME]
+            )
+            npu_df[CompareConst.CMP_KEY] = cmp_key
         return npu_df
     def process_internal_api_mapping(self, npu_op_name):
@@ -427,9 +544,22 @@ class ProcessDf:
         if self.mapping_dict.cell_mapping_dict:
             # get cell name & class name from op_name
             # Cell.fc1.Dense.forward.0.input.0
+            # npu_op_name.split(Const.SEP, 1)[-1] 表示Module或Cell字段后面的部分
             cell_name = re.split(r'\.(?:forward|backward|parameters_grad)\.', npu_op_name.split(Const.SEP, 1)[-1])[0]
+            # 1. 精确整段匹配（保持原行为）
             if cell_name in self.mapping_dict.cell_mapping_dict:
-                npu_op_name = npu_op_name.replace(cell_name, self.mapping_dict.cell_mapping_dict[cell_name], 1)
+                new_cell_name = self.mapping_dict.cell_mapping_dict[cell_name]
+            # 2. 兜底：简单字符串替换（不做任何限制）
+            else:
+                new_cell_name = cell_name
+                for target_name, golden_name in self.mapping_dict.cell_mapping_dict.items():
+                    if target_name in new_cell_name:
+                        new_cell_name = new_cell_name.replace(target_name, golden_name, 1)
+            # 3. 应用替换
+            if new_cell_name != cell_name:
+                npu_op_name = npu_op_name.replace(cell_name, new_cell_name, 1)
         return npu_op_name
     def process_data_mapping(self, npu_op_name):
@@ -482,8 +612,7 @@ class Match:
     def check_op_item(self, npu_op_item, bench_op_item):
         name_match = self.rename_api(npu_op_item[CompareConst.CMP_KEY]) == self.rename_api(
             bench_op_item[CompareConst.CMP_KEY])
-        shape_match = npu_op_item[CompareConst.CMP_SHAPE] == bench_op_item[CompareConst.CMP_SHAPE]
-        if name_match and shape_match:
+        if name_match:
             return True
         else:
             npu_op_name = npu_op_item[CompareConst.OP_NAME]
@@ -507,9 +636,13 @@ class Match:
             match_result = match_result.sort_values(CompareConst.OP_NAME_X).reset_index(drop=True)
             match_result[CompareConst.OP_NAME_X] = match_result[CompareConst.OP_NAME_X].astype('object')
         elif not self.mode_config.fuzzy_match:
-            match_result = pd.merge(npu_df, bench_df, on=[CompareConst.CMP_KEY, CompareConst.CMP_SHAPE],
+            match_result = pd.merge(npu_df, bench_df, on=[CompareConst.CMP_KEY],
                                     how='outer')
         else:
+            drop_list = [Const.DIRECTION, Const.CALL_DIRECTION, Const.OP_NO_NUMBER, Const.BACKWARD_CALL_ORDER,
+                         Const.SUFFIX]
+            npu_df.drop(columns=drop_list, inplace=True)
+            bench_df.drop(columns=drop_list, inplace=True)
             match_result = self.process_fuzzy_match(npu_df, bench_df)
         return match_result
@@ -675,52 +808,187 @@ class CreateTable:
 class CalcStatsDiff:
     def __init__(self, mode_config: ModeConfig):
         self.mode_config = mode_config
+        self.rules = None
+        self.build_rules()
+        self.DEFAULT_RULE = self.static_diff(CompareConst.N_A)
     @staticmethod
-    def type_check(val):
+    def is_same_value(a: pd.Series, b: pd.Series) -> pd.Series:
         """
-        检查是否为数值或字符串形式的nan, 如果是返回True
+        检查是否相等
+        """
+        return a.astype(str).eq(b.astype(str))
+    @staticmethod
+    def is_number(val: pd.Series) -> pd.Series:
+        """
+        检查是否为有效的数值，并排除布尔类型
         """
-        check_series = pd.Series(False, index=val.index)
         val_str = val.astype(str)
-        check_series[pd.to_numeric(val_str, errors='coerce').notna() | val_str.str.lower().eq('nan')] = True
-        return check_series
+        mask_bool = val_str.str.lower().eq('true') | val_str.str.lower().eq('false')
+        mask_numeric = pd.to_numeric(val, errors='coerce').notna()
+        return mask_numeric & ~mask_bool
+    @staticmethod
+    def is_nan(val: pd.Series) -> pd.Series:
+        """
+        检查是否为字符串形式的 'nan' (包括大小写) 或实际的 NaN
+        """
+        val_str = val.astype(str)
+        return val.isna() | val_str.str.lower().eq('nan')
+    @staticmethod
+    def is_inf(val: pd.Series) -> pd.Series:
+        """
+        检查是否为正无穷 (inf)
+        """
+        val_str = val.astype(str)
+        return (val == np.inf) | val_str.str.lower().eq('inf')
+    @staticmethod
+    def is_neg_inf(val: pd.Series) -> pd.Series:
+        """
+        检查是否为负无穷 (-inf)
+        """
+        val_str = val.astype(str)
+        return (val == -np.inf) | val_str.str.lower().eq('-inf')
+    @staticmethod
+    def is_device(val: pd.Series) -> pd.Series:
+        """
+        检查是否包含 'npu', 'cpu' 或 'cuda' 字符串
+        """
+        return val.astype(str).str.contains('npu|cpu|cuda', case=False, na=False)
+    @staticmethod
+    def is_na(val: pd.Series) -> pd.Series:
+        """
+        检查是否为 N/A
+        """
+        return val.astype(str).eq(CompareConst.N_A)
+    @staticmethod
+    def rule_num_num(npu_num: pd.Series, bench_num: pd.Series):
+        diff = npu_num - bench_num
+        rel = pd.Series(CompareConst.INF, index=diff.index)
+        mask_nonzero = bench_num != 0
+        rel.loc[mask_nonzero] = (diff[mask_nonzero] / bench_num[mask_nonzero] * 100).abs().astype(str) + "%"
+        return diff, rel
+    @staticmethod
+    def static_diff(diff: str, rel=None):
+        if rel is None:
+            rel = diff
+        return diff, rel
     @staticmethod
     def get_number(val):
         return pd.to_numeric(val.astype(str), errors='coerce')
-    def calc_summary_diff(self, result_df, cond_no_bench, stats_index: str):
+    def build_rules(self):
+        """
+        创建npu、bench不相等规则
+        """
+        # NUM × NUM
+        self.rules = {(ValType.NUM, ValType.NUM): self.rule_num_num}
+        # ---------- NAN 规则 ----------
+        nan_rule = self.static_diff(CompareConst.NAN)
+        nan_range = {ValType.NUM, ValType.NAN, ValType.INF, ValType.NEG_INF}
+        for t in nan_range:
+            self.rules[(ValType.NAN, t)] = nan_rule
+            self.rules[(t, ValType.NAN)] = nan_rule
+        # ---------- INF / -INF 规则 ----------
+        pos_inf = self.static_diff(CompareConst.INF)
+        neg_inf = self.static_diff(CompareConst.NEG_INF)
+        # INF / -INF 在左
+        for r in (ValType.NUM, ValType.NEG_INF):
+            self.rules[(ValType.INF, r)] = pos_inf
+        for r in (ValType.NUM, ValType.INF):
+            self.rules[(ValType.NEG_INF, r)] = neg_inf
+        # INF / -INF 在右
+        self.rules[(ValType.NUM, ValType.INF)] = neg_inf
+        self.rules[(ValType.NUM, ValType.NEG_INF)] = pos_inf
+        # ---------- N/A 规则 ----------
+        na_rule = self.static_diff(CompareConst.N_A)
+        na_range = {ValType.NUM, ValType.NAN, ValType.INF, ValType.NEG_INF, ValType.DEVICE, ValType.NA, ValType.OTHER}
+        for t in na_range:
+            self.rules[(ValType.NA, t)] = na_rule
+            self.rules[(t, ValType.NA)] = na_rule
+        # ---------- DEVICE / OTHER 规则 ----------
+        # 给diff，都是device给N/A
+        diff_rule = self.static_diff(CompareConst.DIFF_FLAG)
+        diff_range = {ValType.NUM, ValType.NAN, ValType.INF, ValType.NEG_INF, ValType.DEVICE, ValType.OTHER}
+        for t in diff_range:
+            self.rules[(ValType.DEVICE, t)] = diff_rule
+            self.rules[(t, ValType.DEVICE)] = diff_rule
+            self.rules[(ValType.OTHER, t)] = diff_rule
+            self.rules[(t, ValType.OTHER)] = diff_rule
+        self.rules[(ValType.DEVICE, ValType.DEVICE)] = na_rule
+    def classify(self, val: pd.Series) -> pd.Series:
+        result_values = np.select(
+            [
+                self.is_nan(val),
+                self.is_inf(val),
+                self.is_neg_inf(val),
+                self.is_number(val),  # 'inf', '-inf'会被pandas认为是number，所以放在inf/-inf判断后面
+                self.is_device(val),
+                self.is_na(val),
+            ],
+            [
+                ValType.NAN.value,
+                ValType.INF.value,
+                ValType.NEG_INF.value,
+                ValType.NUM.value,
+                ValType.DEVICE.value,
+                ValType.NA.value,
+            ],
+            default=ValType.OTHER.value,
+        )
+        val_to_enum = {t.value: t for t in ValType}
+        result_series = pd.Series(result_values, index=val.index).map(val_to_enum)
+        return result_series
+    def calc_summary_diff(self, result_df, stats_index: str):
         npu_val = result_df['NPU ' + stats_index]
         bench_val = result_df['Bench ' + stats_index]
         diff_name = stats_index.capitalize() + ' diff'
         rel_err_name = ('norm' if stats_index == 'l2norm' else stats_index).capitalize() + 'RelativeErr'
-        # npu、bench中统计量均为数字或nan
-        cond_num_nan = self.type_check(npu_val) & self.type_check(bench_val)
+        # ---------------------- 初始化 ----------------------
+        result_df[[diff_name, rel_err_name]] = CompareConst.N_A
-        # 如果统计量不是数字或nan，就赋值统计量差异为N/A
-        result_df.loc[~cond_num_nan, [diff_name, rel_err_name]] = CompareConst.N_A
-        cond_valid_stat = ~cond_no_bench & cond_num_nan  # 有效统计条件：bench_name不是N/A，并且NPU和bench的统计量都是数字或nan
-        result_df.loc[cond_valid_stat, diff_name] = self.get_number(npu_val) - self.get_number(bench_val)
+        # ---------------------- 基础 mask ----------------------
+        npu_num = self.get_number(npu_val)
+        bench_num = self.get_number(bench_val)
+        mask_equal = self.is_same_value(npu_val, bench_val)
+        mask_unequal = ~mask_equal
-        cond_diff_nan = result_df[diff_name].isna()  # 统计量差异是nan
-        cond_nan_diff = cond_valid_stat & cond_diff_nan
-        result_df.loc[cond_nan_diff, [diff_name, rel_err_name]] = CompareConst.NAN
+        # ---------------------- npu, bench统计量相等 ----------------------
+        result_df.loc[mask_equal, [diff_name, rel_err_name]] = 0
-        cond_not_nan_diff = cond_valid_stat & ~cond_diff_nan
-        condition_pt_zero = self.get_number(bench_val) == 0
-        result_df.loc[cond_not_nan_diff & condition_pt_zero, rel_err_name] = CompareConst.N_A
+        # ---------------------- npu, bench统计量不相等 ----------------------
+        npu_type = self.classify(npu_val)
+        bench_type = self.classify(bench_val)
+        for t1 in ALL_TYPES:
+            for t2 in ALL_TYPES:
+                mask = mask_unequal & (npu_type == t1) & (bench_type == t2)
+                if not mask.any():
+                    continue
-        # 相对误差转成百分比字符串
-        cond_ref_err = cond_not_nan_diff & ~condition_pt_zero
-        result_df.loc[cond_ref_err, rel_err_name] = (
-                result_df.loc[cond_ref_err, diff_name] / bench_val[cond_ref_err].astype(float) * 100)
-        result_df.loc[cond_ref_err, rel_err_name] = (result_df.loc[cond_ref_err, rel_err_name].abs().astype(str) + '%')
+                rule = self.rules.get((t1, t2), self.DEFAULT_RULE)
-        magnitude = self.get_number(result_df[diff_name]).abs() / (pd.Series(
-            np.maximum(self.get_number(npu_val), self.get_number(bench_val))).abs() + CompareConst.EPSILON)
-        return magnitude > CompareConst.MAGNITUDE
+                if callable(rule):
+                    diff, rel = rule(npu_num[mask], bench_num[mask])
+                else:
+                    diff, rel = rule
+                result_df.loc[mask, diff_name] = diff
+                result_df.loc[mask, rel_err_name] = rel
     def calc_accuracy(self, result_df, header):
         # bench name N/A represents no bench data, err_msg adds "No bench data matched."
@@ -734,14 +1002,9 @@ class CalcStatsDiff:
             result_df.loc[condition_md5_equal, CompareConst.RESULT] = CompareConst.PASS
             result_df.loc[~condition_md5_equal & ~condition_no_bench, CompareConst.RESULT] = CompareConst.DIFF
         elif self.mode_config.first_diff_analyze or self.mode_config.dump_mode == Const.SUMMARY:
-            warning_list = [
-                self.calc_summary_diff(result_df, condition_no_bench, stats_index)
-                for stats_index in ['max', 'min', 'mean', 'l2norm']
-            ]
-            warning_flag = pd.DataFrame(warning_list).any()
+            for stats_index in ['max', 'min', 'mean', 'l2norm']:
+                self.calc_summary_diff(result_df, stats_index)
             result_df.loc[~condition_no_bench, [CompareConst.RESULT, CompareConst.ERROR_MESSAGE]] = ''
-            result_df.loc[warning_flag, CompareConst.RESULT] = CompareConst.WARNING
-            result_df.loc[warning_flag, CompareConst.ERROR_MESSAGE] = 'Need double check api accuracy. '
             result_df.loc[~condition_req_grad_consist, CompareConst.ERROR_MESSAGE] += 'Requires_grad inconsistent. '
         else:
             fill_cols = [CompareConst.COSINE, CompareConst.EUC_DIST,
@@ -749,7 +1012,6 @@ class CalcStatsDiff:
                          CompareConst.ONE_THOUSANDTH_ERR_RATIO, CompareConst.FIVE_THOUSANDTHS_ERR_RATIO,
                          CompareConst.ERROR_MESSAGE]
             result_df.loc[~condition_no_bench, fill_cols] = ''  # 默认填充'', df默认省缺值为nan，不便后续处理，容易出现意外情况
-            result_df.loc[~condition_no_bench, CompareConst.ACCURACY] = CompareConst.ACCURACY_CHECK_YES
             result_df.loc[~condition_req_grad_consist, CompareConst.ERROR_MESSAGE] = 'Requires_grad inconsistent. '
         return result_df[header]
@@ -761,9 +1023,7 @@ def setup_comparison(input_param, output_path, **kwargs) -> ComparisonConfig:
         config = ComparisonConfig(
             dump_mode='',
             stack_mode=False,
-            auto_analyze=kwargs.get('auto_analyze', True),
             fuzzy_match=kwargs.get('fuzzy_match', False),
-            highlight=kwargs.get('highlight', False),
             data_mapping=kwargs.get('data_mapping', {}),
             suffix=kwargs.get('suffix', ''),
             cell_mapping=kwargs.get('cell_mapping', {}),
@@ -771,18 +1031,15 @@ def setup_comparison(input_param, output_path, **kwargs) -> ComparisonConfig:
             layer_mapping=kwargs.get('layer_mapping', {}),
             first_diff_analyze=kwargs.get('first_diff_analyze', False),
             compared_file_type='',
-            is_print_compare_log=input_param.get('is_print_compare_log', True)
+            is_print_compare_log=kwargs.get('is_print_compare_log', False)
         )
         set_dump_path(input_param)
         config.dump_mode = get_dump_mode(input_param)
-        config.compared_file_type = get_file_type(input_param.get("npu_json_path", None))
+        config.compared_file_type = get_file_type(input_param.get("npu_path", None))
-        # set stack_mode and set "stack_json_path" in input_param
-        if 'stack_json_path' in input_param:
-            config.stack_mode = kwargs.get('stack_mode', False)
-        else:
-            config.stack_mode = set_stack_json_path(input_param)
+        # set stack_mode and set "stack_path" in input_param
+        config.stack_mode, input_param = set_stack_json_path(input_param)
         check_configuration_param(config)
         create_directory(output_path)

mindstudio-probe 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

mindstudio-probe 8.3.3py3-none-any.whl → 26.0.0a1py3-none-any.whl