PyPI - mindstudio-probe - Versions diffs - 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl - Mend

mindstudio-probe 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (689)

{mindstudio_probe-8.3.3.dist-info → mindstudio_probe-26.0.0a1.dist-info}/METADATA +26 -14
mindstudio_probe-26.0.0a1.dist-info/RECORD +498 -0
{mindstudio_probe-8.3.3.dist-info → mindstudio_probe-26.0.0a1.dist-info}/WHEEL +1 -1
mindstudio_probe-26.0.0a1.dist-info/entry_points.txt +5 -0
mindstudio_probe-26.0.0a1.dist-info/licenses/LICENSE +124 -0
mindstudio_probe-26.0.0a1.dist-info/top_level.txt +2 -0
msprobe/__init__.py +12 -13
msprobe/config.json +9 -31
msprobe/core/__init__.py +12 -11
msprobe/core/acc_check/acc_check_cli.py +145 -0
msprobe/core/common/const.py +97 -38
msprobe/core/common/db_manager.py +133 -12
msprobe/core/common/decorator.py +12 -11
msprobe/core/common/exceptions.py +12 -11
msprobe/core/common/file_utils.py +101 -25
msprobe/core/common/framework_adapter.py +36 -25
msprobe/core/common/global_lock.py +12 -11
msprobe/core/common/inplace_op_checker.py +12 -11
msprobe/core/common/log.py +22 -11
msprobe/core/common/megatron_utils.py +566 -11
msprobe/core/common/parallel_state.py +12 -11
msprobe/core/common/runtime.py +12 -11
msprobe/core/common/utils.py +41 -41
msprobe/core/compare/acc_compare.py +361 -104
msprobe/core/compare/atb_data_compare.py +422 -0
msprobe/core/compare/auto_compare.py +134 -0
msprobe/core/compare/check.py +14 -17
msprobe/core/compare/compare_cli.py +72 -149
msprobe/core/compare/config.py +12 -13
msprobe/core/compare/diff_analyze/first_diff_analyze.py +28 -15
msprobe/core/compare/diff_analyze/ignore_op_list.yaml +3 -0
msprobe/core/compare/find_first/analyzer.py +18 -18
msprobe/core/compare/find_first/graph.py +12 -11
msprobe/core/compare/find_first/utils.py +13 -12
msprobe/core/compare/indicator_analysis/__init__.py +15 -0
msprobe/core/compare/indicator_analysis/algorithm.py +363 -0
msprobe/core/compare/indicator_analysis/api_data.py +141 -0
msprobe/core/compare/indicator_analysis/calculator.py +181 -0
msprobe/core/compare/indicator_analysis/utils.py +116 -0
msprobe/core/compare/layer_mapping/__init__.py +12 -11
msprobe/core/compare/layer_mapping/data_scope_parser.py +20 -11
msprobe/core/compare/layer_mapping/layer_mapping.py +14 -13
msprobe/core/compare/layer_mapping/postprocess_pass.py +13 -11
msprobe/core/compare/merge_result/merge_result.py +12 -11
msprobe/core/compare/merge_result/merge_result_cli.py +12 -11
msprobe/core/compare/merge_result/utils.py +12 -11
msprobe/core/compare/multiprocessing_compute.py +13 -14
msprobe/core/compare/npy_compare.py +13 -11
msprobe/core/compare/offline_data_compare.py +160 -0
msprobe/core/compare/stats_diff_calc.py +39 -0
msprobe/core/compare/torchair_acc_cmp.py +764 -0
msprobe/core/compare/torchair_cmp_utils.py +338 -0
msprobe/core/compare/utils.py +140 -49
msprobe/core/config_check/__init__.py +12 -11
msprobe/core/config_check/checkers/__init__.py +12 -11
msprobe/core/config_check/checkers/base_checker.py +15 -14
msprobe/core/config_check/checkers/dataset_checker.py +13 -12
msprobe/core/config_check/checkers/env_args_checker.py +13 -12
msprobe/core/config_check/checkers/hyperparameter_checker.py +16 -15
msprobe/core/config_check/checkers/pip_checker.py +15 -15
msprobe/core/config_check/checkers/random_checker.py +13 -12
msprobe/core/config_check/checkers/weights_checker.py +14 -12
msprobe/core/config_check/ckpt_compare/ckpt_comparator.py +13 -17
msprobe/core/config_check/ckpt_compare/megatron_loader.py +13 -12
msprobe/core/config_check/ckpt_compare/metrics.py +12 -11
msprobe/core/config_check/config_check_cli.py +18 -17
msprobe/core/config_check/config_checker.py +16 -14
msprobe/core/config_check/resource/dependency.yaml +15 -12
msprobe/core/config_check/resource/env.yaml +12 -11
msprobe/core/config_check/utils/hyperparameter_parser.py +12 -11
msprobe/core/config_check/utils/utils.py +12 -11
msprobe/core/{data_dump → dump/api_dump}/api_registry.py +12 -11
msprobe/core/{common_config.py → dump/common_config.py} +13 -24
msprobe/core/dump/data_dump/data_collector.py +257 -0
msprobe/core/{data_dump → dump/data_dump}/data_processor/base.py +45 -36
msprobe/core/{data_dump → dump/data_dump}/data_processor/factory.py +33 -25
msprobe/core/{data_dump → dump/data_dump}/data_processor/mindspore_processor.py +37 -113
msprobe/core/{data_dump → dump/data_dump}/data_processor/pytorch_processor.py +364 -131
msprobe/core/{data_dump → dump/data_dump}/json_writer.py +24 -31
msprobe/core/{data_dump → dump/data_dump}/scope.py +12 -13
msprobe/core/{debugger → dump/debugger}/precision_debugger.py +15 -23
msprobe/core/dump/dump2db/db_utils.py +215 -0
msprobe/core/dump/dump2db/dump2db.py +409 -0
msprobe/core/{hook_manager.py → dump/hook_manager.py} +38 -87
msprobe/core/dump/kernel_dump/kernel_config.py +34 -0
msprobe/core/{service.py → dump/service.py} +43 -27
msprobe/core/install_deps/install_deps.py +51 -0
msprobe/core/monitor/anomaly_processor.py +13 -11
msprobe/core/monitor/csv2db.py +73 -93
msprobe/core/monitor/db_utils.py +140 -205
msprobe/core/monitor/utils.py +18 -17
msprobe/core/monitor_v2/__init__.py +20 -0
msprobe/core/monitor_v2/base.py +83 -0
msprobe/core/monitor_v2/cc.py +287 -0
msprobe/core/monitor_v2/factory.py +81 -0
msprobe/core/monitor_v2/module.py +201 -0
msprobe/core/monitor_v2/optimizer.py +245 -0
msprobe/core/monitor_v2/param.py +154 -0
msprobe/core/monitor_v2/trainer.py +326 -0
msprobe/core/monitor_v2/utils.py +122 -0
msprobe/core/monitor_v2/weight_grad.py +419 -0
msprobe/core/monitor_v2/writer.py +162 -0
msprobe/core/overflow_check/abnormal_scene.py +12 -11
msprobe/core/overflow_check/api_info.py +12 -11
msprobe/core/overflow_check/checker.py +12 -11
msprobe/core/overflow_check/filter.py +13 -11
msprobe/core/overflow_check/level.py +12 -11
msprobe/core/overflow_check/utils.py +12 -11
msprobe/core/single_save/single_comparator.py +12 -11
msprobe/core/single_save/single_saver.py +12 -11
msprobe/infer/__init__.py +16 -0
msprobe/infer/offline/__init__.py +16 -0
msprobe/infer/offline/compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/adapter_cli/args_adapter.py +46 -0
msprobe/infer/offline/compare/msquickcmp/atc/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/atc/atc_utils.py +98 -0
msprobe/infer/offline/compare/msquickcmp/cmp_process.py +328 -0
msprobe/infer/offline/compare/msquickcmp/common/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/common/args_check.py +112 -0
msprobe/infer/offline/compare/msquickcmp/common/convert.py +74 -0
msprobe/infer/offline/compare/msquickcmp/common/dump_data.py +121 -0
msprobe/infer/offline/compare/msquickcmp/common/dynamic_argument_bean.py +39 -0
msprobe/infer/offline/compare/msquickcmp/common/utils.py +669 -0
msprobe/infer/offline/compare/msquickcmp/config.ini +6 -0
msprobe/infer/offline/compare/msquickcmp/dump/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/dump/args_adapter.py +50 -0
msprobe/infer/offline/compare/msquickcmp/dump/dump_process.py +91 -0
msprobe/infer/offline/compare/msquickcmp/install_aclruntime_aisbench.sh +180 -0
msprobe/infer/offline/compare/msquickcmp/main.py +199 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/net_compare/net_compare.py +277 -0
msprobe/infer/offline/compare/msquickcmp/npu/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/npu/npu_dump_data.py +558 -0
msprobe/infer/offline/compare/msquickcmp/npu/om_parser.py +416 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/__init__.py +16 -0
msprobe/infer/offline/compare/msquickcmp/onnx_model/onnx_dump_data.py +374 -0
msprobe/infer/utils/__init__.py +15 -0
msprobe/infer/utils/acc_cmp.py +94 -0
msprobe/infer/utils/check/__init__.py +37 -0
msprobe/infer/utils/check/args_checker.py +35 -0
msprobe/infer/utils/check/checker.py +227 -0
msprobe/infer/utils/check/dict_checker.py +78 -0
msprobe/infer/utils/check/func_wrapper.py +96 -0
msprobe/infer/utils/check/list_checker.py +56 -0
msprobe/infer/utils/check/number_checker.py +64 -0
msprobe/infer/utils/check/obj_checker.py +41 -0
msprobe/infer/utils/check/path_checker.py +249 -0
msprobe/infer/utils/check/rule.py +126 -0
msprobe/infer/utils/check/string_checker.py +66 -0
msprobe/infer/utils/cmp_algorithm.py +261 -0
msprobe/infer/utils/constants.py +112 -0
msprobe/infer/utils/file_open_check.py +337 -0
msprobe/infer/utils/util.py +177 -0
msprobe/mindspore/__init__.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_accuracy_checker.py +14 -13
msprobe/mindspore/api_accuracy_checker/api_info.py +12 -11
msprobe/mindspore/api_accuracy_checker/api_runner.py +12 -11
msprobe/mindspore/api_accuracy_checker/base_compare_algorithm.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/flash_attention_score.py +12 -11
msprobe/mindspore/api_accuracy_checker/bench_functions/fusion_operator.py +12 -11
msprobe/mindspore/api_accuracy_checker/checker_support_api.yaml +12 -11
msprobe/mindspore/api_accuracy_checker/cmd_parser.py +15 -14
msprobe/mindspore/api_accuracy_checker/compute_element.py +12 -11
msprobe/mindspore/api_accuracy_checker/data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/main.py +12 -11
msprobe/mindspore/api_accuracy_checker/multi_api_accuracy_checker.py +14 -12
msprobe/mindspore/api_accuracy_checker/multi_data_manager.py +13 -11
msprobe/mindspore/api_accuracy_checker/torch_mindtorch_importer.py +12 -11
msprobe/mindspore/api_accuracy_checker/type_mapping.py +12 -11
msprobe/mindspore/api_accuracy_checker/utils.py +12 -11
msprobe/mindspore/common/const.py +15 -74
msprobe/mindspore/common/log.py +12 -11
msprobe/mindspore/common/utils.py +30 -15
msprobe/mindspore/compare/common_dir_compare.py +21 -23
msprobe/mindspore/compare/distributed_compare.py +18 -16
msprobe/mindspore/compare/ms_compare.py +14 -14
msprobe/mindspore/compare/ms_graph_compare.py +26 -20
msprobe/mindspore/compare/utils.py +14 -12
msprobe/mindspore/{cell_processor.py → dump/cell_processor.py} +15 -14
msprobe/mindspore/{debugger → dump/debugger}/debugger_config.py +12 -30
msprobe/mindspore/{debugger → dump/debugger}/precision_debugger.py +43 -45
msprobe/mindspore/dump/{cell_dump_process.py → dump_processor/cell_dump_process.py} +31 -17
msprobe/mindspore/dump/{cell_dump_with_insert_gradient.py → dump_processor/cell_dump_with_insert_gradient.py} +18 -14
msprobe/mindspore/dump/{dump_tool_factory.py → dump_processor/dump_tool_factory.py} +16 -15
msprobe/mindspore/dump/{graph_mode_cell_dump.py → dump_processor/graph_mode_cell_dump.py} +16 -15
msprobe/mindspore/dump/{graph_tensor_dump.py → dump_processor/graph_tensor_dump.py} +134 -133
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/api_register.py +15 -14
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/hook_cell.py +12 -11
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/ms_hook_manager.py +47 -20
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/primitive_hooks.py +14 -13
msprobe/mindspore/dump/{hook_cell → dump_processor/hook_cell}/support_wrap_ops.yaml +13 -11
msprobe/mindspore/dump/{jit_dump.py → dump_processor/jit_dump.py} +14 -13
msprobe/mindspore/dump/{kernel_graph_dump.py → dump_processor/kernel_graph_dump.py} +13 -12
msprobe/mindspore/dump/{kernel_kbyk_dump.py → dump_processor/kernel_kbyk_dump.py} +13 -12
msprobe/mindspore/{exception_dump → dump/exception_dump}/exception_dump_tool_factory.py +14 -13
msprobe/mindspore/{exception_dump → dump/exception_dump}/kernel_graph_exception_dump.py +13 -12
msprobe/mindspore/{mindspore_service.py → dump/mindspore_service.py} +18 -17
msprobe/mindspore/dump/mindtorch/__init__.py +19 -0
msprobe/mindspore/dump/ms_config.py +105 -0
msprobe/mindspore/{overflow_check → dump/overflow_check}/kernel_graph_overflow_check.py +13 -12
msprobe/mindspore/{overflow_check → dump/overflow_check}/overflow_check_tool_factory.py +14 -13
msprobe/mindspore/dump/task_handler_factory.py +43 -0
msprobe/mindspore/monitor/common_func.py +12 -11
msprobe/mindspore/monitor/data_writers.py +12 -11
msprobe/mindspore/monitor/distributed/wrap_distributed.py +93 -39
msprobe/mindspore/monitor/features.py +12 -11
msprobe/mindspore/monitor/module_hook.py +19 -22
msprobe/mindspore/monitor/optimizer_collect.py +29 -25
msprobe/mindspore/monitor/utils.py +13 -11
msprobe/msaccucmp/advisor/__init__.py +16 -0
msprobe/msaccucmp/advisor/advisor_const.py +65 -0
msprobe/msaccucmp/advisor/advisor_result.py +73 -0
msprobe/msaccucmp/advisor/compare_advisor.py +99 -0
msprobe/msaccucmp/advisor/input_advisor.py +66 -0
msprobe/msaccucmp/advisor/node_advisor.py +68 -0
msprobe/msaccucmp/advisor/overflow_advisor.py +58 -0
msprobe/msaccucmp/algorithm_manager/__init__.py +16 -0
msprobe/msaccucmp/algorithm_manager/algorithm_manager.py +464 -0
msprobe/msaccucmp/algorithm_manager/algorithm_parameter.py +42 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_AccumulatedRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_CosineSimilarity.py +58 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_KullbackLeiblerDivergence.py +84 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MaxRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanAbsoluteError.py +41 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_MeanRelativeError.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RelativeEuclideanDistance.py +46 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_RootMeanSquareError.py +40 -0
msprobe/msaccucmp/algorithm_manager/builtin_algorithm/alg_StandardDeviation.py +47 -0
msprobe/msaccucmp/cmp_utils/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/common.py +113 -0
msprobe/msaccucmp/cmp_utils/constant/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/constant/compare_error.py +81 -0
msprobe/msaccucmp/cmp_utils/constant/const_manager.py +530 -0
msprobe/msaccucmp/cmp_utils/file_utils.py +497 -0
msprobe/msaccucmp/cmp_utils/log.py +257 -0
msprobe/msaccucmp/cmp_utils/multi_process/__init__.py +16 -0
msprobe/msaccucmp/cmp_utils/multi_process/multi_convert_process.py +140 -0
msprobe/msaccucmp/cmp_utils/multi_process/progress.py +78 -0
msprobe/msaccucmp/cmp_utils/path_check.py +274 -0
msprobe/msaccucmp/cmp_utils/reg_manager.py +98 -0
msprobe/msaccucmp/cmp_utils/tlv_parse.py +279 -0
msprobe/msaccucmp/cmp_utils/utils.py +356 -0
msprobe/msaccucmp/cmp_utils/utils_type.py +63 -0
msprobe/msaccucmp/compare_vector.py +48 -0
msprobe/msaccucmp/conversion/__init__.py +16 -0
msprobe/msaccucmp/conversion/data_conversion.py +277 -0
msprobe/msaccucmp/conversion/dtype_conversion.py +99 -0
msprobe/msaccucmp/conversion/shape_format_conversion.py +477 -0
msprobe/msaccucmp/conversion/tensor_conversion.py +369 -0
msprobe/msaccucmp/dump_data_conversion.py +46 -0
msprobe/msaccucmp/dump_parse/__init__.py +16 -0
msprobe/msaccucmp/dump_parse/big_dump_data.py +317 -0
msprobe/msaccucmp/dump_parse/dump.py +423 -0
msprobe/msaccucmp/dump_parse/dump_data_object.py +322 -0
msprobe/msaccucmp/dump_parse/dump_data_parser.py +436 -0
msprobe/msaccucmp/dump_parse/dump_utils.py +246 -0
msprobe/msaccucmp/dump_parse/ffts_parser.py +137 -0
msprobe/msaccucmp/dump_parse/mapping.py +62 -0
msprobe/msaccucmp/dump_parse/nano_dump_data.py +392 -0
msprobe/msaccucmp/dump_parse/proto_dump_data.py +308 -0
msprobe/msaccucmp/dump_parser.py +90 -0
msprobe/msaccucmp/format_manager/__init__.py +16 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NCHW.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_ND.py +52 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_NZ_to_NHWC.py +53 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_HWCN.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_FRACTAL_Z_to_NCHW.py +47 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_FRACTAL_Z.py +89 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_HWCN_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_HWCN.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NCHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NC1HWC0_to_NHWC.py +43 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NCHW_to_NHWC.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_NCDHW.py +48 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NDC1HWC0_to_ND.py +44 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_FRACTAL_Z.py +87 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_HWCN.py +37 -0
msprobe/msaccucmp/format_manager/builtin_format_convert/convert_NHWC_to_NCHW.py +37 -0
msprobe/msaccucmp/format_manager/format_manager.py +307 -0
msprobe/msaccucmp/inplace_layer_process.py +186 -0
msprobe/msaccucmp/msaccucmp.py +532 -0
msprobe/msaccucmp/mscmp_advisor.py +128 -0
msprobe/msaccucmp/overflow/__init__.py +16 -0
msprobe/msaccucmp/overflow/overflow_analyse.py +305 -0
msprobe/msaccucmp/overflow/overflow_detection.py +143 -0
msprobe/msaccucmp/pytorch_cmp/__init__.py +16 -0
msprobe/msaccucmp/pytorch_cmp/compare_pytorch.py +389 -0
msprobe/msaccucmp/pytorch_cmp/hdf5_parser.py +377 -0
msprobe/msaccucmp/pytorch_cmp/pytorch_dump_data.py +461 -0
msprobe/msaccucmp/shape_conversion.py +41 -0
msprobe/msaccucmp/vector_cmp/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/batch_compare.py +197 -0
msprobe/msaccucmp/vector_cmp/compare_detail/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/compare_detail/compare_detail.py +245 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail.py +182 -0
msprobe/msaccucmp/vector_cmp/compare_detail/detail_writer.py +580 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_fusion_op.py +588 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_npu_vs_npu.py +339 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_result.py +326 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/compare_rule.py +156 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_op.py +204 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/fusion_rule_parser.py +635 -0
msprobe/msaccucmp/vector_cmp/fusion_manager/quant_filter.py +187 -0
msprobe/msaccucmp/vector_cmp/range_manager/__init__.py +16 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_manager.py +100 -0
msprobe/msaccucmp/vector_cmp/range_manager/range_mode.py +94 -0
msprobe/msaccucmp/vector_cmp/range_manager/select_mode.py +86 -0
msprobe/msaccucmp/vector_cmp/vector_comparison.py +535 -0
msprobe/msprobe.py +101 -130
msprobe/overflow_check/__init__.py +15 -0
msprobe/{nan_analyze → overflow_check}/analyzer.py +38 -27
msprobe/{nan_analyze → overflow_check}/graph.py +28 -27
msprobe/{nan_analyze → overflow_check}/utils.py +15 -14
msprobe/pytorch/__init__.py +20 -14
msprobe/pytorch/aclgraph_dump/__init__.py +45 -0
msprobe/pytorch/aclgraph_dump/_meta.py +26 -0
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut.py → acc_check/acc_check.py} +50 -45
msprobe/pytorch/api_accuracy_checker/{run_ut/run_ut_utils.py → acc_check/acc_check_utils.py} +201 -30
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/data_generate.py +56 -16
msprobe/pytorch/api_accuracy_checker/{run_ut/multi_run_ut.py → acc_check/multi_acc_check.py} +32 -47
msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/run_overflow_check.py +19 -18
msprobe/pytorch/api_accuracy_checker/common/config.py +22 -20
msprobe/pytorch/api_accuracy_checker/common/utils.py +72 -13
msprobe/pytorch/api_accuracy_checker/compare/algorithm.py +41 -11
msprobe/pytorch/api_accuracy_checker/compare/api_precision_compare.py +23 -14
msprobe/pytorch/api_accuracy_checker/compare/compare.py +45 -32
msprobe/pytorch/api_accuracy_checker/compare/compare_column.py +12 -11
msprobe/pytorch/api_accuracy_checker/compare/compare_input.py +14 -12
msprobe/pytorch/api_accuracy_checker/compare/compare_utils.py +14 -12
msprobe/pytorch/api_accuracy_checker/precision_standard/absolute_threshold.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/accumulative_error_compare.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/base_standard.py +21 -19
msprobe/pytorch/api_accuracy_checker/precision_standard/benchmark_compare.py +14 -13
msprobe/pytorch/api_accuracy_checker/precision_standard/binary_consistency.py +12 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_config.py +60 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/standard_register.py +27 -16
msprobe/pytorch/api_accuracy_checker/precision_standard/thousandth_standard.py +13 -11
msprobe/pytorch/api_accuracy_checker/precision_standard/ulp_compare.py +39 -18
msprobe/pytorch/bench_functions/__init__.py +12 -11
msprobe/pytorch/bench_functions/apply_adam.py +12 -11
msprobe/pytorch/bench_functions/apply_adam_w.py +12 -11
msprobe/pytorch/bench_functions/confusion_transpose.py +12 -11
msprobe/pytorch/bench_functions/fast_gelu.py +12 -11
msprobe/pytorch/bench_functions/group_norm_silu.py +12 -11
msprobe/pytorch/bench_functions/layer_norm_eval.py +12 -11
msprobe/pytorch/bench_functions/linear.py +12 -11
msprobe/pytorch/bench_functions/matmul_backward.py +12 -11
msprobe/pytorch/bench_functions/mish.py +12 -11
msprobe/pytorch/bench_functions/moe_gating_top_k_softmax.py +12 -11
msprobe/pytorch/bench_functions/npu_fusion_attention.py +12 -11
msprobe/pytorch/bench_functions/rms_norm.py +12 -11
msprobe/pytorch/bench_functions/rotary_mul.py +12 -11
msprobe/pytorch/bench_functions/scaled_mask_softmax.py +12 -11
msprobe/pytorch/bench_functions/sort_v2.py +12 -11
msprobe/pytorch/bench_functions/swiglu.py +12 -11
msprobe/pytorch/common/__init__.py +12 -11
msprobe/pytorch/common/log.py +12 -11
msprobe/pytorch/common/parse_json.py +12 -11
msprobe/pytorch/common/utils.py +52 -19
msprobe/pytorch/compare/distributed_compare.py +13 -13
msprobe/pytorch/compare/match.py +12 -11
msprobe/pytorch/compare/pt_compare.py +14 -20
msprobe/pytorch/compare/pt_diff_analyze.py +12 -11
msprobe/pytorch/compare/utils.py +12 -11
msprobe/pytorch/{hook_module → dump/api_dump}/api_register.py +18 -16
msprobe/pytorch/{hook_module → dump/api_dump}/hook_module.py +14 -13
msprobe/pytorch/{hook_module → dump/api_dump}/pt_hook_manager.py +68 -23
msprobe/pytorch/{hook_module → dump/api_dump}/register_optimizer_hook.py +13 -11
msprobe/pytorch/{hook_module → dump/api_dump}/script_wrapper.py +17 -14
msprobe/pytorch/{hook_module → dump/api_dump}/utils.py +12 -11
msprobe/pytorch/{debugger → dump/debugger}/debugger_config.py +23 -38
msprobe/pytorch/dump/debugger/precision_debugger.py +130 -0
msprobe/pytorch/{function_factory.py → dump/function_factory.py} +12 -11
msprobe/pytorch/dump/module_dump/hook_wrapper.py +17 -13
msprobe/pytorch/dump/module_dump/module_dump.py +16 -15
msprobe/pytorch/dump/module_dump/{module_processer.py → module_processor.py} +54 -42
msprobe/pytorch/dump/pt_config.py +128 -0
msprobe/pytorch/{pytorch_service.py → dump/pytorch_service.py} +22 -21
msprobe/pytorch/monitor/csv2tb.py +13 -11
msprobe/pytorch/monitor/data_writers.py +13 -11
msprobe/pytorch/monitor/distributed/wrap_distributed.py +13 -11
msprobe/pytorch/monitor/features.py +12 -11
msprobe/pytorch/monitor/module_hook.py +67 -59
msprobe/pytorch/monitor/module_metric.py +13 -11
msprobe/pytorch/monitor/optimizer_collect.py +37 -35
msprobe/pytorch/monitor/utils.py +13 -11
msprobe/pytorch/monitor/visualizer.py +12 -11
msprobe/pytorch/torchair_dump/__init__.py +17 -0
msprobe/pytorch/torchair_dump/torchair_dump.py +114 -0
msprobe/scripts/atb/config_example.json +10 -0
msprobe/scripts/atb/load_atb_probe.sh +101 -0
msprobe/scripts/atb/unload_atb_probe.sh +27 -0
msprobe/scripts/build_msaccucmp.sh +186 -0
msprobe/scripts/conf/help.info +6 -0
msprobe/scripts/conf/version.info +3 -0
msprobe/scripts/run_script/common.sh +538 -0
msprobe/scripts/run_script/main_msaccucmp.sh +232 -0
msprobe/visualization/__init__.py +12 -11
msprobe/visualization/builder/__init__.py +12 -11
msprobe/visualization/builder/graph_builder.py +45 -30
msprobe/visualization/builder/graph_merger.py +53 -32
msprobe/visualization/builder/msprobe_adapter.py +34 -44
msprobe/visualization/compare/__init__.py +12 -11
msprobe/visualization/compare/graph_comparator.py +63 -51
msprobe/visualization/compare/mode_adapter.py +28 -113
msprobe/visualization/db_utils.py +133 -22
msprobe/visualization/graph/__init__.py +12 -11
msprobe/visualization/graph/base_node.py +15 -27
msprobe/visualization/graph/distributed_analyzer.py +97 -40
msprobe/visualization/graph/graph.py +14 -16
msprobe/visualization/graph/node_colors.py +34 -31
msprobe/visualization/graph/node_op.py +12 -11
msprobe/visualization/graph_service.py +580 -205
msprobe/visualization/utils.py +278 -31
tb_graph_ascend/secure_build.py +175 -0
tb_graph_ascend/server/__init__.py +15 -0
tb_graph_ascend/server/app/__init__.py +15 -0
tb_graph_ascend/server/app/model/__init__.py +15 -0
tb_graph_ascend/server/app/model/hierarchy.py +348 -0
tb_graph_ascend/server/app/model/layout_hierarchy_model.py +69 -0
tb_graph_ascend/server/app/model/match_nodes_model.py +573 -0
tb_graph_ascend/server/app/repositories/__init__.py +15 -0
tb_graph_ascend/server/app/repositories/graph_repo_base.py +32 -0
tb_graph_ascend/server/app/repositories/graph_repo_db.py +879 -0
tb_graph_ascend/server/app/repositories/graph_repo_vis.py +83 -0
tb_graph_ascend/server/app/service/__init__.py +18 -0
tb_graph_ascend/server/app/service/graph_service_base.py +158 -0
tb_graph_ascend/server/app/service/graph_service_db.py +438 -0
tb_graph_ascend/server/app/service/graph_service_factory.py +54 -0
tb_graph_ascend/server/app/service/graph_service_vis.py +480 -0
tb_graph_ascend/server/app/utils/__init__.py +15 -0
tb_graph_ascend/server/app/utils/constant.py +80 -0
tb_graph_ascend/server/app/utils/file_check_wrapper.py +46 -0
tb_graph_ascend/server/app/utils/global_state.py +95 -0
tb_graph_ascend/server/app/utils/graph_utils.py +661 -0
tb_graph_ascend/server/app/utils/i18n.py +153 -0
tb_graph_ascend/server/app/utils/request_method.py +46 -0
tb_graph_ascend/server/app/views/__init__.py +15 -0
tb_graph_ascend/server/app/views/graph_views.py +304 -0
tb_graph_ascend/server/plugin.py +108 -0
tb_graph_ascend/server/static/index.html +9250 -0
tb_graph_ascend/server/static/index.js +21 -0
tb_graph_ascend/setup.py +57 -0
mindstudio_probe-8.3.3.dist-info/LICENSE +0 -201
mindstudio_probe-8.3.3.dist-info/RECORD +0 -491
mindstudio_probe-8.3.3.dist-info/entry_points.txt +0 -2
mindstudio_probe-8.3.3.dist-info/top_level.txt +0 -1
msprobe/CMakeLists.txt +0 -5
msprobe/README.md +0 -203
msprobe/core/advisor/advisor.py +0 -129
msprobe/core/advisor/advisor_const.py +0 -58
msprobe/core/advisor/advisor_result.py +0 -58
msprobe/core/compare/find_first/data_processor.py +0 -35
msprobe/core/compare/highlight.py +0 -390
msprobe/core/data_dump/data_collector.py +0 -356
msprobe/core/grad_probe/constant.py +0 -90
msprobe/core/grad_probe/grad_compare.py +0 -187
msprobe/core/grad_probe/utils.py +0 -105
msprobe/core/kernel_dump/kernel_config.py +0 -33
msprobe/docs/01.installation.md +0 -250
msprobe/docs/02.config_introduction.md +0 -221
msprobe/docs/03.config_examples.md +0 -281
msprobe/docs/04.kernel_dump_PyTorch.md +0 -73
msprobe/docs/05.data_dump_PyTorch.md +0 -518
msprobe/docs/06.data_dump_MindSpore.md +0 -618
msprobe/docs/07.accuracy_checker_PyTorch.md +0 -310
msprobe/docs/09.accuracy_checker_MindSpore.md +0 -120
msprobe/docs/10.accuracy_compare_PyTorch.md +0 -637
msprobe/docs/11.accuracy_compare_MindSpore.md +0 -769
msprobe/docs/12.overflow_check_PyTorch.md +0 -82
msprobe/docs/13.overflow_check_MindSpore.md +0 -33
msprobe/docs/14.data_parse_PyTorch.md +0 -282
msprobe/docs/15.free_benchmarking_PyTorch.md +0 -169
msprobe/docs/16.free_benchmarking_MindSpore.md +0 -159
msprobe/docs/17.grad_probe.md +0 -205
msprobe/docs/18.online_dispatch.md +0 -89
msprobe/docs/19.monitor.md +0 -753
msprobe/docs/20.monitor_performance_baseline.md +0 -52
msprobe/docs/21.visualization_PyTorch.md +0 -519
msprobe/docs/22.visualization_MindSpore.md +0 -515
msprobe/docs/23.generate_operator_PyTorch.md +0 -107
msprobe/docs/24.code_mapping_Mindspore.md +0 -29
msprobe/docs/25.tool_function_introduction.md +0 -29
msprobe/docs/26.data_dump_PyTorch_baseline.md +0 -48
msprobe/docs/27.dump_json_instruction.md +0 -795
msprobe/docs/28.debugger_save_instruction.md +0 -288
msprobe/docs/28.kernel_dump_MindSpore.md +0 -69
msprobe/docs/29.data_dump_MSAdapter.md +0 -235
msprobe/docs/30.overflow_check_MSAdapter.md +0 -31
msprobe/docs/31.config_check.md +0 -107
msprobe/docs/32.ckpt_compare.md +0 -69
msprobe/docs/33.generate_operator_MindSpore.md +0 -181
msprobe/docs/34.RL_collect.md +0 -101
msprobe/docs/35.nan_analyze.md +0 -73
msprobe/docs/36.calculation_result_change.md +0 -75
msprobe/docs/FAQ.md +0 -232
msprobe/docs/S02.report_free_benchmarking_validation_performance_baseline.md +0 -146
msprobe/docs/accuracy_checker_MindSpore/accuracy_checker_MindSpore_baseline.md +0 -14
msprobe/docs/data_dump_MindSpore/data_dump_MindSpore_baseline.md +0 -33
msprobe/docs/data_dump_MindSpore/dynamic_graph_quick_start_example.md +0 -217
msprobe/docs/img/BLOOM-7B_1.png +0 -0
msprobe/docs/img/BLOOM-7B_2.png +0 -0
msprobe/docs/img/BLOOM-7B_3.png +0 -0
msprobe/docs/img/BLOOM-7B_4.png +0 -0
msprobe/docs/img/GPT-3_1.png +0 -0
msprobe/docs/img/GPT-3_2.png +0 -0
msprobe/docs/img/GPT-3_3.png +0 -0
msprobe/docs/img/GPT-3_4.png +0 -0
msprobe/docs/img/GPT-3_5.png +0 -0
msprobe/docs/img/GPT-3_6.png +0 -0
msprobe/docs/img/GPT-3_7.png +0 -0
msprobe/docs/img/GPT-3_8.png +0 -0
msprobe/docs/img/YOLOV5S_1.png +0 -0
msprobe/docs/img/YOLOV5S_2.png +0 -0
msprobe/docs/img/accuracy_checking_details.png +0 -0
msprobe/docs/img/accuracy_checking_result.png +0 -0
msprobe/docs/img/api_precision_compare_details.png +0 -0
msprobe/docs/img/api_precision_compare_result.png +0 -0
msprobe/docs/img/auto_analyze_log.png +0 -0
msprobe/docs/img/compare_result.png +0 -0
msprobe/docs/img/compare_result_pkl.png +0 -0
msprobe/docs/img/compare_result_pkl_md5.png.png +0 -0
msprobe/docs/img/cpu_info.png +0 -0
msprobe/docs/img/free_benchmark.png +0 -0
msprobe/docs/img/free_benchmark_framework.png +0 -0
msprobe/docs/img/grad_probe_image-1.png +0 -0
msprobe/docs/img/grad_probe_image-2.png +0 -0
msprobe/docs/img/grad_probe_image-3.png +0 -0
msprobe/docs/img/grad_probe_image-4.png +0 -0
msprobe/docs/img/grad_probe_image.png +0 -0
msprobe/docs/img/merge_result.png +0 -0
msprobe/docs/img/module_compare.png +0 -0
msprobe/docs/img/monitor/cpu_info.png +0 -0
msprobe/docs/img/monitor/step_count_per_record.png +0 -0
msprobe/docs/img/ms_dump.png +0 -0
msprobe/docs/img/ms_layer.png +0 -0
msprobe/docs/img/pt_dump.png +0 -0
msprobe/docs/img/save_compare_result_sample.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_ms.png +0 -0
msprobe/docs/img/visualization/fuzzy_match_pt.png +0 -0
msprobe/docs/img/visualization/proxy.png +0 -0
msprobe/docs/img/visualization/tensorboard_1.png +0 -0
msprobe/docs/img/visualization/tensorboard_2.png +0 -0
msprobe/docs/img/visualization/vis_browser_1.png +0 -0
msprobe/docs/img/visualization/vis_browser_2.png +0 -0
msprobe/docs/img/visualization/vis_match_info.png +0 -0
msprobe/docs/img/visualization/vis_precision_info.png +0 -0
msprobe/docs/img/visualization/vis_search_info.png +0 -0
msprobe/docs/img/visualization/vis_show_info.png +0 -0
msprobe/docs/img/visualization/vis_showcase.png +0 -0
msprobe/docs/img/visualization/vis_unmatch_info.png +0 -0
msprobe/docs/visualization/GPTModel.png +0 -0
msprobe/docs/visualization/ParallelMLP.png +0 -0
msprobe/docs/visualization/layer_mapping_example.md +0 -132
msprobe/docs/visualization/mapping.png +0 -0
msprobe/docs/visualization/mapping1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/3.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/4.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/5.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/6.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/7.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory-qwen25vl.txt +0 -59
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/llamafactory2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed-mm-qwen25vl.txt +0 -80
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed1.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactoary_img/mindspeed2.png +0 -0
msprobe/docs/visualization/mindspeed_llamafactory_mapping.md +0 -330
msprobe/docs/visualization/module_name.png +0 -0
msprobe/docs/visualization/module_name1.png +0 -0
msprobe/docs/visualization/no_mapping.png +0 -0
msprobe/docs/visualization/no_mapping1.png +0 -0
msprobe/docs/visualization/no_mapping_analyze.png +0 -0
msprobe/docs/visualization/top_layer.png +0 -0
msprobe/mindspore/api_accuracy_checker/generate_op_script/op_generator.py +0 -460
msprobe/mindspore/api_accuracy_checker/generate_op_script/operator_replication.template +0 -2081
msprobe/mindspore/code_mapping/bind.py +0 -283
msprobe/mindspore/code_mapping/cmd_parser.py +0 -40
msprobe/mindspore/code_mapping/graph.py +0 -49
msprobe/mindspore/code_mapping/graph_parser.py +0 -211
msprobe/mindspore/code_mapping/main.py +0 -24
msprobe/mindspore/code_mapping/processor.py +0 -34
msprobe/mindspore/dym_loader/hook_dynamic_loader.cpp +0 -111
msprobe/mindspore/dym_loader/hook_dynamic_loader.h +0 -52
msprobe/mindspore/free_benchmark/api_pynative_self_check.py +0 -257
msprobe/mindspore/free_benchmark/common/config.py +0 -27
msprobe/mindspore/free_benchmark/common/handler_params.py +0 -31
msprobe/mindspore/free_benchmark/common/utils.py +0 -100
msprobe/mindspore/free_benchmark/data/support_wrap_ops.yaml +0 -638
msprobe/mindspore/free_benchmark/handler/base_handler.py +0 -105
msprobe/mindspore/free_benchmark/handler/check_handler.py +0 -55
msprobe/mindspore/free_benchmark/handler/fix_handler.py +0 -51
msprobe/mindspore/free_benchmark/handler/handler_factory.py +0 -36
msprobe/mindspore/free_benchmark/perturbation/add_noise.py +0 -82
msprobe/mindspore/free_benchmark/perturbation/base_perturbation.py +0 -45
msprobe/mindspore/free_benchmark/perturbation/bit_noise.py +0 -78
msprobe/mindspore/free_benchmark/perturbation/exchange_value.py +0 -77
msprobe/mindspore/free_benchmark/perturbation/improve_precision.py +0 -56
msprobe/mindspore/free_benchmark/perturbation/no_change.py +0 -27
msprobe/mindspore/free_benchmark/perturbation/perturbation_factory.py +0 -46
msprobe/mindspore/free_benchmark/self_check_tool_factory.py +0 -51
msprobe/mindspore/grad_probe/global_context.py +0 -127
msprobe/mindspore/grad_probe/grad_analyzer.py +0 -260
msprobe/mindspore/grad_probe/grad_monitor.py +0 -42
msprobe/mindspore/grad_probe/grad_stat_csv.py +0 -161
msprobe/mindspore/grad_probe/hook.py +0 -115
msprobe/mindspore/grad_probe/utils.py +0 -43
msprobe/mindspore/mindtorch/__init__.py +0 -18
msprobe/mindspore/ms_config.py +0 -153
msprobe/mindspore/task_handler_factory.py +0 -44
msprobe/nan_analyze/__init__.py +0 -14
msprobe/pytorch/api_accuracy_checker/generate_op_script/config_op.json +0 -9
msprobe/pytorch/api_accuracy_checker/generate_op_script/op_generator.py +0 -480
msprobe/pytorch/api_accuracy_checker/generate_op_script/operator_replication.template +0 -567
msprobe/pytorch/debugger/precision_debugger.py +0 -181
msprobe/pytorch/free_benchmark/__init__.py +0 -23
msprobe/pytorch/free_benchmark/common/constant.py +0 -85
msprobe/pytorch/free_benchmark/common/counter.py +0 -87
msprobe/pytorch/free_benchmark/common/enums.py +0 -80
msprobe/pytorch/free_benchmark/common/params.py +0 -152
msprobe/pytorch/free_benchmark/common/utils.py +0 -143
msprobe/pytorch/free_benchmark/compare/grad_saver.py +0 -215
msprobe/pytorch/free_benchmark/compare/single_benchmark.py +0 -121
msprobe/pytorch/free_benchmark/main.py +0 -123
msprobe/pytorch/free_benchmark/perturbed_layers/base_layer.py +0 -28
msprobe/pytorch/free_benchmark/perturbed_layers/layer_factory.py +0 -56
msprobe/pytorch/free_benchmark/perturbed_layers/npu/add_noise.py +0 -107
msprobe/pytorch/free_benchmark/perturbed_layers/npu/bit_noise.py +0 -121
msprobe/pytorch/free_benchmark/perturbed_layers/npu/change_value.py +0 -89
msprobe/pytorch/free_benchmark/perturbed_layers/npu/improve_precision.py +0 -87
msprobe/pytorch/free_benchmark/perturbed_layers/npu/no_change.py +0 -43
msprobe/pytorch/free_benchmark/perturbed_layers/npu/npu_base_layser.py +0 -60
msprobe/pytorch/free_benchmark/perturbed_layers/run_cpu.py +0 -34
msprobe/pytorch/free_benchmark/result_handlers/base_handler.py +0 -252
msprobe/pytorch/free_benchmark/result_handlers/check_handler.py +0 -54
msprobe/pytorch/free_benchmark/result_handlers/fix_handler.py +0 -40
msprobe/pytorch/free_benchmark/result_handlers/handler_factory.py +0 -45
msprobe/pytorch/free_benchmark/result_handlers/preheat_handler.py +0 -181
msprobe/pytorch/grad_probe/__init__.py +0 -0
msprobe/pytorch/grad_probe/grad_monitor.py +0 -108
msprobe/pytorch/grad_probe/grad_stat_csv.py +0 -160
msprobe/pytorch/hook_module/__init__.py +0 -16
msprobe/pytorch/hook_module/wrap_aten.py +0 -111
msprobe/pytorch/online_dispatch/__init__.py +0 -19
msprobe/pytorch/online_dispatch/compare.py +0 -224
msprobe/pytorch/online_dispatch/dispatch.py +0 -332
msprobe/pytorch/online_dispatch/dump_compare.py +0 -179
msprobe/pytorch/online_dispatch/single_compare.py +0 -412
msprobe/pytorch/online_dispatch/torch_ops_config.yaml +0 -58
msprobe/pytorch/online_dispatch/utils.py +0 -158
msprobe/pytorch/parse_tool/__init__.py +0 -0
msprobe/pytorch/parse_tool/cli.py +0 -31
msprobe/pytorch/parse_tool/lib/__init__.py +0 -0
msprobe/pytorch/parse_tool/lib/compare.py +0 -253
msprobe/pytorch/parse_tool/lib/config.py +0 -50
msprobe/pytorch/parse_tool/lib/file_desc.py +0 -45
msprobe/pytorch/parse_tool/lib/interactive_cli.py +0 -97
msprobe/pytorch/parse_tool/lib/parse_exception.py +0 -54
msprobe/pytorch/parse_tool/lib/parse_tool.py +0 -161
msprobe/pytorch/parse_tool/lib/utils.py +0 -299
msprobe/pytorch/parse_tool/lib/visualization.py +0 -85
msprobe/pytorch/pt_config.py +0 -299
/msprobe/core/{grad_probe → dump}/__init__.py +0 -0
/msprobe/{mindspore/code_mapping → core/dump/api_dump}/__init__.py +0 -0
/msprobe/{mindspore/debugger → core/dump/data_dump}/__init__.py +0 -0
/msprobe/{mindspore/exception_dump → core/dump/data_dump/data_processor}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark → core/dump/debugger}/__init__.py +0 -0
/msprobe/{mindspore/free_benchmark/common → core/dump/kernel_dump}/__init__.py +0 -0
/msprobe/mindspore/{free_benchmark/handler → dump/debugger}/__init__.py +0 -0
/msprobe/mindspore/{grad_probe → dump/dump_processor}/__init__.py +0 -0
/msprobe/mindspore/{overflow_check → dump/exception_dump}/__init__.py +0 -0
/msprobe/mindspore/{mindtorch → dump/mindtorch}/mindtorch_adaptor.py +0 -0
/msprobe/{pytorch/api_accuracy_checker/run_ut → mindspore/dump/overflow_check}/__init__.py +0 -0
/msprobe/{pytorch/debugger → mindspore/monitor}/__init__.py +0 -0
/msprobe/{pytorch/free_benchmark/common → msaccucmp}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/.keep +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers → api_accuracy_checker/acc_check}/__init__.py +0 -0
/msprobe/pytorch/api_accuracy_checker/{run_ut → acc_check}/torch_ut_setting.json +0 -0
/msprobe/pytorch/{free_benchmark/perturbed_layers/npu → dump/api_dump}/__init__.py +0 -0
/msprobe/pytorch/{hook_module → dump/api_dump}/support_wrap_ops.yaml +0 -0
/msprobe/pytorch/{free_benchmark/result_handlers → dump/debugger}/__init__.py +0 -0

msprobe/core/common/megatron_utils.py CHANGED Viewed

@@ -1,19 +1,32 @@
-# Copyright (c) 2024-2025, Huawei Technologies Co., Ltd.
-# All rights reserved.
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
 #
-# Licensed under the Apache License, Version 2.0  (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
 #
-# http://www.apache.org/licenses/LICENSE-2.0
+#          http://license.coscl.org.cn/MulanPSL2
 #
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
+import os
+from tqdm import tqdm
+from dataclasses import dataclass
 from functools import wraps
+from typing import Any, Dict, List, Tuple
+import matplotlib.pyplot as plt
+import numpy as np
+from matplotlib.patches import Rectangle
+from msprobe.core.common.utils import is_int
+from msprobe.core.common.file_utils import create_directory, remove_path
+from msprobe.core.common.log import logger
+from msprobe.core.common.parallel_state import RankGroupGenerator
 class MegatronStepInfo:
@@ -57,3 +70,545 @@ def get_micro_step():
 def is_megatron():
     return MegatronStepInfo.is_megatron
+@dataclass
+class VisualizationConfig:
+    """Sizing limits and font sizes used when rendering the parallelism figure."""
+    # Figure height contributed by each TP group (one row per group).
+    height_per_tp: float = 0.5
+    # Figure width contributed by each virtual pipeline stage (one column per stage).
+    width_per_stage: float = 2
+    # Lower / upper clamps applied to the computed figure width.
+    min_width: int = 6
+    max_width: int = 60
+    # Lower / upper clamps applied to the computed figure height.
+    min_height: int = 4
+    max_height: int = 100
+    # Extra width added to the figure to leave room for the legend.
+    legend_width: int = 5
+    # Font sizes keyed by 'title', 'axis', 'tick', 'legend' and 'text'; None selects the defaults.
+    font_sizes: Dict[str, int] = None
+    def __post_init__(self):
+        """Install the default font-size table when the caller did not supply one."""
+        if self.font_sizes is not None:
+            return
+        # A fresh dict is built per instance so instances never share the table.
+        self.font_sizes = dict(title=14, axis=12, tick=10, legend=10, text=9)
+class ModelParallelismVisualizer:
+    """Draw a grid of TP groups (rows) by virtual pipeline stages (columns) and save it as an image.
+    Each cell shows the layers held by one model copy; cells are colored per model copy.
+    """
+    def __init__(self, args, groups_dict, rank_models):
+        """
+        Initialize the visualizer.
+        Args:
+            args: parallel configuration parameters
+            groups_dict: parallel group information, keyed by group kind ("tp", "dp", ...)
+            rank_models: dict mapping each rank to its model configuration
+        """
+        self.groups_dict = groups_dict
+        self.rank_models = rank_models
+        self.config = VisualizationConfig()
+        # Compute the layout parameters once; every drawing helper reads them from self.layout
+        self.layout = self._calculate_layout(args)
+    def _calculate_layout(self, args) -> Dict[str, Any]:
+        """Collect the sizes, groups and representative ranks needed for drawing.
+        Returns:
+            A dict with the parallel sizes from ``args``, the TP groups, the transposed DP
+            groups, and ``model_representatives``, which maps ``(dp_idx, tp_idx)`` to the
+            first rank that belongs to both that transposed DP group and that TP group.
+        """
+        tp_groups = self.groups_dict["tp"]
+        # Without DP information every rank is treated as its own DP group
+        dp_groups = self.groups_dict.get(
+            "dp", [[rank] for rank in range(args.world_size)])
+        dp_size = args.data_parallel_size
+        # Transpose the DP groups: entry i gathers the i-th member of every DP group
+        dp_groups = list(zip(*dp_groups))
+        vpp_size = args.virtual_pipeline_parallel_size
+        # Pick the representative rank of each (model copy, TP group) pair
+        model_representatives = {}
+        for dp_idx, dp_group in enumerate(dp_groups):
+            for tp_idx, tp_group in enumerate(tp_groups):
+                representative_rank = next(
+                    (r for r in dp_group if r in tp_group), None)
+                if representative_rank is not None:
+                    model_representatives[(dp_idx, tp_idx)
+                                          ] = representative_rank
+        return {
+            'num_layers': args.num_layers,
+            'tp_groups': tp_groups,
+            'dp_groups': dp_groups,
+            'dp_size': dp_size,
+            'tp_size': args.tensor_parallel_size,
+            'pp_size': args.pipeline_parallel_size,
+            'vpp_size': vpp_size,
+            'num_tp': len(tp_groups),
+            'num_model_copies': len(dp_groups),
+            'model_representatives': model_representatives
+        }
+    def _calculate_figure_size(self) -> Tuple[float, float]:
+        """Compute the figure size from the layout, clamped to the configured limits.
+        Returns:
+            ``(width, height)``; the width already includes the legend allowance.
+        """
+        fig_height = min(
+            max(self.config.min_height,
+                self.config.height_per_tp * self.layout['num_tp']),
+            self.config.max_height
+        )
+        fig_width = min(
+            max(self.config.min_width,
+                self.config.width_per_stage * self.layout['vpp_size']),
+            self.config.max_width
+        )
+        # Reserve extra width for the legend
+        return fig_width + self.config.legend_width, fig_height
+    def _setup_colors(self):
+        """Choose one color per model copy and store the result in ``self.model_colors``."""
+        num_copies = self.layout['num_model_copies']
+        if num_copies <= 20:
+            self.model_colors = plt.cm.tab20(range(num_copies))
+        elif num_copies <= 40:
+            # Up to 40 copies: stack the 20-color tab20b and tab20c palettes
+            self.model_colors = np.vstack(
+                [plt.cm.tab20b(range(20)), plt.cm.tab20c(range(20))])
+        else:
+            # More than 40 copies: sample a continuous colormap.
+            # pyplot.get_cmap is used because matplotlib.cm.get_cmap was removed in Matplotlib 3.9.
+            colormap = plt.get_cmap('viridis')
+            norm = plt.Normalize(0, num_copies - 1)
+            self.model_colors = [colormap(norm(i)) for i in range(num_copies)]
+    def _setup_axes(self, ax):
+        """Set axis labels, title, limits, grid and ticks on ``ax``."""
+        ax.set_xlabel('Virtual Pipeline Stage',
+                      fontsize=self.config.font_sizes['axis'])
+        ax.set_ylabel('TP Group', fontsize=self.config.font_sizes['axis'])
+        # Title summarizing the parallel configuration
+        title = (f'Model Parallelism Configuration | '
+                 f'Total Layers: {self.layout["num_layers"]} | '
+                 f'DP={self.layout["dp_size"]} | '
+                 f'TP={self.layout["tp_size"]} | '
+                 f'PP={self.layout["pp_size"]} | '
+                 f'VPP={self.layout["vpp_size"]}')
+        ax.set_title(title, fontsize=self.config.font_sizes['title'], pad=20)
+        # Axis ranges: half a unit of padding around the integer cell centers
+        ax.set_xlim(-0.5, self.layout['vpp_size'] - 0.5)
+        ax.set_ylim(-0.5, self.layout['num_tp'] - 0.5)
+        ax.grid(True, linestyle='--', alpha=0.3)
+        # Tick positions and labels
+        self._setup_ticks(ax)
+    def _setup_ticks(self, ax):
+        """Label the x axis with stage indices and the y axis with TP group rank ranges."""
+        # X-axis ticks: one per virtual pipeline stage
+        ax.set_xticks(range(self.layout['vpp_size']))
+        ax.set_xticklabels(
+            [f'Stage {i}' for i in range(self.layout['vpp_size'])])
+        # Y-axis ticks: one label per TP group
+        tp_labels = []
+        for tp_idx, tp_group in enumerate(self.layout['tp_groups']):
+            min_rank = min(tp_group)
+            max_rank = max(tp_group)
+            if min_rank == max_rank:
+                # Single-rank group
+                tp_labels.append(f'Rank{min_rank}')
+            else:
+                tp_labels.append(f'Group{tp_idx}: Ranks{min_rank}-{max_rank}')
+        ax.set_yticks(range(self.layout['num_tp']))
+        ax.set_yticklabels(tp_labels, fontsize=self.config.font_sizes['tick'])
+    def _create_layer_text(self, layers: List) -> str:
+        """Build the short cell label for one stage.
+        Args:
+            layers: stage contents; ints are transformer layer numbers, and the strings
+                "Embedding" / "OutputLayer" mark the pre- and post-processing components.
+        Returns:
+            The parts "Embed", "L<min>-<max>" and "Out" that apply, joined by "+";
+            an empty string when none applies.
+        """
+        text_parts = []
+        trans_layers = [layer for layer in layers if isinstance(layer, int)]
+        if "Embedding" in layers:
+            text_parts.append("Embed")
+        if trans_layers:
+            text_parts.append(f"L{min(trans_layers)}-{max(trans_layers)}")
+        if "OutputLayer" in layers:
+            text_parts.append("Out")
+        return "+".join(text_parts)
+    def _draw_model_blocks(self, ax):
+        """Draw one block per (representative rank, virtual stage) with a progress bar."""
+        # Total number of blocks, used for the progress bar and the size warnings
+        total_blocks = sum(len(self.rank_models.get(representative_rank, []))
+                           for representative_rank in self.layout['model_representatives'].values())
+        if total_blocks > 5000:
+            logger.warning(
+                f"Large-scale drawing: {total_blocks} model stages, may take a long time")
+        with tqdm(total=total_blocks, desc="Drawing model stages", unit="stage") as pbar:
+            for (dp_idx, tp_idx), representative_rank in self.layout['model_representatives'].items():
+                model_configs = self.rank_models.get(representative_rank, [])
+                for vpp_stage, layers in enumerate(model_configs):
+                    self._draw_single_block(
+                        ax, dp_idx, tp_idx, vpp_stage, layers)
+                    pbar.update(1)
+        # This warning is emitted once drawing has finished
+        if total_blocks > 20000:
+            logger.warning(f"Large-scale visualization: {total_blocks} model stages detected, "
+                           f"this may cause memory overflow")
+    def _draw_single_block(self, ax, dp_idx: int, tp_idx: int, vpp_stage: int, layers: List):
+        """Draw one colored rectangle with its layer label at cell (vpp_stage, tp_idx)."""
+        # Build the label from the layer information
+        layer_text = self._create_layer_text(layers)
+        # Rectangle centered on the cell, colored by model copy
+        rect = Rectangle(
+            (vpp_stage - 0.45, tp_idx - 0.45), 0.9, 0.9,
+            facecolor=self.model_colors[dp_idx],
+            edgecolor='white',
+            linewidth=1,
+            alpha=0.8
+        )
+        ax.add_patch(rect)
+        # Text label in the middle of the cell
+        fontsize = self.config.font_sizes['text']
+        ax.text(
+            vpp_stage, tp_idx,
+            layer_text,
+            ha='center', va='center',
+            fontsize=fontsize,
+            bbox=dict(facecolor='white', alpha=0.3, pad=1)
+        )
+    def _add_legend(self, ax):
+        """Add a legend with one colored entry per model copy, placed right of the axes."""
+        legend_elements = [
+            plt.Rectangle((0, 0), 1, 1,
+                          facecolor=self.model_colors[i],
+                          alpha=0.8,
+                          label=f'Model Copy {i+1}')
+            for i in range(self.layout['num_model_copies'])
+        ]
+        ax.legend(
+            handles=legend_elements,
+            loc='center left',  # anchor the legend by the middle of its left edge
+            bbox_to_anchor=(1.02, 0.5),
+            title="Model Copies",
+            title_fontsize=self.config.font_sizes['legend'],
+            fontsize=self.config.font_sizes['legend']
+        )
+    def _visualize(self) -> plt.Figure:
+        """
+        Build the complete figure and return it.
+        """
+        # Create the figure
+        fig_width, fig_height = self._calculate_figure_size()
+        fig, ax = plt.subplots(figsize=(fig_width, fig_height), clear=True)
+        self._setup_colors()
+        self._setup_axes(ax)
+        # Adjust the layout, keeping the legend's share of the width free on the right
+        right_margin = 1 - self.config.legend_width / fig_width
+        plt.tight_layout(rect=[0, 0, right_margin, 1])
+        # Add the legend
+        self._add_legend(ax)
+        # Draw the model blocks
+        self._draw_model_blocks(ax)
+        return fig
+    def save(self, filepath: str):
+        """
+        Render the figure, write it to ``filepath`` and close it.
+        """
+        fig = self._visualize()
+        logger.info(f"Saving visualization result to {filepath}...")
+        fig.savefig(filepath, dpi=300, bbox_inches='tight')
+        plt.close(fig)
+@dataclass
+class ParallelConfig:
+    """Parallel configuration for the visualization: validates inputs and derives dependent sizes.
+    Construction validates the inputs, computes the derived sizes, creates the output
+    directory and then replaces ``output_path`` with the path of the PNG file to write.
+    """
+    world_size: int
+    num_layers: int
+    tensor_parallel_size: int = 1
+    pipeline_parallel_size: int = 1
+    # Takes precedence over virtual_pipeline_parallel_size
+    num_layers_per_virtual_pipeline_stage: int = None
+    order: str = "tp-cp-ep-dp-pp"
+    standalone_embedding_stage: bool = False
+    output_path: str = './'
+    # Fields below are (re)computed in _calculate_derived_parameters
+    virtual_pipeline_parallel_size: int = 1
+    data_parallel_size: int = None
+    transformer_pipeline_parallel_size: int = None
+    def __post_init__(self):
+        self._validate()
+        self._calculate_derived_parameters()
+        self._create_output_path()
+    def _calculate_derived_parameters(self):
+        """Compute the derived parameters.
+        Raises:
+            ValueError: if the layer counts do not divide evenly, or if virtual pipelining
+                is requested while pipeline_parallel_size is not greater than 1.
+        """
+        # Pipeline model parallel size, capped at world_size // tensor_parallel_size
+        self.pipeline_parallel_size = min(
+            self.pipeline_parallel_size,
+            (self.world_size // self.tensor_parallel_size)
+        )
+        # A standalone embedding stage takes one pipeline stage away from the transformer layers
+        self.transformer_pipeline_parallel_size = (
+            self.pipeline_parallel_size - 1
+            if self.standalone_embedding_stage else
+            self.pipeline_parallel_size
+        )
+        self._validate_pipeline_configs()
+        # Derive the VPP size from num_layers_per_virtual_pipeline_stage when it is given
+        if self.num_layers_per_virtual_pipeline_stage is not None:
+            num_layers_per_pipeline_stage = self.num_layers // self.transformer_pipeline_parallel_size
+            self.virtual_pipeline_parallel_size = (
+                num_layers_per_pipeline_stage // self.num_layers_per_virtual_pipeline_stage
+            )
+            if self.virtual_pipeline_parallel_size > 1 and self.pipeline_parallel_size <= 1:
+                raise ValueError(
+                    "pipeline-model-parallel size should be greater than 1 with virtual-pipeline"
+                )
+        # Data parallel size
+        self.data_parallel_size = self.world_size // (
+            self.tensor_parallel_size * self.pipeline_parallel_size
+        )
+    def _validate_pipeline_configs(self):
+        """Validate the per-stage layer counts of the pipeline.
+        Raises:
+            ValueError: if transformer_pipeline_parallel_size is 0, if num_layers is not
+                divisible by it, or if the layers per pipeline stage are not divisible by
+                num_layers_per_virtual_pipeline_stage.
+        """
+        if self.transformer_pipeline_parallel_size == 0 or \
+                self.num_layers % self.transformer_pipeline_parallel_size != 0:
+            if self.standalone_embedding_stage:
+                raise ValueError(
+                    f'number of layers ({self.num_layers}) must be divisible by '
+                    f'transformer_pipeline_parallel_size ({self.transformer_pipeline_parallel_size}), '
+                    f'which is pipeline_parallel_size-1 when standalone_embedding_stage is enabled.'
+                )
+            else:
+                raise ValueError(
+                    f'number of layers ({self.num_layers}) must be divisible by '
+                    f'pipeline_parallel_size ({self.pipeline_parallel_size}).'
+                )
+        num_layers_per_pipeline_stage = self.num_layers // self.transformer_pipeline_parallel_size
+        if self.num_layers_per_virtual_pipeline_stage is not None:
+            if num_layers_per_pipeline_stage % self.num_layers_per_virtual_pipeline_stage != 0:
+                raise ValueError(
+                    f'number of layers per pipeline stage ({num_layers_per_pipeline_stage}) must be divisible by '
+                    f'number of layers per virtual pipeline stage ({self.num_layers_per_virtual_pipeline_stage}).'
+                )
+    def _create_output_path(self):
+        """Create the output directory and point ``output_path`` at the PNG file inside it.
+        A file already present at that path is removed first.
+        """
+        create_directory(self.output_path)
+        file_name = f"ws{self.world_size}_ln{self.num_layers}" \
+                    f"_tp{self.tensor_parallel_size}" \
+                    f"_pp{self.pipeline_parallel_size}" \
+                    f"_vpp{self.virtual_pipeline_parallel_size}.png"
+        png_path = os.path.join(self.output_path, file_name)
+        if os.path.exists(png_path):
+            logger.warning(f"Existing path will be overwritten: {png_path}")
+            remove_path(png_path)
+        self.output_path = png_path
+    def _validate(self):
+        """
+        Validate the type and range of every configuration input.
+        order is validated inside the RankGroupGenerator class.
+        data_parallel_size is computed (and overwritten) in _calculate_derived_parameters.
+        Raises:
+            ValueError: if any input is out of range or of the wrong type.
+        """
+        # An unset per-VPP layer count is checked as 1 so it passes the positive-integer test
+        per_vpp = self.num_layers_per_virtual_pipeline_stage if \
+            self.num_layers_per_virtual_pipeline_stage is not None else 1
+        if self.tensor_parallel_size is None:
+            self.tensor_parallel_size = 1
+        if self.pipeline_parallel_size is None:
+            self.pipeline_parallel_size = 1
+        for name, _input in {
+            "world_size": self.world_size,
+            "num_layers": self.num_layers,
+            "tensor_parallel_size": self.tensor_parallel_size,
+            "pipeline_parallel_size": self.pipeline_parallel_size,
+            "num_layers_per_virtual_pipeline_stage": per_vpp
+        }.items():
+            if not is_int(_input) or _input < 1:
+                raise ValueError(f"{name} must be a positive integer")
+        if self.world_size > 1024:
+            raise ValueError(
+                f"world_size ({self.world_size}) exceeds the maximum supported value of 1024.")
+        if self.num_layers > 256:
+            raise ValueError(
+                f"num_layers ({self.num_layers}) exceeds the maximum supported value of 256.")
+        if (self.world_size % (self.tensor_parallel_size * self.pipeline_parallel_size) != 0):
+            raise ValueError(
+                f"world_size ({self.world_size}) is not divisible by "
+                f"tensor_parallel_size({self.tensor_parallel_size}) x "
+                f"pipeline_parallel_size ({self.pipeline_parallel_size})"
+            )
+        if not isinstance(self.standalone_embedding_stage, bool):
+            raise ValueError("standalone_embedding_stage must be a boolean")
+class ModelLayerSimulator:
+    """
+    Model simulation: one place that derives the layer list held by each rank.
+    Stage contents mix the strings "Embedding" / "OutputLayer" with int transformer layer
+    numbers, although the return annotations below say ``str``.
+    """
+    def __init__(self, args: 'ParallelConfig', pp_stage_list: list):
+        # pp_stage_list[i] is the collection of ranks belonging to pipeline stage i
+        self.args, self.pp_stage_list = args, pp_stage_list
+    def get_model_for_rank(self, rank: int) -> List[List[str]]:
+        """
+        Return the per-stage layer lists for the given rank.
+        """
+        builder = (
+            self._create_virtual_pipeline_model
+            if self._should_use_virtual_pipeline()
+            else self._create_standard_pipeline_model
+        )
+        return builder(rank)
+    def _should_use_virtual_pipeline(self) -> bool:
+        """Tell whether the virtual pipeline strategy applies (VPP size greater than 1)."""
+        vpp_size = self.args.virtual_pipeline_parallel_size
+        return vpp_size > 1
+    def _create_virtual_pipeline_model(self, rank: int) -> List[List[str]]:
+        """Virtual pipeline mode: build one stage configuration per virtual stage."""
+        return [
+            self._create_single_stage_config(
+                rank,
+                stage_idx,
+                # Only the true first / last virtual stage carries embedding / output layers
+                self._is_pipeline_first_stage(rank, stage_idx),
+                self._is_pipeline_last_stage(rank, stage_idx),
+            )
+            for stage_idx in range(self.args.virtual_pipeline_parallel_size)
+        ]
+    def _create_standard_pipeline_model(self, rank: int) -> List[List[str]]:
+        """Standard pipeline mode: build a single stage configuration."""
+        starts_pipeline = self._is_pipeline_first_stage(rank, 0)
+        ends_pipeline = self._is_pipeline_last_stage(rank, -1)
+        return [self._create_single_stage_config(rank, 0, starts_pipeline, ends_pipeline)]
+    def _create_single_stage_config(self, rank: int, vpp_stage: int,
+                                    is_first_stage: bool, is_last_stage: bool) -> List[str]:
+        """
+        Build the component list of one stage (virtual or regular).
+        """
+        # Pre-processing component (embedding), present on the first stage only
+        head = ["Embedding"] if is_first_stage else []
+        # Transformer layer components
+        body = self._create_transformer_layers(rank, vpp_stage)
+        # Post-processing component (output layer), present on the last stage only
+        tail = ["OutputLayer"] if is_last_stage else []
+        return head + list(body) + tail
+    def _create_transformer_layers(self, rank: int, vpp_stage: int) -> List[str]:
+        """Return the 1-based transformer layer numbers held by this rank and stage."""
+        count = self._calculate_transformer_layers(rank)
+        if not count:
+            return []
+        # Layer numbers start right after the offset
+        first_layer = self._calculate_layer_offset(rank, vpp_stage) + 1
+        return list(range(first_layer, first_layer + count))
+    def _calculate_transformer_layers(self, rank: int) -> int:
+        """Return how many transformer layers the rank holds per (virtual) stage."""
+        cfg = self.args
+        # No pipeline parallelism: the rank holds every layer
+        if cfg.pipeline_parallel_size <= 1:
+            return cfg.num_layers
+        # A standalone embedding stage holds no transformer layers
+        if cfg.standalone_embedding_stage and self._is_pipeline_first_stage(rank, 0):
+            return 0
+        per_stage = cfg.num_layers // cfg.transformer_pipeline_parallel_size
+        if not self._should_use_virtual_pipeline():
+            return per_stage
+        return per_stage // cfg.virtual_pipeline_parallel_size
+    def _calculate_layer_offset(self, rank: int, vpp_stage: int) -> int:
+        """Return the number of layers that precede this rank's first layer in the stage."""
+        cfg = self.args
+        stage_idx = self._get_pipeline_rank(rank)
+        if cfg.standalone_embedding_stage:
+            # The embedding stage does not count towards the transformer stages
+            stage_idx -= 1
+        per_stage = cfg.num_layers // cfg.transformer_pipeline_parallel_size
+        if not self._should_use_virtual_pipeline():
+            # Regular pipeline: split directly by pipeline stage
+            return stage_idx * per_stage
+        # Virtual pipeline: each pipeline stage is split further into virtual stages
+        vpp_size = cfg.virtual_pipeline_parallel_size
+        per_virtual_stage = per_stage // vpp_size
+        return vpp_stage * (cfg.num_layers // vpp_size) + \
+            (stage_idx * per_virtual_stage)
+    def _is_pipeline_first_stage(self, rank: int, vpp_stage: int) -> bool:
+        """Tell whether the rank is in the first pipeline stage at virtual stage 0."""
+        in_first_stage = rank in self.pp_stage_list[0]
+        return in_first_stage and vpp_stage == 0
+    def _is_pipeline_last_stage(self, rank: int, vpp_stage: int) -> bool:
+        """Tell whether the rank is in the last pipeline stage."""
+        # Virtual pipeline: only the final virtual stage counts as the real last stage
+        if self._should_use_virtual_pipeline():
+            final_vpp_stage = self.args.virtual_pipeline_parallel_size - 1
+            if vpp_stage != final_vpp_stage:
+                return False
+        return rank in self.pp_stage_list[-1]
+    def _get_pipeline_rank(self, rank: int) -> int:
+        """Return the index of the pipeline stage containing the rank, or 0 if none does."""
+        return next(
+            (stage_idx for stage_idx, members in enumerate(self.pp_stage_list)
+             if rank in members),
+            0,
+        )
+    # Build the model configuration of every rank in one pass
+    def generate_all_models(self) -> Dict[int, List[List[str]]]:
+        """Return a dict mapping every rank in ``range(world_size)`` to its model configuration."""
+        models = {}
+        for rank in range(self.args.world_size):
+            models[rank] = self.get_model_for_rank(rank)
+        return models
+def plot_model_parallelism(args: 'ParallelConfig'):
+    """Generate the rank groups, simulate every rank's layers and save the figure.
+    Args:
+        args: parallel configuration; the figure is written to ``args.output_path``.
+    """
+    logger.info("Starting model parallelism visualization")
+    logger.info("Generating model configurations for each rank...")
+    group_generator = RankGroupGenerator(
+        args.tensor_parallel_size,
+        1,  # expert_parallel
+        args.data_parallel_size,
+        args.pipeline_parallel_size,
+        1,  # context_parallel
+        args.order
+    )
+    groups_dict = group_generator.generate_all_ranks()
+    # Transpose the PP groups so that entry i holds the ranks of pipeline stage i
+    pp_stage_list = list(zip(*groups_dict.get("pp", [])))
+    simulator = ModelLayerSimulator(args, pp_stage_list)
+    rank_models = simulator.generate_all_models()
+    tp_count = len(groups_dict.get('tp', []))
+    dp_count = len(groups_dict.get('dp', []))
+    pp_count = len(groups_dict.get('pp', []))
+    logger.info(f"Model configuration generation completed: "
+                f"{tp_count} TP groups, "
+                f"{dp_count} DP groups, "
+                f"{pp_count} PP groups")
+    logger.info("Starting visualization...")
+    visualizer = ModelParallelismVisualizer(args, groups_dict, rank_models)
+    visualizer.save(args.output_path)
+    logger.info("Done")

msprobe/core/common/parallel_state.py CHANGED Viewed

@@ -1,17 +1,18 @@
-# Copyright (c) 2024-2025, Huawei Technologies Co., Ltd.
-# All rights reserved.
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
 #
-# Licensed under the Apache License, Version 2.0  (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
 #
-# http://www.apache.org/licenses/LICENSE-2.0
+#          http://license.coscl.org.cn/MulanPSL2
 #
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
 from typing import List

msprobe/core/common/runtime.py CHANGED Viewed

@@ -1,17 +1,18 @@
-# Copyright (c) 2025, Huawei Technologies Co., Ltd.
-# All rights reserved.
+# -------------------------------------------------------------------------
+#  This file is part of the MindStudio project.
+# Copyright (c) 2025 Huawei Technologies Co.,Ltd.
 #
-# Licensed under the Apache License, Version 2.0  (the "License");
-# you may not use this file except in compliance with the License.
-# You may obtain a copy of the License at
+# MindStudio is licensed under Mulan PSL v2.
+# You can use this software according to the terms and conditions of the Mulan PSL v2.
+# You may obtain a copy of Mulan PSL v2 at:
 #
-# http://www.apache.org/licenses/LICENSE-2.0
+#          http://license.coscl.org.cn/MulanPSL2
 #
-# Unless required by applicable law or agreed to in writing, software
-# distributed under the License is distributed on an "AS IS" BASIS,
-# WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
-# See the License for the specific language governing permissions and
-# limitations under the License.
+# THIS SOFTWARE IS PROVIDED ON AN "AS IS" BASIS, WITHOUT WARRANTIES OF ANY KIND,
+# EITHER EXPRESS OR IMPLIED, INCLUDING BUT NOT LIMITED TO NON-INFRINGEMENT,
+# MERCHANTABILITY OR FIT FOR A PARTICULAR PURPOSE.
+# See the Mulan PSL v2 for more details.
+# -------------------------------------------------------------------------
 from msprobe.core.common.const import Const

mindstudio-probe 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl

mindstudio-probe 8.3.3__py3-none-any.whl → 26.0.0a1__py3-none-any.whl