PyPI - mindspore - Versions diffs - 2.2.0__cp37-cp37m-manylinux1_x86_64.whl → 2.2.11__cp37-cp37m-manylinux1_x86_64.whl - Mend

mindspore 2.2.0__cp37-cp37m-manylinux1_x86_64.whl → 2.2.11__cp37-cp37m-manylinux1_x86_64.whl

This diff represents the content of publicly available package versions that have been released to one of the supported registries. The information contained in this diff is provided for informational purposes only and reflects changes between package versions as they appear in their respective public registries.

Files changed (170)

mindspore/.commit_id +1 -1
mindspore/_akg/akg/composite/build_module.py +104 -20
mindspore/_akg/akg/utils/ascend_profilier/cann_file_parser.py +76 -0
mindspore/_akg/akg/utils/ascend_profilier/file_manager.py +56 -0
mindspore/_akg/akg/utils/ascend_profilier/op_summary_bean.py +23 -0
mindspore/_akg/akg/utils/ascend_profilier/op_summary_headers.py +8 -0
mindspore/_akg/akg/utils/ascend_profilier/op_summary_parser.py +42 -0
mindspore/_akg/akg/utils/ascend_profilier/path_manager.py +65 -0
mindspore/_akg/akg/utils/composite_op_helper.py +7 -2
mindspore/_akg/akg/utils/dump_ascend_meta.py +22 -3
mindspore/_akg/akg/utils/kernel_exec.py +41 -15
mindspore/_akg/akg/utils/tbe_codegen_utils.py +27 -6
mindspore/_akg/akg/utils/util.py +56 -1
mindspore/_c_dataengine.cpython-37m-x86_64-linux-gnu.so +0 -0
mindspore/_c_expression.cpython-37m-x86_64-linux-gnu.so +0 -0
mindspore/_checkparam.py +3 -3
mindspore/_extends/graph_kernel/model/graph_split.py +84 -76
mindspore/_extends/graph_kernel/splitter.py +3 -2
mindspore/_extends/parallel_compile/akg_compiler/build_tbe_kernel.py +83 -66
mindspore/_extends/parallel_compile/akg_compiler/tbe_topi.py +4 -4
mindspore/_extends/parallel_compile/akg_compiler/util.py +10 -7
mindspore/_extends/parallel_compile/tbe_compiler/tbe_helper.py +2 -1
mindspore/_extends/parse/__init__.py +3 -2
mindspore/_extends/parse/parser.py +6 -1
mindspore/_extends/parse/standard_method.py +14 -11
mindspore/_extends/remote/kernel_build_server.py +2 -1
mindspore/_mindspore_offline_debug.cpython-37m-x86_64-linux-gnu.so +0 -0
mindspore/bin/cache_admin +0 -0
mindspore/bin/cache_server +0 -0
mindspore/common/_utils.py +16 -0
mindspore/common/api.py +1 -1
mindspore/common/auto_dynamic_shape.py +81 -85
mindspore/common/dump.py +1 -1
mindspore/common/tensor.py +3 -20
mindspore/config/op_info.config +1 -1
mindspore/context.py +11 -4
mindspore/dataset/engine/cache_client.py +8 -5
mindspore/dataset/engine/datasets_standard_format.py +5 -0
mindspore/dataset/vision/transforms.py +21 -21
mindspore/experimental/optim/adam.py +1 -1
mindspore/gen_ops.py +1 -1
mindspore/include/api/model.h +17 -0
mindspore/include/api/status.h +8 -3
mindspore/lib/libdnnl.so.2 +0 -0
mindspore/lib/libmindspore.so +0 -0
mindspore/lib/libmindspore_backend.so +0 -0
mindspore/lib/libmindspore_common.so +0 -0
mindspore/lib/libmindspore_core.so +0 -0
mindspore/lib/libmindspore_glog.so.0 +0 -0
mindspore/lib/libmindspore_gpr.so.15 +0 -0
mindspore/lib/libmindspore_grpc++.so.1 +0 -0
mindspore/lib/libmindspore_grpc.so.15 +0 -0
mindspore/lib/libmindspore_shared_lib.so +0 -0
mindspore/lib/libnnacl.so +0 -0
mindspore/lib/libopencv_core.so.4.5 +0 -0
mindspore/lib/libopencv_imgcodecs.so.4.5 +0 -0
mindspore/lib/libopencv_imgproc.so.4.5 +0 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310/aic-ascend310-ops-info.json +123 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend310p/aic-ascend310p-ops-info.json +123 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910/aic-ascend910-ops-info.json +158 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/config/ascend910b/aic-ascend910b-ops-info.json +37 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_dsl.py +46 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/add_tik.py +51 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/kv_cache_mgr.py +241 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/ai_core/tbe/custom_aicore_ops_impl/matmul_tik.py +212 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/add_dsl.py +46 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/add_tik.py +51 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/kv_cache_mgr.py +241 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_impl/vector_core/tbe/custom_aicore_ops_impl/matmul_tik.py +212 -0
mindspore/lib/plugin/ascend/custom_aicore_ops/op_proto/libop_proto.so +0 -0
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_aicpu_kernels.so +0 -0
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/aicpu_kernel/impl/libcust_cpu_kernels.so +0 -0
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_impl/cpu/config/cust_aicpu_kernel.json +78 -80
mindspore/lib/plugin/ascend/custom_aicpu_ops/op_proto/libcust_op_proto.so +0 -0
mindspore/lib/plugin/ascend/libakg.so +0 -0
mindspore/lib/plugin/ascend/libhccl_plugin.so +0 -0
mindspore/lib/plugin/ascend/libmindspore_aicpu_kernels.so +0 -0
mindspore/lib/plugin/ascend/libmindspore_cpu_kernels.so +0 -0
mindspore/lib/plugin/cpu/libakg.so +0 -0
mindspore/lib/plugin/gpu/libcuda_ops.so.10 +0 -0
mindspore/lib/plugin/gpu/libcuda_ops.so.11 +0 -0
mindspore/lib/plugin/gpu10.1/libakg.so +0 -0
mindspore/lib/plugin/gpu10.1/libnccl.so.2 +0 -0
mindspore/lib/plugin/gpu11.1/libakg.so +0 -0
mindspore/lib/plugin/gpu11.6/libakg.so +0 -0
mindspore/lib/plugin/gpu11.6/libnccl.so.2 +0 -0
mindspore/lib/plugin/libmindspore_ascend.so.1 +0 -0
mindspore/lib/plugin/libmindspore_ascend.so.2 +0 -0
mindspore/lib/plugin/libmindspore_gpu.so.10.1 +0 -0
mindspore/lib/plugin/libmindspore_gpu.so.11.1 +0 -0
mindspore/lib/plugin/libmindspore_gpu.so.11.6 +0 -0
mindspore/nn/cell.py +0 -3
mindspore/nn/layer/activation.py +4 -5
mindspore/nn/layer/conv.py +39 -23
mindspore/nn/layer/flash_attention.py +54 -129
mindspore/nn/layer/math.py +3 -7
mindspore/nn/layer/rnn_cells.py +5 -5
mindspore/nn/wrap/__init__.py +4 -2
mindspore/nn/wrap/cell_wrapper.py +12 -3
mindspore/numpy/utils_const.py +5 -5
mindspore/ops/_grad_experimental/grad_array_ops.py +1 -1
mindspore/ops/_grad_experimental/grad_implementations.py +2 -2
mindspore/ops/_grad_experimental/grad_math_ops.py +19 -18
mindspore/ops/_grad_experimental/grad_sparse_ops.py +3 -3
mindspore/ops/_op_impl/aicpu/add.py +3 -3
mindspore/ops/_op_impl/aicpu/linear_sum_assignment.py +21 -2
mindspore/ops/_utils/utils.py +2 -0
mindspore/ops/composite/multitype_ops/_compile_utils.py +2 -1
mindspore/ops/composite/multitype_ops/getitem_impl.py +2 -2
mindspore/ops/function/array_func.py +10 -7
mindspore/ops/function/grad/grad_func.py +0 -1
mindspore/ops/function/nn_func.py +98 -9
mindspore/ops/function/random_func.py +2 -1
mindspore/ops/op_info_register.py +24 -21
mindspore/ops/operations/__init__.py +6 -2
mindspore/ops/operations/_grad_ops.py +25 -6
mindspore/ops/operations/_inner_ops.py +155 -23
mindspore/ops/operations/array_ops.py +9 -7
mindspore/ops/operations/comm_ops.py +2 -2
mindspore/ops/operations/custom_ops.py +85 -68
mindspore/ops/operations/inner_ops.py +26 -3
mindspore/ops/operations/math_ops.py +7 -6
mindspore/ops/operations/nn_ops.py +193 -49
mindspore/parallel/_parallel_serialization.py +10 -3
mindspore/parallel/_tensor.py +4 -1
mindspore/parallel/checkpoint_transform.py +13 -2
mindspore/parallel/shard.py +17 -10
mindspore/profiler/common/util.py +1 -0
mindspore/profiler/parser/ascend_hccl_generator.py +232 -0
mindspore/profiler/parser/ascend_msprof_exporter.py +86 -43
mindspore/profiler/parser/ascend_msprof_generator.py +196 -9
mindspore/profiler/parser/ascend_op_generator.py +1 -1
mindspore/profiler/parser/ascend_timeline_generator.py +6 -182
mindspore/profiler/parser/base_timeline_generator.py +1 -1
mindspore/profiler/parser/cpu_gpu_timeline_generator.py +2 -2
mindspore/profiler/parser/framework_parser.py +1 -1
mindspore/profiler/parser/profiler_info.py +19 -0
mindspore/profiler/profiling.py +46 -24
mindspore/rewrite/api/pattern_engine.py +1 -1
mindspore/rewrite/parsers/for_parser.py +7 -7
mindspore/rewrite/parsers/module_parser.py +4 -4
mindspore/rewrite/symbol_tree.py +1 -4
mindspore/run_check/_check_version.py +5 -3
mindspore/safeguard/rewrite_obfuscation.py +52 -28
mindspore/scipy/ops.py +55 -5
mindspore/scipy/optimize/__init__.py +3 -2
mindspore/scipy/optimize/linear_sum_assignment.py +38 -33
mindspore/train/callback/_summary_collector.py +1 -1
mindspore/train/dataset_helper.py +1 -0
mindspore/train/model.py +2 -2
mindspore/train/serialization.py +97 -11
mindspore/train/summary/_summary_adapter.py +1 -1
mindspore/train/summary/summary_record.py +23 -7
mindspore/version.py +1 -1
{mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/METADATA +3 -2
{mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/RECORD +160 -151
mindspore/ops/_op_impl/_custom_op/flash_attention/attention.py +0 -406
mindspore/ops/_op_impl/_custom_op/flash_attention/constants.py +0 -41
mindspore/ops/_op_impl/_custom_op/flash_attention/flash_attention_bwd.py +0 -467
mindspore/ops/_op_impl/_custom_op/flash_attention/flash_attention_fwd.py +0 -563
mindspore/ops/_op_impl/_custom_op/flash_attention/flash_attention_impl.py +0 -193
mindspore/ops/_op_impl/_custom_op/flash_attention/tik_ops_utils.py +0 -435
mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/__init__.py +0 -0
mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/sparse_tiling.py +0 -45
mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/strategy.py +0 -67
mindspore/ops/_op_impl/_custom_op/flash_attention/tiling_strategy/wukong_tiling.py +0 -62
/mindspore/{ops/_op_impl/_custom_op/flash_attention → _akg/akg/utils/ascend_profilier}/__init__.py +0 -0
{mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/WHEEL +0 -0
{mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/entry_points.txt +0 -0
{mindspore-2.2.0.dist-info → mindspore-2.2.11.dist-info}/top_level.txt +0 -0

mindspore/profiler/parser/ascend_msprof_generator.py CHANGED

@@ -20,7 +20,7 @@ import os
 import numpy as np
-class AscendMsprofDataGenerator:
+class AscendMsprofDataGeneratorOld:
     """Generate ascend data from files."""
     def __init__(self, source_path):
@@ -47,10 +47,15 @@ class AscendMsprofDataGenerator:
             'Output Data Types': {'index': self.invalid_index, 'dtype': ('Output Data Types', object)},
             'Output Formats': {'index': self.invalid_index, 'dtype': ('Output Formats', object)},
         }
-        self.op_summary_extend_name = {
+        self.op_summaryA_extend_name = {
             'vector_fops': {'index': self.invalid_index, 'dtype': ('vector_fops', float)},
             'cube_fops': {'index': self.invalid_index, 'dtype': ('cube_fops', float)},
         }
+        self.op_summaryB_extend_name = {
+            'aiv_vector_fops': {'index': self.invalid_index, 'dtype': ('vector_fops', float)},
+            'aic_cube_fops': {'index': self.invalid_index, 'dtype': ('cube_fops', float)},
+        }
         self.op_summary_name = None
         self.op_statistic_name = {
@@ -110,10 +115,15 @@ class AscendMsprofDataGenerator:
                 iteration = int(file.split('_')[-1].split('.')[0])
                 reader = csv.reader(csvfile, delimiter=',', quotechar='"')
                 header = next(reader)
-                self.link_index_with_name(header, self.op_summary_basis_name)
-                extend_flag = self.link_index_with_name(header, self.op_summary_extend_name)
-                if extend_flag:
-                    self.op_summary_name = {**self.op_summary_basis_name, **self.op_summary_extend_name}
+                flag = self.link_index_with_name(header, self.op_summary_basis_name)
+                if not flag:
+                    raise RuntimeError("Read op summary failed. The file is missing basic fields.")
+                extend_flag_A = self.link_index_with_name(header, self.op_summaryA_extend_name)
+                extend_flag_B = self.link_index_with_name(header, self.op_summaryB_extend_name)
+                if extend_flag_A:
+                    self.op_summary_name = {**self.op_summary_basis_name, **self.op_summaryA_extend_name}
+                elif extend_flag_B:
+                    self.op_summary_name = {**self.op_summary_basis_name, **self.op_summaryB_extend_name}
                 else:
                     self.op_summary_name = self.op_summary_basis_name
                 self.op_summary_name['Iteration ID'] = {'index': -1, 'dtype': ('Iteration ID', object)}
@@ -137,7 +147,9 @@ class AscendMsprofDataGenerator:
             with open(file, newline='') as csvfile:
                 reader = csv.reader(csvfile, delimiter=',', quotechar='"')
                 header = next(reader)
-                self.link_index_with_name(header, self.op_statistic_name)
+                flag = self.link_index_with_name(header, self.op_statistic_name)
+                if not flag:
+                    raise RuntimeError("Read op summary failed. The file is missing basic fields.")
                 for row in reader:
                     row = [row[index.get('index')] for index in self.op_statistic_name.values()]
                     row = ['0' if i == 'N/A' else i for i in row]
@@ -155,7 +167,9 @@ class AscendMsprofDataGenerator:
             with open(file, newline='') as csvfile:
                 reader = csv.reader(csvfile, delimiter=',', quotechar='"')
                 header = next(reader)
-                self.link_index_with_name(header, self.steptrace_name)
+                flag = self.link_index_with_name(header, self.steptrace_name)
+                if not flag:
+                    raise RuntimeError("Read op summary failed. The file is missing basic fields.")
                 for row in reader:
                     rows = [row[index.get('index')] for index in self.steptrace_name.values()]
                     if row[9:]:
@@ -182,7 +196,7 @@ class AscendMsprofDataGenerator:
         for i in range(len(self.steptrace_name), len(header), 2):
             name = f'hccl_{i}'
             self.steptrace_name[name] = {'index': i, 'dtype': (name, float)}
-            self.steptrace_name[f'{name} duration'] = {'index': i+1, 'dtype': (f'{name} duration', float)}
+            self.steptrace_name[f'{name} duration'] = {'index': i + 1, 'dtype': (f'{name} duration', float)}
         steptrace_dt = np.dtype([value['dtype'] for value in self.steptrace_name.values()])
@@ -197,3 +211,176 @@ class AscendMsprofDataGenerator:
         for name in self.steptrace.dtype.names[9:]:
             self.steptrace[name] = self.steptrace[name] * 1e-3
+class AscendMsprofDataGenerator:
+    """Generate ascend data from files."""
+    def __init__(self, source_path):
+        self.source_path = source_path
+        self.op_summary = None
+        self.op_statistic = None
+        self.steptrace = []
+        self.op_summary_type = [
+            ('Model ID', int),
+            ('Task ID', int),
+            ('Stream ID', int),
+            ('Op Name', object),
+            ('Op Type', object),
+            ('Task Type', object),
+            ('Task Start Time', float),
+            ('Task Duration', float),
+            ('Task Wait Time', float),
+            ('Input Shapes', object),
+            ('Input Data Types', object),
+            ('Input Formats', object),
+            ('Output Shapes', object),
+            ('Output Data Types', object),
+            ('Output Formats', object)
+        ]
+        self.op_statistic_type = [
+            ('Op Type', object),
+            ('Count', int),
+            ('Total Time', float),
+        ]
+        self.steptrace_type = [
+            ('Iteration ID', int),
+            ('FP Start', float),
+            ('BP End', float),
+            ('Iteration End', float),
+            ('Iteration Time', float),
+            ('FP to BP Time', float),
+            ('Iteration Refresh', float),
+            ('Data Aug Bound', float),
+            ('Model ID', int),
+        ]
+    @staticmethod
+    def find_files(directory, pattern):
+        """Find files with feature 'pattern' from the directory"""
+        for root, _, files in os.walk(directory):
+            files.sort(key=lambda x: os.path.getctime(os.path.join(directory, x)))
+            for basename in files:
+                if fnmatch.fnmatch(basename, pattern):
+                    filename = os.path.join(root, basename)
+                    yield filename
+    def parse(self):
+        """read msprof data generate DataFrame data"""
+        self._read_op_summary()
+        self._read_op_statistic()
+        self._read_steptrace()
+        return self.op_summary, self.op_statistic, self.steptrace
+    def _read_op_summary(self):
+        """read op summary to memory"""
+        op_summary = []
+        for file in self.find_files(self.source_path, "op_summary*.csv"):
+            with open(file, newline='') as csvfile:
+                reader = csv.DictReader(csvfile, delimiter=',', quotechar='"')
+                for row in reader:
+                    vector_fops = row.get('vector_fops', None)
+                    cube_fops = row.get('cube_fops', None)
+                    aiv_vector_fops = row.get('aiv_vector_fops', None)
+                    aic_cube_fops = row.get('aic_cube_fops', None)
+                    new_row = [
+                        row.get('Model ID'),
+                        row.get('Task ID'),
+                        row.get('Stream ID'),
+                        row.get('Op Name'),
+                        row.get('OP Type'),
+                        row.get('Task Type'),
+                        row.get('Task Start Time(us)'),
+                        row.get('Task Duration(us)'),
+                        row.get('Task Wait Time(us)'),
+                        row.get('Input Shapes'),
+                        row.get('Input Data Types'),
+                        row.get('Input Formats'),
+                        row.get('Output Shapes'),
+                        row.get('Output Data Types'),
+                        row.get('Output Formats')
+                    ]
+                    if vector_fops is not None and cube_fops is not None:
+                        new_row.append(vector_fops)
+                        new_row.append(cube_fops)
+                    elif aic_cube_fops is not None and aiv_vector_fops is not None:
+                        new_row.append(aiv_vector_fops)
+                        new_row.append(aic_cube_fops)
+                    new_row = tuple(['0' if d == 'N/A' else d for d in new_row])
+                    op_summary.append(new_row)
+            break
+        if op_summary and len(op_summary[0]) > len(self.op_summary_type):
+            self.op_summary_type.extend([
+                ('vector_fops', float),
+                ('cube_fops', float)
+            ])
+        op_summary_dt = np.dtype(self.op_summary_type)
+        self.op_summary = np.array(op_summary, dtype=op_summary_dt)
+        self.op_summary['Task Start Time'] *= 1e-3
+        self.op_summary['Task Duration'] *= 1e-3
+        self.op_summary['Task Wait Time'] *= 1e-3
+    def _read_op_statistic(self):
+        """read op statistic to memory"""
+        op_statistic = []
+        for file in self.find_files(self.source_path, "op_statistic*.csv"):
+            with open(file, newline='') as csvfile:
+                reader = csv.DictReader(csvfile, delimiter=',', quotechar='"')
+                for row in reader:
+                    new_row = (
+                        row.get('OP Type'),
+                        row.get('Count'),
+                        row.get('Total Time(us)'),
+                    )
+                    new_row = tuple(['0' if d == 'N/A' else d for d in new_row])
+                    op_statistic.append(new_row)
+            break
+        op_statistic_dt = np.dtype(self.op_statistic_type)
+        self.op_statistic = np.array(op_statistic, dtype=op_statistic_dt)
+        self.op_statistic['Total Time'] *= 1e-3
+    def _read_steptrace(self):
+        """read steptrace to memory"""
+        steptrace = []
+        for file in self.find_files(self.source_path, "step_trace*.csv"):
+            with open(file, newline='') as csvfile:
+                reader = csv.DictReader(csvfile, delimiter=',', quotechar='"')
+                for row in reader:
+                    new_row = [
+                        row.get('Iteration ID'),
+                        row.get('FP Start(us)'),
+                        row.get('BP End(us)'),
+                        row.get('Iteration End(us)'),
+                        row.get('Iteration Time(us)'),
+                        row.get('FP to BP Time(us)'),
+                        row.get('Iteration Refresh(us)'),
+                        row.get('Data Aug Bound(us)'),
+                        row.get('Model ID'),
+                    ]
+                    new_row = ['0' if i == 'N/A' else i for i in new_row]
+                    steptrace.append(tuple(new_row))
+        steptrace_dt = np.dtype(self.steptrace_type)
+        self.steptrace = np.array(steptrace, dtype=steptrace_dt)
+        self.steptrace['FP Start'] = self.steptrace['FP Start'] * 1e-3
+        self.steptrace['BP End'] = self.steptrace['BP End'] * 1e-3
+        self.steptrace['Iteration End'] = self.steptrace['Iteration End'] * 1e-3
+        self.steptrace['Iteration Time'] = self.steptrace['Iteration Time'] * 1e-3
+        self.steptrace['FP to BP Time'] = self.steptrace['FP to BP Time'] * 1e-3
+        self.steptrace['Iteration Refresh'] = self.steptrace['Iteration Refresh'] * 1e-3
+        self.steptrace['Data Aug Bound'] = self.steptrace['Data Aug Bound'] * 1e-3

mindspore/profiler/parser/ascend_op_generator.py CHANGED

@@ -124,7 +124,7 @@ class AscendOPGenerator:
                     writer.writerows(self.aicpu_detail.tolist())
             except (IOError, OSError) as err:
                 logging.critical('Errot occurred when write aicpu detail file: %s', err)
-                raise ProfilerIOException()
+                raise ProfilerIOException() from err
             if os.path.exists(aicpu_intermediate_detail_path):
                 os.chmod(aicpu_intermediate_detail_path, stat.S_IREAD | stat.S_IWRITE)

mindspore/profiler/parser/ascend_timeline_generator.py CHANGED

@@ -13,7 +13,6 @@
 # limitations under the License.
 # ============================================================================
 """The integrator for integrating parsed profiling files."""
-import os
 import numpy as np
 from mindspore import log as logger
@@ -22,7 +21,6 @@ from mindspore.profiler.parser.base_timeline_generator import BaseTimelineGenera
 from mindspore.profiler.parser.container import TimelineContainer
 from mindspore.profiler.parser.cpu_gpu_timeline_generator import CpuTimelineGenerator
 from mindspore.profiler.parser.integrator import DeviceTarget
-from mindspore.profiler.parser.op_intermediate_parser import OPIntermediateParser
 class AscendTimelineGenerator(BaseTimelineGenerator):
@@ -51,16 +49,6 @@ class AscendTimelineGenerator(BaseTimelineGenerator):
             [('Op Name', object), ('Stream ID', int), ('Task Start Time', float), ('Task Duration', float),
              ('pid', int)])
-    @staticmethod
-    def _get_all_reduce_names(communication_info):
-        names = []
-        for info in communication_info:
-            # all_reduce_name format: stream_stream_id_stream_op_index_opname
-            all_reduce_name = info[0][info[0].rindex('_') + 1:]
-            if all_reduce_name not in names:
-                names.append(all_reduce_name)
-        return names
     def init_timeline(self, op_summary, steptrace):
         """
         Init timeline metadata, adding all collected info.
@@ -160,49 +148,19 @@ class AscendTimelineGenerator(BaseTimelineGenerator):
         self._timeline_meta = self._format_meta_data_list
         # Update timeline summary info
-        timeline_summary = op_summary[np.isin(op_summary['Task Type'], ['AI_CORE', 'AI_CPU', 'HCCL'])][[
-            'Op Name', 'Stream ID', 'Task Duration']]
+        timeline_summary = op_summary[['Op Name', 'Stream ID', 'Task Duration']]
         self._timeline_summary['total_time'] = np.sum(timeline_summary['Task Duration'])
         self._timeline_summary['num_of_streams'] = int(
             len(np.unique(timeline_summary['Stream ID'], return_counts=True)[0]))
         self._timeline_summary['num_of_ops'] = int(len(np.unique(timeline_summary['Op Name'], return_counts=True)[0]))
         self._timeline_summary['op_exe_times'] = int(len(timeline_summary))
-        self._timeline_summary['max_scope_name_num'] = int(np.max(
-            [len(x) for x in np.char.split(timeline_summary['Op Name'].astype(str), sep='/')]))
+        if self._timeline_summary['op_exe_times'] != 0:
+            self._timeline_summary['max_scope_name_num'] = int(np.max(
+                [len(x) for x in np.char.split(timeline_summary['Op Name'].astype(str), sep='/')]))
+        else:
+            self._timeline_summary['max_scope_name_num'] = 0
         logger.info('Finished adding info into timeline...')
-    def init_pynative_timeline(self):
-        """Init timeline for pynative model."""
-        timeline_list = OPIntermediateParser(self._profiling_dir, self._rank_id).get_timeline_data()
-        cpu_timeline_generator = CpuTimelineGenerator(self._profiling_dir, self._rank_id, self._model)
-        cpu_timeline_list = cpu_timeline_generator.load_cpu_op_data()
-        if cpu_timeline_list:
-            self._pynative_clock_synchronize(cpu_timeline_list)
-            timeline_list.extend(cpu_timeline_list)
-        self._register_op_name(timeline_list)
-        self._timeline_summary['op_exe_times'] = len(timeline_list)
-        self._max_scope_name_num = self._get_max_scope_name_num(timeline_list)
-        self._timeline_summary['max_scope_name_num'] = self._max_scope_name_num
-        self._timeline_summary['num_of_ops'] = len(self._op_name_list)
-        timeline_list.sort(key=lambda x: float(x[self._start_time_idx]))
-        min_cycle_counter = float(timeline_list[0][self._start_time_idx])
-        step_timeline = self._pynative_get_step_timeline_list(timeline_list)
-        timeline_list.extend(step_timeline)
-        stream_count_dict = {}
-        max_scope_name_num = 0
-        for timeline in timeline_list:
-            self._parse_timeline_data(timeline, min_cycle_counter)
-            self._update_num_of_streams(timeline, stream_count_dict)
-            cur_scope_name_num = len(timeline[self._op_name_idx].split('/')) - 1
-            max_scope_name_num = max(cur_scope_name_num, max_scope_name_num)
-        self._timeline_summary['max_scope_name_num'] = max_scope_name_num
-        self._timeline_summary['num_of_streams'] = len(stream_count_dict)
     def _parse_timeline_data(self, timeline, min_cycle_counter):
         """Parse timeline data."""
         # factor to convert the time unit from 1ms to 1us for timeline display
@@ -233,94 +191,6 @@ class AscendTimelineGenerator(BaseTimelineGenerator):
         self._update_format_meta_data(timeline_dict)
         self._timeline_meta.append(timeline_dict)
-    def _get_op_timeline(self, communication_info, source_path):
-        """get ai_core and cpu timeline."""
-        all_reduce_names = AscendTimelineGenerator._get_all_reduce_names(communication_info)
-        timeline_list = OPIntermediateParser(self._profiling_dir, self._rank_id).get_timeline_data(all_reduce_names)
-        for timeline in timeline_list:
-            timeline[self._tid_idx] = f"Stream #{timeline[self._tid_idx]}"
-        cpu_timeline_generator = CpuTimelineGenerator(self._profiling_dir, self._rank_id, self._model)
-        cpu_timeline_list = cpu_timeline_generator.get_timeline_data()
-        if cpu_timeline_list:
-            self._clock_synchronize_to_device(cpu_timeline_list, source_path)
-            timeline_list.extend(cpu_timeline_list)
-        timeline_list.sort(key=lambda x: float(x[self._start_time_idx]))
-        self._max_scope_name_num = self._get_max_scope_name_num(timeline_list)
-        self._timeline_summary['op_exe_times'] = len(timeline_list)
-        self._timeline_summary['max_scope_name_num'] = self._max_scope_name_num
-        return timeline_list
-    def _clock_synchronize_to_device(self, timeline_list, source_path):
-        """Synchronize the timestamp from host to device."""
-        host_start_file_path = os.path.join(source_path, f"host_start.log.{self._device_id}")
-        dev_start_file_path = os.path.join(source_path, f"dev_start.log.{self._device_id}")
-        host_monotonic = 0
-        dev_cntvct = 0
-        try:
-            with open(host_start_file_path) as f_obj:
-                lines = f_obj.readlines()
-            for line in lines:
-                info = line.strip().split(':')
-                if len(info) < 2 or info[0] != "clock_monotonic_raw":
-                    continue
-                host_monotonic = int(info[1])
-                break
-            with open(dev_start_file_path) as f_obj:
-                lines = f_obj.readlines()
-            for line in lines:
-                info = line.strip().split(':')
-                if len(info) < 2 or info[0] != "cntvct":
-                    continue
-                dev_cntvct = int(info[1])
-                break
-        except (IOError, OSError) as err:
-            logger.critical('Error occurred when read dev_start.log: %s', err)
-            raise ProfilerIOException() from err
-        if host_monotonic == 0 or dev_cntvct == 0:
-            logger.error('Error occurred when read host_monotonic or dev_cntvct time')
-        factor = {"factor_ns_to_ms": 1e-6, "factor_ten_ns_to_ns": 10, "factor_ms_to_ns": 1e6}
-        for idx, time_item in enumerate(timeline_list):
-            host_time = int(float(time_item[self._start_time_idx]) * factor.get("factor_ms_to_ns"))
-            device_time = dev_cntvct * factor.get("factor_ten_ns_to_ns") + (host_time - host_monotonic)
-            timeline_list[idx][self._start_time_idx] = device_time * factor.get("factor_ns_to_ms")
-    def _add_framework_info(self, framework_obj_list):
-        """
-        Add framework info into timeline metadata.
-        Args:
-            framework_obj_list (list): The framework metadata.
-        """
-        logger.debug('Start adding framework info into timeline...')
-        # Get the framework info that will be written into timeline.
-        framework_info_dict = {}
-        for framework_obj in framework_obj_list:
-            op_name = framework_obj[0]
-            op_type = framework_obj[1]
-            op_full_name = framework_obj[4]
-            op_info = framework_obj[5]
-            framework_info = {
-                'name': op_name,
-                'args': {
-                    'type': op_type,
-                    'fullname': op_full_name
-                }
-            }
-            framework_info.get('args').update(op_info)
-            framework_info_dict[op_full_name] = framework_info
-        # Insert framework info into timeline.
-        for timeline_item in self._timeline_meta:
-            op_full_name = timeline_item.get('name')
-            framework_item = framework_info_dict.get(op_full_name)
-            if framework_item:
-                timeline_item['name'] = framework_item.get('name')
-                timeline_item['args'] = framework_item.get('args')
-        logger.debug('Finished adding framework info into timeline...')
     def _produce_two_separated_timeline(self, timeline, op_name):
         """Produce two separated timeline based on op_name."""
         timeline_include_op_name = []
@@ -490,52 +360,6 @@ class AscendTimelineGenerator(BaseTimelineGenerator):
         return intersection_segment_display_list
-    def _pynative_get_step_timeline_list(self, timeline_list):
-        """Get step timeline list for pynative model."""
-        step_list = []
-        # The timeline starts with the GetNext op
-        if len(timeline_list) < 2 or 'GetNext' not in timeline_list[0][self._op_name_idx] and \
-                'GetNext' not in timeline_list[1][self._op_name_idx]:
-            return step_list
-        step = [-1, -1]
-        step_num = 0
-        tid = "Steps"
-        for timeline in timeline_list:
-            if 'GetNext' not in timeline[self._op_name_idx]:
-                continue
-            start_time = float(timeline[self._start_time_idx])
-            if step[0] == -1:
-                step[0] = start_time
-            else:
-                step[1] = start_time - step[0]
-                step_num = step_num + 1
-                step_list.append([str(step_num), tid, float(step[0]), step[1]])
-                step = [start_time, -1]
-        if step[0] != -1 and step[1] == -1:
-            step_num = step_num + 1
-            step_list.append([str(step_num), tid, float(step[0]),
-                              float(timeline_list[-1][self._start_time_idx]) - step[0]])
-        return step_list
-    def _pynative_clock_synchronize(self, timeline_list):
-        """Synchronize the timestamp from device to host."""
-        start_time_file_path = os.path.join(self._profiling_dir, f"start_time_{self._rank_id}.txt")
-        try:
-            with open(start_time_file_path) as f_obj:
-                lines = f_obj.readlines()
-                # lines[0] stores the host monotonic time of start training.
-                host_monotonic_start_time = int(lines[0].strip().split(':')[-1])
-                # lines[1] stores the gpu time of start training.
-                gpu_start_time = int(lines[1].strip().split(':')[-1])
-        except (IOError, OSError) as err:
-            logger.critical(f'Error occurred when read {start_time_file_path}: {err}')
-            raise ProfilerIOException()
-        time_diff = gpu_start_time * 1000 - host_monotonic_start_time
-        for idx, time_item in enumerate(timeline_list):
-            timeline_list[idx][self._start_time_idx] = int(time_item[self._start_time_idx]) + time_diff
-            timeline_list[idx][self._start_time_idx] = timeline_list[idx][self._start_time_idx] / 1000000
-            timeline_list[idx][self._duration_idx] = timeline_list[idx][self._duration_idx] / 1000
     def _set_step_start_and_end_op_name(self, timeline_list):
         """Set the start and end operator full name of each step."""
         if not timeline_list or len(timeline_list) < 2:

mindspore/profiler/parser/base_timeline_generator.py CHANGED Viewed

@@ -315,7 +315,7 @@ class BaseTimelineGenerator:
         tid_name = timeline_dict['tid']
         sort_index = 0
-        if tid_name in self._map_tid_name_to_int.keys():
+        if tid_name in self._map_tid_name_to_int:
             sort_index, tid = self._map_tid_name_to_int.get(tid_name)
         elif tid_name.startswith("Stream"):
             tid = int(tid_name.split("#")[-1])

mindspore/profiler/parser/cpu_gpu_timeline_generator.py CHANGED Viewed

@@ -497,9 +497,9 @@ class GpuTimelineGenerator(BaseTimelineGenerator):
             )
             if intersection_start < intersection_end:
                 intersection_segment_display_list.append(
-                    [display_name, self._tid_dict[display_name][0],
+                    [display_name, self._tid_dict.get(display_name, ('',))[0],
                      intersection_start, (intersection_end - intersection_start) * factor_ns_to_us,
-                     self._tid_dict[display_name][1]]
+                     self._tid_dict.get(display_name, ('', ''))[1]]
                 )
             if first_time_list[first_list_idx][self._duration_idx] >= \
                     second_time_list[second_list_idx][self._duration_idx]:

mindspore/profiler/parser/framework_parser.py CHANGED Viewed

@@ -578,7 +578,7 @@ class GpuFrameWorkParser:
                 op_occurrences = int(op_detail[0])
                 op_total_time = float(op_detail[1])
                 op_avg_time = float(op_detail[2])
-                if op_shape in op_shape_dict.keys():
+                if op_shape in op_shape_dict:
                     # Classify according to the operator information of the same shape.
                     op_shape_dict.get(op_shape)[0] += op_occurrences
                     op_shape_dict.get(op_shape)[1] += op_total_time

mindspore/profiler/parser/profiler_info.py CHANGED Viewed

@@ -76,6 +76,25 @@ class ProfilerInfo:
         info["analyse_end_time"] = end_time
         ProfilerInfo._profiler_info_dict.update(info)
+    @staticmethod
+    def set_export_start_time(start_time):
+        """Store ``start_time`` as ``export_start_time`` in the profiler info."""
+        ProfilerInfo._profiler_info_dict.update(
+            {"export_start_time": start_time}
+        )
+    @staticmethod
+    def set_export_end_time(end_time):
+        """Store ``end_time`` as ``export_end_time`` in the profiler info."""
+        ProfilerInfo._profiler_info_dict.update(
+            {"export_end_time": end_time}
+        )
+    @staticmethod
+    def set_export_flag(flag):
+        """Store ``flag`` under the ``all_export`` key of the profiler info."""
+        ProfilerInfo._profiler_info_dict["all_export"] = flag
     @staticmethod
     def set_graph_ids(graph_ids):
         """Set the graph id list."""