From 8b627b89282f9ad90c4288649bd22f44568df7aa Mon Sep 17 00:00:00 2001
From: =?UTF-8?q?=E8=87=A7=E5=BA=86=E9=A6=99?= <zangqingxiang@huawei.com>
Date: Sat, 7 May 2022 11:11:05 +0800
Subject: [PATCH] msprof data type

---
 .../device/profiling/profiling_reporter.cc    |   9 ++++---
 .../hal/device/profiling/profiling_reporter.h |   7 ++---
 .../ascend/parallel_strategy_profiling.cc     |   4 +--
 .../profiler/parser/framework_enum.py         |   5 +++-
 .../profiler/parser/framework_parser.py       |  24 ++++++++++++++----
 .../mindspore/profiler/parser/integrator.py   |  21 +++++++++++++--
 .../data/Framework.task_desc_info.6.slice_0   | Bin 30720 -> 30720 bytes
 7 files changed, 53 insertions(+), 17 deletions(-)

diff --git a/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.cc b/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.cc
index 4babadb6425..4965031a2c7 100644
--- a/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.cc
+++ b/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.cc
@@ -254,20 +254,21 @@ void ProfilingReporter::BuildTensorData(MsprofGeTensorData *tensor_data, const C
   tensor_data->tensorType = tensor_type;
   std::vector<size_t> shape;
   string data_format;
+  uint32_t vm_data_type;
   if (tensor_type == MSPROF_GE_TENSOR_TYPE_INPUT) {
     auto input_node_with_index = common::AnfAlgo::GetPrevNodeOutput(node, index);
     auto input_node = input_node_with_index.first;
     auto input_index = input_node_with_index.second;
     shape = AnfAlgo::GetOutputDeviceShape(input_node, input_index);
     data_format = AnfAlgo::GetOutputFormat(input_node, input_index);
-    tensor_data->dataType = static_cast<uint32_t>(AnfAlgo::GetOutputDeviceDataType(input_node, input_index));
+    vm_data_type = static_cast<uint32_t>(AnfAlgo::GetOutputDeviceDataType(input_node, input_index));
   } else {
     shape = AnfAlgo::GetOutputDeviceShape(node, index);
     data_format = AnfAlgo::GetOutputFormat(node, index);
-    tensor_data->dataType = static_cast<uint32_t>(AnfAlgo::GetOutputDeviceDataType(node, index));
+    vm_data_type = static_cast<uint32_t>(AnfAlgo::GetOutputDeviceDataType(node, index));
   }
-
-  tensor_data->format = OpFormat2Index[data_format];
+  tensor_data->dataType = vm_data_type + MSPROF_DIFFERENCE;
+  tensor_data->format = OpFormat2Index[data_format] + MSPROF_DIFFERENCE;
   auto shape_size = std::min(static_cast<uint64_t>(MSPROF_GE_TENSOR_DATA_SHAPE_LEN), shape.size());
   (void)std::copy(shape.begin(), shape.begin() + shape_size, tensor_data->shape);
 }
diff --git a/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.h b/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.h
index 60925177437..3012b39caca 100644
--- a/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.h
+++ b/mindspore/ccsrc/plugin/device/ascend/hal/device/profiling/profiling_reporter.h
@@ -1,5 +1,5 @@
 /**
- * Copyright 2021 Huawei Technologies Co., Ltd
+ * Copyright 2021-2022 Huawei Technologies Co., Ltd
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -70,6 +70,7 @@ class ProfilingReporter {
   vector<uint32_t> stream_ids_;
   vector<uint32_t> task_ids_;
   map<string, int> node_name_index_map_;
+  const uint32_t MSPROF_DIFFERENCE = 200;
 
   bool CheckStreamTaskValid() const;
   static uint32_t GetBlockDim(const CNodePtr &node);
@@ -88,14 +89,14 @@ class ProfilingReporter {
   void SetAlternativeValue(T *property, const size_t property_size, const string &value, const int32_t &device_id) {
     MS_EXCEPTION_IF_NULL(property);
     if (value.size() < property_size) {
-      property->type = static_cast<uint8_t>(MSPROF_MIX_DATA_HASH_ID);
+      property->type = static_cast<uint8_t>(MSPROF_MIX_DATA_STRING);
       const auto ret = strncpy_s(property->data.dataStr, property_size, value.c_str(), value.size());
       if (ret != 0) {
         MS_LOG(ERROR) << "[Profiling] strncpy_s value " << value.c_str() << " error!";
         return;
       }
     } else {
-      property->type = static_cast<uint8_t>(MSPROF_MIX_DATA_STRING);
+      property->type = static_cast<uint8_t>(MSPROF_MIX_DATA_HASH_ID);
       uint64_t hash_id;
       ProfilingManager::GetInstance().QueryHashId(device_id, value, &hash_id);
       property->data.hashId = hash_id;
diff --git a/mindspore/ccsrc/profiler/device/ascend/parallel_strategy_profiling.cc b/mindspore/ccsrc/profiler/device/ascend/parallel_strategy_profiling.cc
index 23d9e9f622f..094e297ad95 100644
--- a/mindspore/ccsrc/profiler/device/ascend/parallel_strategy_profiling.cc
+++ b/mindspore/ccsrc/profiler/device/ascend/parallel_strategy_profiling.cc
@@ -1,5 +1,5 @@
 /**
- * Copyright 2021 Huawei Technologies Co., Ltd
+ * Copyright 2021-2022 Huawei Technologies Co., Ltd
  *
  * Licensed under the Apache License, Version 2.0 (the "License");
  * you may not use this file except in compliance with the License.
@@ -137,7 +137,7 @@ irpb::ProfilingParallel GetProfilingParallel(const FuncGraphPtr &func_graph) {
 }
 
 void DumpProfileParallelStrategy(const FuncGraphPtr &func_graph) {
-  if (!IsProfilingParallelStrategyEnabled()) {
+  if (has_save_parallel_strategy || !IsProfilingParallelStrategyEnabled()) {
     return;
   }
 
diff --git a/mindspore/python/mindspore/profiler/parser/framework_enum.py b/mindspore/python/mindspore/profiler/parser/framework_enum.py
index fd2771113c4..ca6eff786cf 100644
--- a/mindspore/python/mindspore/profiler/parser/framework_enum.py
+++ b/mindspore/python/mindspore/profiler/parser/framework_enum.py
@@ -1,4 +1,4 @@
-# Copyright 2021 Huawei Technologies Co., Ltd
+# Copyright 2021-2022 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -104,3 +104,6 @@ class VmFormat(IntEnum):
         """
         format_name = cls._value2member_map_.get(num)
         return 'UNKNOWN' if format_name is None else format_name.name
+
+
+MSPROF_DIFFERENCE = 200
diff --git a/mindspore/python/mindspore/profiler/parser/framework_parser.py b/mindspore/python/mindspore/profiler/parser/framework_parser.py
index 5e25545346e..9410d0c61a1 100644
--- a/mindspore/python/mindspore/profiler/parser/framework_parser.py
+++ b/mindspore/python/mindspore/profiler/parser/framework_parser.py
@@ -1,4 +1,4 @@
-# Copyright 2020-2021 Huawei Technologies Co., Ltd
+# Copyright 2020-2022 Huawei Technologies Co., Ltd
 #
 # Licensed under the Apache License, Version 2.0 (the "License");
 # you may not use this file except in compliance with the License.
@@ -27,7 +27,7 @@ from mindspore import log as logger
 from mindspore.profiler.parser.framework_struct import TASK_DESC_STRUCT
 from mindspore.profiler.parser.framework_struct import TENSOR_DATA_STRUCT
 from mindspore.profiler.parser.framework_struct import STEP_INFO_STRUCT
-from mindspore.profiler.parser.framework_enum import VmDataType, VmFormat, FileDataType
+from mindspore.profiler.parser.framework_enum import VmDataType, VmFormat, FileDataType, MSPROF_DIFFERENCE
 from mindspore.profiler.common.struct_type import StructType
 from mindspore.profiler.common.util import combine_stream_task_id
 from mindspore.profiler.common.exceptions.exceptions import ProfilerDirNotFoundException
@@ -253,7 +253,7 @@ class FrameworkParser:
         # skip rsv data, rsv has 7 bytes
         skip_size = 8
         remain_size = data_size - skip_size
-        if flag == 0:
+        if flag == 1:
             unpack_data = struct.unpack(StructType.CHAR.value * remain_size,
                                         item_binary_data[cursor + skip_size:cursor + data_size])
             unpack_data = ''.join(list(map(lambda c: c.decode(), filter(lambda c: c != b'\x00', unpack_data))))
@@ -315,6 +315,20 @@ class FrameworkParser:
             point_info[tag] = full_op_name
         return point_info
 
+    @staticmethod
+    def _get_vm_data_type(msprof_data_type):
+        """Get the mapped vm data type of msprof."""
+        if msprof_data_type >= MSPROF_DIFFERENCE:
+            return msprof_data_type - MSPROF_DIFFERENCE
+        return msprof_data_type
+
+    @staticmethod
+    def _get_vm_op_format(msprof_op_format):
+        """Get the mapped op format type of msprof."""
+        if msprof_op_format >= MSPROF_DIFFERENCE:
+            return msprof_op_format - MSPROF_DIFFERENCE
+        return msprof_op_format
+
     @staticmethod
     def _construct_task_id_op_attr_dict(prof_tensor_data):
         """prof_tensor_data is a list[tensor_data], tensor_data is a dict, key is same as TENSOR_DATA_STRUCT."""
@@ -323,11 +337,11 @@ class FrameworkParser:
             task_id = combine_stream_task_id(tensor_data['streamId'], tensor_data['taskId'])
             for tensor_attr in tensor_data['tensorData']:
                 tensor_type = 'input' if tensor_attr['tensorType'] == 0 else 'output'
-                tensor_format = VmFormat.get_format_name(tensor_attr['format'])
+                tensor_format = VmFormat.get_format_name(FrameworkParser._get_vm_data_type(tensor_attr['format']))
                 op_attr = dict(
                     tensor_type=tensor_type,
                     format=tensor_format,
-                    data_type=VmDataType.get_data_type_name(tensor_attr['dataType']),
+                    data_type=VmDataType.get_data_type_name(FrameworkParser._get_vm_op_format(tensor_attr['dataType'])),
                     shape=tensor_attr['shape']
                 )
                 task_id_op_attr_dict[task_id].append(op_attr)
diff --git a/mindspore/python/mindspore/profiler/parser/integrator.py b/mindspore/python/mindspore/profiler/parser/integrator.py
index 7fc0c2aef6f..ee026e3dcf9 100644
--- a/mindspore/python/mindspore/profiler/parser/integrator.py
+++ b/mindspore/python/mindspore/profiler/parser/integrator.py
@@ -587,6 +587,7 @@ class BaseTimelineGenerator:
         }
         self._device_target = str(device_target).lower()
         self._model = model
+        self._step_start_op_name = ""
         self._step_end_op_name = ""
 
     def get_thread_label_name(self):
@@ -660,8 +661,8 @@ class BaseTimelineGenerator:
         the merged result is [[1,6], [7,8]].
         """
         time_merged_segment_list = []
-        tid = self._tid_dict[display_name][0]
-        pid = self._tid_dict[display_name][1]
+        tid = self._tid_dict.get(display_name, (0, 0))[0]
+        pid = self._tid_dict.get(display_name, (0, 0))[1]
         for time_item in time_list:
             time_segment = list(map(float, time_item[self._start_time_idx:self._duration_idx + 1]))
             time_segment[1] = time_segment[0] + time_segment[1] / factor
@@ -1888,6 +1889,22 @@ class AscendTimelineGenerator(BaseTimelineGenerator):
             timeline_list[idx][self._start_time_idx] = timeline_list[idx][self._start_time_idx] / 1000000
             timeline_list[idx][self._duration_idx] = timeline_list[idx][self._duration_idx] / 1000
 
+    def _set_step_start_and_end_op_name(self, timeline_list):
+        """Set the start and end operator full name of each step."""
+        if not timeline_list or len(timeline_list) < 2:
+            return
+
+        start_op_idx = 0
+        self._step_end_op_name = timeline_list[-1][self._op_name_idx]
+        for i, timeline in enumerate(timeline_list):
+            if timeline[self._op_name_idx] == self._step_end_op_name:
+                start_op_idx = i + 1
+                break
+
+        if start_op_idx >= len(timeline_list):
+            start_op_idx = 0
+        self._step_start_op_name = timeline_list[start_op_idx][self._op_name_idx]
+
 
 class CpuTimelineGenerator(GpuTimelineGenerator):
     """Generate cpu Timeline data from file."""
diff --git a/tests/ut/data/profiler_data/framework/data/Framework.task_desc_info.6.slice_0 b/tests/ut/data/profiler_data/framework/data/Framework.task_desc_info.6.slice_0
index 492270e3f6712724a65af2433bb86a346fae6e9c..b67cd5d1be5e2a4ce6e1cbbd5f38812f77ea40f2 100644
GIT binary patch
delta 1570
zcmXBT#ZsLy06<|besS00uEi<ErKM<bxma<xqC41j2gB?2A$WwAbF#?fo0I(iB9rI$
z!1H?`7z$;FeT=|s@agq$?CZ;8An+Cpe5~JI0w7$3g9s4;B1Pn5AnYv|C88+NA{xYq
z7!WIB0snk^34%CF9Ecb3AVDO6M3D%RL=s3A$sk3ffK-tR(nK0a7wI5FWPnVO39>{M
z$QIckN92H9kqh!f9>^E@;FI_S3Pb@Y6osHj6oFz<3`#@^C>5okOq79gQ4T6Z1*jC2
z++3BYqEw4&N{y(Y)QVbAC+gT%FX};qXaJ3(ku#sgXV4^?K(lBDEusaqidN7j+CaN#
z2OXjVbc#;!MSKBWq6>T#UqQF%20fw&^om~4C;C9Y=m!I001S#jFeHY+uowm-Vg!5>
z-@teA9gK=m@Z;(K1O3As95aj&#>F_85EEchOoAyf1*XL`_{o=<gENL1!mOADb7Bt6
zi+Qjh7Qmud1WRHGEQ@8ZB38hvSOp;w0&8Lotc!K9AvVCK*aTZ*3;Ytlz_!>1J7Ndy
zie0cL_Q1Z_2M6K+9EwA5B#ywbI0h%;1e}Ufa3;>cxi|+G;sRWXOK>Hwz_qvrzr}BG
VBW}R0xCM9O4%~}-@E{(p{sH7%ExZ5#

delta 1570
zcmXBT#Zp{B06<X&AKcvo1P|_R37X(ANN{&ZU<cdmpyo&Uge3R&qN`8c?)Mg5{rVAj
z{Rjj@q1*_@d+_CbH~#(YIS>&J2L7+ZZvhY~B0-dh0?{J+IS>d3V?+!kR>Xoh5eMQ$
zJm8<<w;)KcB!EPb2$Dn+NEXQ;MWldKkqXj88b}xEAVXw;Opyt)L>9;v*&s*cfLxIa
z@<blU7x|z-6o5ie2#Q1zC>F(_M3jJ1Q3}dL87LR!ph8rDPvR4(6qTS#RDo(y&CPul
zpD8t>hEgkPDRrU_)QftyHHZe#C>lYNXyVKl@dY%CX3!#9K&xm4ZK4gdi+0c<IzXrB
z1YM#Fbc=4#BYHru=mmYE5A=(EFdzoNpcn*0Vh9Y2VK5>_z^E7nV`2=9i*Ya^Ccvba
z1YgBh@a^T_1O3AsoH9%iro}Xv5i?*`%z`;F2j;~*_|BJ^gFg&E2n%8XEQ&?2B$mLk
zSOzO%1+0oyuqM{Px>yGrVgrOk2yBW?uqC#@w%7(cVh8*bKf$ip1$$x-?2CPHAP&Hx
zI0Q%H2po%Ja3W5?sW=5^;tZUNb8sOpz@@kZSK<m>i)(NrZosX$1$W{O+>3kgARfS@
Rcm%)1FYsIZ22bMY_Ad_#^cMgC