diff --git a/ge/graph/build/task_generator.cc b/ge/graph/build/task_generator.cc
index 0082aece..786e4994 100755
--- a/ge/graph/build/task_generator.cc
+++ b/ge/graph/build/task_generator.cc
@@ -526,6 +526,13 @@ Status TaskGenerator::MarkNodeAndSetIndex(ComputeGraphPtr &graph) {
     return GE_GRAPH_GRAPH_NODE_NULL;
   }
 
+  int64_t node_index = 0;
+  for (auto &node : all_nodes) {
+    OpDescPtr op_desc = node->GetOpDesc();
+    GE_CHECK_NOTNULL(op_desc);
+    op_desc->SetId(node_index++);
+  }
+
   map<int64_t, vector<OpDescPtr>> all_stream_ops;
   for (auto &node : all_nodes) {
     OpDescPtr op_desc = node->GetOpDesc();
diff --git a/ge/graph/load/model_manager/davinci_model.cc b/ge/graph/load/model_manager/davinci_model.cc
index 30e47052..bb75bff1 100755
--- a/ge/graph/load/model_manager/davinci_model.cc
+++ b/ge/graph/load/model_manager/davinci_model.cc
@@ -446,20 +446,23 @@ void DavinciModel::InitRuntimeParams() {
       runtime_param_.mem_size, runtime_param_.weight_size, runtime_param_.var_size);
 }
 
-void DavinciModel::CheckHasHcomOp(const ComputeGraphPtr &compute_graph) {
-  const set<string> hcom_opp_types({
-      HCOMBROADCAST, HCOMALLGATHER, HCOMALLREDUCE, HCOMSEND, HCOMRECEIVE, HCOMREDUCESCATTER,
-      HVDCALLBACKALLREDUCE, HVDCALLBACKALLGATHER, HVDCALLBACKBROADCAST, HVDWAIT, HCOMREDUCE
-  });
-
+void DavinciModel::CheckHasHcomOp() {
+  Graph graph = ge_model_->GetGraph();
+  auto compute_graph = GraphUtils::GetComputeGraph(graph);
+  if (compute_graph == nullptr) {
+    return;
+  }
   for (const auto &node : compute_graph->GetAllNodes()) {
     OpDescPtr op_desc = node->GetOpDesc();
     GE_IF_BOOL_EXEC(op_desc == nullptr, GELOGW("Node OpDesc is nullptr"); continue);
-    if (hcom_opp_types.count(op_desc->GetType()) > 0) {
-      uint32_t stream_id = static_cast<uint32_t>(op_desc->GetStreamId());
-      hcom_streams_.emplace(stream_id);
-      GELOGD("hcom stream: %u.", stream_id);
-    }
+    GE_IF_BOOL_EXEC(((op_desc->GetType() == HCOMBROADCAST) || (op_desc->GetType() == HCOMALLGATHER) ||
+                     (op_desc->GetType() == HCOMALLREDUCE) || (op_desc->GetType() == HCOMSEND) ||
+                     (op_desc->GetType() == HCOMRECEIVE) || (op_desc->GetType() == HCOMREDUCESCATTER) ||
+                     (op_desc->GetType() == HVDCALLBACKALLREDUCE) || (op_desc->GetType() == HVDCALLBACKALLGATHER) ||
+                     (op_desc->GetType() == HVDCALLBACKBROADCAST) || (op_desc->GetType() == HVDWAIT) ||
+                     (op_desc->GetType() == HCOMREDUCE)),
+                    uint32_t stream_id = static_cast<uint32_t>(op_desc->GetStreamId());
+                    (void)hcom_streams_.emplace(stream_id); GELOGD("hcom stream: %u.", stream_id); continue);
   }
 }
 
@@ -639,7 +642,7 @@ Status DavinciModel::Init(void *dev_ptr, size_t mem_size, void *weight_ptr, size
   name_ = ge_model_->GetName();
   (void)ge::AttrUtils::GetBool(ge_model_, ATTR_NAME_SWITCH_FOR_L1_FUSION, is_l1_fusion_enable_);
   GELOGD("The value of ge.l1Fusion in ge_model is %d.", is_l1_fusion_enable_);
-  CheckHasHcomOp(compute_graph);
+  CheckHasHcomOp();
 
   vector<int64_t> huge_stream_list;
   (void)ge::AttrUtils::GetListInt(ge_model_, ATTR_MODEL_HUGE_STREAM_LIST, huge_stream_list);
@@ -1025,7 +1028,7 @@ Status DavinciModel::GenInputOutputInfo(const map<uint32_t, OpDescPtr> &data_by_
                                         const vector<OpDescPtr> &output_op_list) {
   GELOGD("Data node size: %zu, NetOutput node size: %zu", data_by_index.size(), output_op_list.size());
   for (auto &item : data_by_index) {
-    const auto output_addrs = ModelUtils::GetOutputDataAddrs(runtime_param_, item.second);
+    auto output_addrs = ModelUtils::GetOutputDataAddrs(runtime_param_, item.second);
     GELOGD("Data node: %s, output addr size: %zu", item.second->GetName().c_str(), output_addrs.size());
     input_addrs_list_.emplace_back(output_addrs);
 
@@ -1033,18 +1036,14 @@ Status DavinciModel::GenInputOutputInfo(const map<uint32_t, OpDescPtr> &data_by_
     GE_CHK_STATUS_RET(InitAippType(item.first, item.second, data_by_index), "Init AIPP Type failed");
     GE_CHK_STATUS_RET(InitOrigInputInfo(item.first, item.second), "Init Orig input failed");
     GE_CHK_STATUS_RET(InitAippInputOutputDims(item.first, item.second), "Init AIPP dims failed");
-    GE_CHK_STATUS_RET(InitInputDescInfo(item.second), "Init input desc info failed");
     if (item.second->GetType() == AIPP_DATA_TYPE) {
       GELOGI("This is dynamic aipp model, Node: %s", item.second->GetName().c_str());
       is_dynamic_aipp_ = true;
     }
   }
 
-  vector<string> out_node_name;
-  (void)AttrUtils::GetListStr(ge_model_, ATTR_MODEL_OUT_NODES_NAME, out_node_name);
-  GELOGD("Output node size: %zu, out nodes name: %zu", output_op_list.size(), out_node_name.size());
   for (const auto &op_desc : output_op_list) {
-    const auto input_addrs = ModelUtils::GetInputDataAddrs(runtime_param_, op_desc);
+    auto input_addrs = ModelUtils::GetInputDataAddrs(runtime_param_, op_desc);
     GELOGD("NetOutput node: %s, input addr size: %zu", op_desc->GetName().c_str(), input_addrs.size());
     output_addrs_list_.emplace_back(input_addrs);
 
@@ -1062,11 +1061,10 @@ Status DavinciModel::GenInputOutputInfo(const map<uint32_t, OpDescPtr> &data_by_
     if (InitOutputTensorInfo(op_desc) != SUCCESS) {
       return INTERNAL_ERROR;
     }
-
-    GE_CHK_STATUS_RET(InitOutputDescInfo(op_desc, out_node_name), "Init output desc info failed");
   }
 
-  return SUCCESS;
+  GE_CHK_STATUS_RET(InitInputDescInfo(data_by_index), "Init input desc info failed");
+  return InitOutputDescInfo(output_op_list);
 }
 
 bool DavinciModel::IsGetNextSinkDynamic(const OpDescPtr &op_desc) {
@@ -1982,24 +1980,27 @@ void DavinciModel::CreateInputDimsInfo(const OpDescPtr &op_desc, Format format,
   }
 }
 
-Status DavinciModel::InitInputDescInfo(const OpDescPtr &op_desc) {
-  GE_CHECK_NOTNULL(op_desc->GetInputDescPtr(0));
+Status DavinciModel::InitInputDescInfo(const map<uint32_t, OpDescPtr> &data_by_index) {
+  for (const auto &item : data_by_index) {
+    const auto op_desc = item.second;
+    GE_CHECK_NOTNULL(op_desc->GetInputDescPtr(0));
 
-  InputOutputDescInfo input;
-  ShapeDescription dims_info;
-  Format format = op_desc->GetInputDescPtr(0)->GetFormat();
-  CreateInputDimsInfo(op_desc, format, input.shape_info, dims_info);
+    InputOutputDescInfo input;
+    ShapeDescription dims_info;
+    Format format = op_desc->GetInputDescPtr(0)->GetFormat();
+    CreateInputDimsInfo(op_desc, format, input.shape_info, dims_info);
 
-  input.data_type = op_desc->GetInputDescPtr(0)->GetDataType();
-  input.name = op_desc->GetName();
-  int64_t input_size = 0;
-  GE_CHK_STATUS_RET(TensorUtils::GetSize(*op_desc->GetInputDescPtr(0), input_size), "get input size failed.");
-  input.size = input_size;
-  input_formats_.push_back(format);
-  input_descs_.push_back(input);
+    input.data_type = op_desc->GetInputDescPtr(0)->GetDataType();
+    input.name = op_desc->GetName();
+    int64_t input_size = 0;
+    GE_CHK_STATUS_RET(TensorUtils::GetSize(*op_desc->GetInputDescPtr(0), input_size), "get input size failed.");
+    input.size = input_size;
+    input_formats_.push_back(format);
+    input_descs_.push_back(input);
 
-  input.shape_info = dims_info;
-  input_descs_dims_.push_back(input);
+    input.shape_info = dims_info;
+    input_descs_dims_.push_back(input);
+  }
   return SUCCESS;
 }
 
@@ -2065,31 +2066,37 @@ void DavinciModel::CreateOutput(uint32_t index, const OpDescPtr &op_desc, InputO
   output.data_type = op_desc->GetInputDescPtr(index)->GetDataType();
 }
 
-Status DavinciModel::InitOutputDescInfo(const OpDescPtr &op_desc, const vector<string> &out_node_name) {
-  uint32_t out_size = static_cast<uint32_t>(op_desc->GetInputsSize());
-  for (uint32_t i = 0; i < out_size; ++i) {
-    string output_name;
-    InputOutputDescInfo output;
-    uint32_t format_result;
-    CreateOutput(i, op_desc, output, format_result);
-
-    std::vector<std::string> src_name = op_desc->GetSrcName();
-    std::vector<int64_t> src_index = op_desc->GetSrcIndex();
-    GE_CHK_BOOL_RET_STATUS(src_name.size() > i && src_index.size() > i, INTERNAL_ERROR,
-                           "construct output_name failed.");
-    // forward compatbility, if old om has no out_node_name, need to return output follow origin way
-    if (out_size == out_node_name.size()) {
-      // neweast plan, the index will add to name during generate model.
-      bool contains_colon = out_node_name[i].find(":") != std::string::npos;
-      output_name = contains_colon ? out_node_name[i] : out_node_name[i] + ":" + std::to_string(src_index[i]);
-    } else {
-      output_name = string("output_") + std::to_string(i) + "_" + src_name[i] + "_" + std::to_string(src_index[i]);
+Status DavinciModel::InitOutputDescInfo(const vector<OpDescPtr> &output_op_list) {
+  GELOGD("Output node size: %zu", output_op_list.size());
+  vector<string> out_node_name;
+  (void)ge::AttrUtils::GetListStr(ge_model_, ATTR_MODEL_OUT_NODES_NAME, out_node_name);
+  for (const auto &op_desc : output_op_list) {
+    uint32_t out_size = static_cast<uint32_t>(op_desc->GetInputsSize());
+    for (uint32_t index = 0; index < out_size; index++) {
+      string output_name;
+      InputOutputDescInfo output;
+      uint32_t format_result;
+      CreateOutput(index, op_desc, output, format_result);
+
+      std::vector<std::string> src_name = op_desc->GetSrcName();
+      std::vector<int64_t> src_index = op_desc->GetSrcIndex();
+      GE_CHK_BOOL_RET_STATUS(src_name.size() > index && src_index.size() > index, INTERNAL_ERROR,
+                             "construct output_name failed.");
+      // forward compatbility, if old om has no out_node_name, need to return output follow origin way
+      if (out_size == out_node_name.size()) {
+        // neweast plan, the index will add to name during generate model.
+        bool contains_colon = out_node_name[index].find(":") != std::string::npos;
+        output_name =
+            contains_colon ? out_node_name[index] : out_node_name[index] + ":" + std::to_string(src_index[index]);
+      } else {
+        output_name = std::string("output_") + std::to_string(index) + "_" + src_name[index] + "_" +
+                      std::to_string(src_index[index]);
+      }
+      output.name = output_name;
+      output_descs_.push_back(output);
+      output_formats_.push_back(format_result);
     }
-    output.name = output_name;
-    output_descs_.push_back(output);
-    output_formats_.push_back(format_result);
   }
-
   return SUCCESS;
 }
 
diff --git a/ge/graph/load/model_manager/davinci_model.h b/ge/graph/load/model_manager/davinci_model.h
index 22f3bcab..53db77a7 100755
--- a/ge/graph/load/model_manager/davinci_model.h
+++ b/ge/graph/load/model_manager/davinci_model.h
@@ -827,7 +827,7 @@ class DavinciModel {
 
   void OpDebugUnRegister();
 
-  void CheckHasHcomOp(const ComputeGraphPtr &graph);
+  void CheckHasHcomOp();
 
   Status DoTaskSink();
 
@@ -850,8 +850,8 @@ class DavinciModel {
   Status InitOutputTensorInfo(const OpDescPtr &op_desc);
   Status GenOutputTensorInfo(OutputData *output_data, vector<OutputTensorInfo> &outputs);
 
-  Status InitInputDescInfo(const OpDescPtr &op_desc);
-  Status InitOutputDescInfo(const OpDescPtr &op_desc, const vector<string> &out_node_name);
+  Status InitInputDescInfo(const map<uint32_t, OpDescPtr> &data_by_index);
+  Status InitOutputDescInfo(const vector<OpDescPtr> &output_op_list);
 
   Status InitOrigInputInfo(uint32_t index, const OpDescPtr &op_desc);
   Status InitAippInfo(uint32_t index, const OpDescPtr &op_desc);
diff --git a/ge/graph/manager/graph_manager.cc b/ge/graph/manager/graph_manager.cc
index 55e26cf9..410611b0 100755
--- a/ge/graph/manager/graph_manager.cc
+++ b/ge/graph/manager/graph_manager.cc
@@ -730,7 +730,9 @@ Status GraphManager::PreRunAfterOptimizeSubGraph(const GraphNodePtr &graph_node,
   CompilerStages &stages = GetCompilerStages(graph_node->GetGraphId());
   GM_RUN_AND_DUMP_PERF("OptimizeWholeGraph", stages.optimizer.OptimizeWholeGraph, compute_graph);
   GM_RUN_AND_DUMP_PERF("Optimize2", OptimizeStage2, compute_graph);
-  GM_RUN_AND_DUMP_PERF("OptimizeBeforeBuildForRts", stages.optimizer.OptimizeGraphBeforeBuildForRts, compute_graph);
+  GM_RUN_AND_DUMP_PERF("OptimizeGraphBeforeBuildForRts",
+                       GetCompilerStages(graph_node->GetGraphId()).optimizer.OptimizeGraphBeforeBuildForRts,
+                       compute_graph);
 
   Status ret = compute_graph->TopologicalSorting();
   if (ret != SUCCESS) {