Browse Source

!1374 fix hccl loading error

From: @xchu42
Reviewed-by: @wqtshg,@ji_chen
Signed-off-by: @ji_chen
tags/v1.3.0
mindspore-ci-bot Gitee 4 years ago
parent
commit
cf473fb4bc
1 changed file with 3 additions and 2 deletions
  1. +3
    -2
      ge/hybrid/model/hybrid_model_builder.cc

+ 3
- 2
ge/hybrid/model/hybrid_model_builder.cc View File

@@ -1097,6 +1097,7 @@ Status HybridModelBuilder::LoadTasks() {
} }
if (node_item->node_type == PARTITIONEDCALL) { if (node_item->node_type == PARTITIONEDCALL) {
ordered_partitioned_calls.emplace(node_item->node_id, node_item.get()); ordered_partitioned_calls.emplace(node_item->node_id, node_item.get());
continue;
} }
GE_CHK_STATUS_RET_NOLOG(LoadTask(*node_item)); GE_CHK_STATUS_RET_NOLOG(LoadTask(*node_item));
} }
@@ -2029,14 +2030,14 @@ Status HybridModelBuilder::CollectParallelGroups(NodeItem *node_item) {
if (executor_type == NodeExecutorManager::ExecutorType::HCCL) { if (executor_type == NodeExecutorManager::ExecutorType::HCCL) {
std::string parallel_group; std::string parallel_group;
if (AttrUtils::GetStr(node->GetOpDesc(), ATTR_NAME_PARALLEL_GROUP, parallel_group)) { if (AttrUtils::GetStr(node->GetOpDesc(), ATTR_NAME_PARALLEL_GROUP, parallel_group)) {
GELOGD("[%s] Got parallel group = %s", node_item->NodeName().c_str(), parallel_group.c_str());
GELOGD("[%s] Got parallel group = [%s]", node_item->NodeName().c_str(), parallel_group.c_str());
parallel_group_to_nodes_[parallel_group].emplace(node_item); parallel_group_to_nodes_[parallel_group].emplace(node_item);
std::set<std::string> group{parallel_group}; std::set<std::string> group{parallel_group};
node_to_parallel_groups_[node_item].emplace(parallel_group); node_to_parallel_groups_[node_item].emplace(parallel_group);
} }
} else if (executor_type == NodeExecutorManager::ExecutorType::COMPILED_SUBGRAPH) { } else if (executor_type == NodeExecutorManager::ExecutorType::COMPILED_SUBGRAPH) {
std::set<std::string> parallel_groups; std::set<std::string> parallel_groups;
GELOGD("[%s] Parse parallel group for known-shaped subgraph", node_item->NodeName().c_str());
GELOGD("[%s] To collect parallel group for known-shaped subgraph", node_item->NodeName().c_str());
for (const auto &subgraph_name : node->GetOpDesc()->GetSubgraphInstanceNames()) { for (const auto &subgraph_name : node->GetOpDesc()->GetSubgraphInstanceNames()) {
GELOGD("[%s] Start to get parallel group from subgraph: %s", GELOGD("[%s] Start to get parallel group from subgraph: %s",
node_item->NodeName().c_str(), node_item->NodeName().c_str(),


Loading…
Cancel
Save