You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ge_generator.cc 37 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "generator/ge_generator.h"
  17. #include <atomic>
  18. #include "common/ge/ge_util.h"
  19. #include "common/ge/plugin_manager.h"
  20. #include "common/helper/model_helper.h"
  21. #include "common/helper/om_file_helper.h"
  22. #include "common/util.h"
  23. #include "common/util/error_manager/error_manager.h"
  24. #include "framework/common/debug/ge_log.h"
  25. #include "framework/common/debug/log.h"
  26. #include "ge/ge_api.h"
  27. #include "graph/debug/ge_attr_define.h"
  28. #include "graph/ge_context.h"
  29. #include "graph/manager/graph_manager.h"
  30. #include "graph/manager/util/rt_context_util.h"
  31. #include "graph/opsproto_manager.h"
  32. #include "graph/utils/graph_utils.h"
  33. #include "graph/utils/type_utils.h"
  34. #include "init/gelib.h"
  35. #include "model/ge_model.h"
  36. using std::map;
  37. using std::string;
  38. using std::vector;
  39. namespace {
  40. const char *const kAttrOpType = "op_type";
  41. const char *const kEngineNameDefault = "default";
  42. const char *const kVectorEngine = "VectorEngine";
  43. const char *const kAIcoreEngine = "AIcoreEngine";
  44. const char *const kFileNameSuffix = "online";
  45. const char *const kAicpuAllshape = "_AllShape";
  46. constexpr char const *kAttrSupportDynamicShape = "support_dynamicshape";
  47. const int64_t kDynamicDimValue = -2;
  48. std::map<ge::OpEngineType, std::string> engine_type_map{
  49. {ge::ENGINE_SYS, kEngineNameDefault}, {ge::ENGINE_AICORE, kAIcoreEngine}, {ge::ENGINE_VECTOR, kVectorEngine}};
  50. bool ContainsDynamicInpus(const ge::OpDesc &op_desc) {
  51. for (auto &tensor_desc : op_desc.GetAllInputsDescPtr()) {
  52. if (tensor_desc->MutableShape().IsUnknownShape()) {
  53. GELOGI("Contains unknown shape input. set is_dynamic_input to true.");
  54. return true;
  55. }
  56. }
  57. return false;
  58. }
  59. } // namespace
  60. namespace ge {
  61. static Status CheckEngineTypeSupport(const OpDescPtr &op_desc, OpEngineType engine_type) {
  62. GE_CHECK_NOTNULL_EXEC(op_desc, return PARAM_INVALID);
  63. if (engine_type == ENGINE_SYS) {
  64. GELOGI("CheckEngineType: use default engine.");
  65. return SUCCESS;
  66. }
  67. // get op engine name
  68. string op_engine_name;
  69. auto iter = engine_type_map.find(engine_type);
  70. if (iter != engine_type_map.end()) {
  71. op_engine_name = iter->second;
  72. GELOGI("CheckEngineType: engine type: %d", static_cast<int>(engine_type));
  73. } else {
  74. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  75. {op_desc->GetName(), op_desc->GetType(), "engine type",
  76. "it only support kEngineNameDefault/kAIcoreEngine/kVectorEngine"});
  77. GELOGE(FAILED, "CheckEngineType: engine type: %d not support", static_cast<int>(engine_type));
  78. return FAILED;
  79. }
  80. if (op_desc->HasAttr(ATTR_NAME_UNREGST_OPPATH)) {
  81. op_desc->SetOpEngineName(op_engine_name);
  82. op_desc->SetOpKernelLibName(op_engine_name);
  83. return SUCCESS;
  84. }
  85. // set op engine name and opkernelLib. when engine support
  86. std::shared_ptr<GELib> instance_ptr = ge::GELib::GetInstance();
  87. if ((instance_ptr == nullptr) || (!instance_ptr->InitFlag())) {
  88. GELOGE(GE_CLI_GE_NOT_INITIALIZED, "CheckEngineType failed.");
  89. return FAILED;
  90. }
  91. OpsKernelManager &ops_kernel_manager = instance_ptr->OpsKernelManagerObj();
  92. std::vector<OpInfo> op_infos = ops_kernel_manager.GetOpsKernelInfo(op_desc->GetType());
  93. if (op_infos.empty()) {
  94. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  95. {op_desc->GetName(), op_desc->GetType(), "optype", "it can not find"});
  96. GELOGE(FAILED, "CheckEngineType: Can not get op info by op type %s", op_desc->GetType().c_str());
  97. return FAILED;
  98. }
  99. string kernel_name;
  100. for (const auto &it : op_infos) {
  101. if (it.engine == op_engine_name) {
  102. kernel_name = it.opKernelLib;
  103. break;
  104. }
  105. }
  106. if (kernel_name.empty()) {
  107. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  108. {op_desc->GetName(), op_desc->GetType(), "engine name" + FmtToStr(op_engine_name), "it can not find"});
  109. GELOGE(FAILED, "CheckEngineType:Can not find ops kernel, engine name: %s.", op_engine_name.c_str());
  110. return FAILED;
  111. }
  112. auto &kernel_map = ops_kernel_manager.GetAllOpsKernelInfoStores();
  113. auto kernel_info_store = kernel_map.find(kernel_name);
  114. if (kernel_info_store != kernel_map.end()) {
  115. std::string unsupported_reason;
  116. if (kernel_info_store->second->CheckSupported(op_desc, unsupported_reason)) {
  117. op_desc->SetOpEngineName(op_engine_name);
  118. op_desc->SetOpKernelLibName(kernel_name);
  119. GELOGI("CheckEngineType:Set OpKernelLibName %s and engine name %s into op_desc %s", kernel_name.c_str(),
  120. op_engine_name.c_str(), op_desc->GetName().c_str());
  121. return SUCCESS;
  122. } else {
  123. ErrorManager::GetInstance().ATCReportErrMessage(
  124. "E13002", {"optype", "opskernel", "reason"}, {op_desc->GetType(), kernel_name, unsupported_reason});
  125. GELOGE(FAILED, "CheckEngineType: check support failed, Op type %s of ops kernel %s is unsupported, reason:%s",
  126. op_desc->GetType().c_str(), kernel_name.c_str(), unsupported_reason.c_str());
  127. return FAILED;
  128. }
  129. } else {
  130. ErrorManager::GetInstance().ATCReportErrMessage(
  131. "E13003", {"opname", "optype"}, {op_desc->GetName(), op_desc->GetType()});
  132. GELOGE(FAILED,
  133. "CheckEngineType:Can not find any supported ops kernel info store by kernel_name %s,"
  134. "op type is %s, op name is %s",
  135. kernel_name.c_str(), op_desc->GetType().c_str(), op_desc->GetName().c_str());
  136. }
  137. return FAILED;
  138. }
  139. static Status AddInputs(const ComputeGraphPtr &graph, const NodePtr &node, const GeTensorDesc &tensor, int32_t index,
  140. bool attr) {
  141. GE_CHECK_NOTNULL_EXEC(graph, return PARAM_INVALID);
  142. GE_CHECK_NOTNULL_EXEC(node, return PARAM_INVALID);
  143. auto format = tensor.GetFormat();
  144. auto data_type = tensor.GetDataType();
  145. if (format == FORMAT_RESERVED && data_type == DT_UNDEFINED) {
  146. return SUCCESS;
  147. }
  148. string op_type;
  149. bool is_const = false;
  150. (void)AttrUtils::GetBool(tensor, CONST_ATTR_NAME_INPUT, is_const);
  151. if (is_const) {
  152. GELOGD("Get input[%d] is const", index);
  153. op_type = CONSTANTOP;
  154. } else if (!AttrUtils::GetStr(tensor, kAttrOpType, op_type) || op_type.empty()) {
  155. op_type = DATA;
  156. }
  157. string op_name = node->GetName() + "_in_" + std::to_string(index);
  158. OpDescPtr data_op = MakeShared<ge::OpDesc>(op_name, op_type);
  159. if (data_op == nullptr) {
  160. return FAILED;
  161. }
  162. if (is_const) {
  163. ConstGeTensorPtr tensor_value;
  164. if (!AttrUtils::GetTensor(tensor, ge::ATTR_NAME_WEIGHTS, tensor_value)) {
  165. GELOGE(FAILED, "Get value failed, node name:%s.", tensor.GetName().c_str());
  166. return FAILED;
  167. }
  168. if (!AttrUtils::SetTensor(data_op, ge::ATTR_NAME_WEIGHTS, tensor_value)) {
  169. GELOGE(FAILED, "Set attr ATTR_NAME_WEIGHTS fail.");
  170. return FAILED;
  171. }
  172. }
  173. (void)AttrUtils::SetBool(data_op, "_is_single_op", true);
  174. GE_CHK_BOOL_EXEC(data_op->AddInputDesc(tensor) == GRAPH_SUCCESS, return FAILED, "Add input desc fail.");
  175. GE_CHK_BOOL_EXEC(data_op->AddOutputDesc(tensor) == GRAPH_SUCCESS, return FAILED, "Add output desc fail.");
  176. if (attr) {
  177. GE_CHK_BOOL_EXEC(AttrUtils::SetInt(data_op, ATTR_NAME_INDEX, index), return FAILED, "Set index fail.");
  178. }
  179. ge::NodePtr arg_node = graph->AddNode(data_op);
  180. GE_CHK_BOOL_EXEC(arg_node != nullptr, return FAILED, "Insert Data node fail.");
  181. GE_CHK_STATUS(GraphUtils::AddEdge(arg_node->GetOutDataAnchor(0), node->GetInDataAnchor(index)),
  182. "Add edge[%s->%s] fail.", data_op->GetName().c_str(), node->GetName().c_str());
  183. return SUCCESS;
  184. }
  185. static Status AddOutputs(const ComputeGraphPtr &graph, const NodePtr &node, const vector<GeTensor> &outputs) {
  186. OpDescPtr op_desc = MakeShared<ge::OpDesc>(graph->GetName() + "_" + NODE_NAME_NET_OUTPUT, NETOUTPUT);
  187. if (op_desc == nullptr) {
  188. return FAILED;
  189. }
  190. (void)AttrUtils::SetBool(op_desc, "_is_single_op", true);
  191. int32_t count = 0;
  192. for (const auto &out_desc : outputs) {
  193. GeTensorDesc tensor = out_desc.GetTensorDesc();
  194. TensorUtils::SetInputTensor(tensor, true);
  195. GE_CHK_BOOL_EXEC(op_desc->AddInputDesc(tensor) == GRAPH_SUCCESS, return FAILED, "Add input desc fail");
  196. TensorUtils::SetInputTensor(tensor, false);
  197. TensorUtils::SetOutputTensor(tensor, true);
  198. GE_CHK_BOOL_EXEC(op_desc->AddOutputDesc(tensor) == GRAPH_SUCCESS, return FAILED, "Add output desc fail");
  199. count++;
  200. }
  201. GE_CHECK_NOTNULL_EXEC(graph, return PARAM_INVALID);
  202. ge::NodePtr out_node = graph->AddNode(op_desc);
  203. GE_CHK_BOOL_EXEC(out_node != nullptr, return FAILED, "Insert Output node fail.");
  204. GE_CHECK_NOTNULL_EXEC(node, return PARAM_INVALID);
  205. for (int32_t i = 0; i < count; ++i) {
  206. GE_CHK_STATUS(GraphUtils::AddEdge(node->GetOutDataAnchor(i), out_node->GetInDataAnchor(i)),
  207. "Add edge[%s->%s] fail.", node->GetName().c_str(), out_node->GetName().c_str());
  208. }
  209. return SUCCESS;
  210. }
  211. static void GetOpsProtoPath(string &opsproto_path) {
  212. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  213. if (path_env != nullptr) {
  214. string path = path_env;
  215. string file_path = RealPath(path.c_str());
  216. if (file_path.empty()) {
  217. GELOGE(FAILED, "File path %s is invalid.", path.c_str());
  218. return;
  219. }
  220. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  221. GELOGI("Get opsproto so path from env : %s", path.c_str());
  222. return;
  223. }
  224. string path_base = PluginManager::GetPath();
  225. GELOGI("path_base is %s", path_base.c_str());
  226. path_base = path_base.substr(0, path_base.rfind('/'));
  227. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  228. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  229. }
  230. static Status ResetTensorVecShape(const vector<GeTensor> &inputs, vector<GeTensor> &inputs_dynamic) {
  231. for (auto input : inputs) {
  232. auto input_desc = input.GetTensorDesc();
  233. GeShape shape_ori = input_desc.GetShape();
  234. std::vector<int64_t> dynamic_shape_dims = {kDynamicDimValue};
  235. GeShape dynamic_shape(dynamic_shape_dims);
  236. std::vector<std::pair<int64_t, int64_t>> dynamic_shape_range;
  237. ge::GeTensor inputTensor;
  238. ge::GeTensorDesc desc(input_desc);
  239. bool is_const = false;
  240. (void)AttrUtils::GetBool(input_desc, CONST_ATTR_NAME_INPUT, is_const);
  241. if (!is_const) {
  242. int64_t storage_format = FORMAT_NCHW;
  243. if (ge::AttrUtils::GetInt(desc, ge::ATTR_NAME_STORAGE_FORMAT, storage_format) &&
  244. !ge::AttrUtils::SetListInt(desc, ge::ATTR_NAME_STORAGE_SHAPE, dynamic_shape_dims)) {
  245. GELOGE(FAILED, "Set attr ATTR_NAME_STORAGE_SHAPE fail.");
  246. return FAILED;
  247. }
  248. desc.SetShape(dynamic_shape);
  249. desc.SetShapeRange(dynamic_shape_range);
  250. }
  251. inputTensor.SetTensorDesc(desc);
  252. inputs_dynamic.push_back(inputTensor);
  253. }
  254. return SUCCESS;
  255. }
  256. class GeGenerator::Impl {
  257. public:
  258. Impl(OmgContext &omg_context) : omg_context_(omg_context) {}
  259. ~Impl() = default;
  260. Status BuildModel(const Graph &graph, const vector<GeTensor> &inputs, GeRootModelPtr &ge_models);
  261. Status SaveModel(const string &file_name_prefix, GeModelPtr &models, ModelBufferData &model);
  262. Status SaveRootModel(const string &file_name_prefix, GeRootModelPtr &model, ModelBufferData &model_buff);
  263. Status SaveParams(GeModelPtr &ge_model, const string &type, const map<string, GeAttrValue> &attrs,
  264. const vector<GeTensor> &inputs, const vector<GeTensor> &outputs);
  265. Status GenerateInfershapeGraph(const Graph &graph);
  266. OmgContext &omg_context_;
  267. GraphManager graph_manager_;
  268. SaveParam save_param_;
  269. bool is_offline_ = true;
  270. bool is_singleop_unregistered_ = false;
  271. std::string build_mode_;
  272. std::string build_step_;
  273. static std::mutex mutex_;
  274. private:
  275. static std::string Trim(const std::string &str);
  276. bool ParseVersion(const std::string &line, std::string &version);
  277. bool GetVersionFromPath(const std::string &file_path, std::string &version);
  278. bool SetAtcVersionInfo(AttrHolder &obj);
  279. bool SetOppVersionInfo(AttrHolder &obj);
  280. bool SetOmSystemInfo(AttrHolder &obj);
  281. };
  282. Status GeGenerator::Initialize(const map<string, string> &options) {
  283. return Initialize(options, domi::GetContext());
  284. }
  285. Status GeGenerator::Initialize(const map<string, string> &options, OmgContext &omg_context) {
  286. impl_ = ge::MakeShared<Impl>(omg_context);
  287. if (impl_ == nullptr) {
  288. GELOGE(MEMALLOC_FAILED, "Make shared failed");
  289. return MEMALLOC_FAILED;
  290. }
  291. ErrorManager::GetInstance().SetStage(ErrorMessage::kInitialize, ErrorMessage::kOpsProtoInit);
  292. string opsproto_path;
  293. GetOpsProtoPath(opsproto_path);
  294. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  295. OpsProtoManager *manager = OpsProtoManager::Instance();
  296. map<string, string> option_tmp;
  297. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  298. (void)manager->Initialize(option_tmp);
  299. Status ret = impl_->graph_manager_.Initialize(options);
  300. if (ret != SUCCESS) {
  301. GELOGE(GE_GENERATOR_GRAPH_MANAGER_INIT_FAILED, "Graph manager initialize failed.");
  302. return GE_GENERATOR_GRAPH_MANAGER_INIT_FAILED;
  303. }
  304. // get ek file
  305. auto iter = options.find(EK_FILE);
  306. if (iter != options.end()) {
  307. impl_->save_param_.ek_file = iter->second;
  308. }
  309. // get cert file
  310. iter = options.find(CERT_FILE);
  311. if (iter != options.end()) {
  312. impl_->save_param_.cert_file = iter->second;
  313. }
  314. // get hw key file
  315. iter = options.find(HW_KEY_FILE);
  316. if (iter != options.end()) {
  317. impl_->save_param_.hw_key_file = iter->second;
  318. }
  319. // get private file
  320. iter = options.find(PRIVATE_KEY_FILE);
  321. if (iter != options.end()) {
  322. impl_->save_param_.pri_key_file = iter->second;
  323. }
  324. // get build mode
  325. iter = options.find(BUILD_MODE);
  326. if (iter != options.end()) {
  327. impl_->build_mode_ = iter->second;
  328. }
  329. // get build step
  330. iter = options.find(BUILD_STEP);
  331. if (iter != options.end()) {
  332. impl_->build_step_ = iter->second;
  333. }
  334. return SUCCESS;
  335. }
  336. Status GeGenerator::Finalize() {
  337. ErrorManager::GetInstance().SetStage(ErrorMessage::kFinalize, ErrorMessage::kFinalize);
  338. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  339. Status ret = impl_->graph_manager_.Finalize();
  340. if (ret != SUCCESS) {
  341. GELOGE(GE_GENERATOR_GRAPH_MANAGER_FINALIZE_FAILED, "Graph manager finalize failed.");
  342. return GE_GENERATOR_GRAPH_MANAGER_FINALIZE_FAILED;
  343. }
  344. return SUCCESS;
  345. }
  346. Status GeGenerator::GenerateOfflineModel(const Graph &graph, const string &file_name_prefix,
  347. const vector<GeTensor> &inputs) {
  348. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  349. GELOGI("Start to generate offline model.");
  350. ModelBufferData model;
  351. return GenerateModel(graph, file_name_prefix, inputs, model, true);
  352. }
  353. Status GeGenerator::GenerateOnlineModel(const Graph &graph, const vector<GeTensor> &inputs, ModelBufferData &model) {
  354. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  355. return GenerateModel(graph, "online", inputs, model, false);
  356. }
  357. Status GeGenerator::GenerateInfershapeGraph(const Graph &graph) {
  358. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  359. Status ret = impl_->GenerateInfershapeGraph(graph);
  360. if (ret != SUCCESS) {
  361. GELOGE(ret, "Dump infershape json failed");
  362. if (impl_->graph_manager_.Finalize() != SUCCESS) {
  363. GELOGE(FAILED, "graph_manager finalize fail.");
  364. }
  365. return ret;
  366. }
  367. GELOGI("Generate infer shape graph success");
  368. return SUCCESS;
  369. }
  370. std::mutex GeGenerator::Impl::mutex_;
  371. // Remove the space and tab before and after the string
  372. std::string GeGenerator::Impl::Trim(const std::string &str) {
  373. if (str.empty()) {
  374. return str;
  375. }
  376. std::string::size_type start = str.find_first_not_of(" \t\r\n");
  377. if (start == std::string::npos) {
  378. return str;
  379. }
  380. std::string::size_type end = str.find_last_not_of(" \t\r\n") + 1;
  381. return str.substr(start, end);
  382. }
  383. // Parsing the command line
  384. bool GeGenerator::Impl::ParseVersion(const std::string &line, std::string &version) {
  385. std::string flag = "Version=";
  386. std::string temp = Trim(line);
  387. if (temp.empty()) {
  388. GELOGW("line is empty.");
  389. return false;
  390. }
  391. std::string::size_type pos = temp.find(flag);
  392. if (pos == std::string::npos) {
  393. GELOGW("Incorrect line [%s], it must include [%s].", line.c_str(), flag.c_str());
  394. return false;
  395. }
  396. if (temp.size() == flag.size()) {
  397. GELOGW("version information is empty. %s", line.c_str());
  398. return false;
  399. }
  400. version = temp.substr(pos + flag.size());
  401. return true;
  402. }
  403. bool GeGenerator::Impl::GetVersionFromPath(const std::string &file_path, std::string &version) {
  404. // Normalize the path
  405. string resolved_file_path = RealPath(file_path.c_str());
  406. if (resolved_file_path.empty()) {
  407. GELOGW("Invalid input file path [%s], make sure that the file path is correct.", file_path.c_str());
  408. return false;
  409. }
  410. std::ifstream fs(resolved_file_path, std::ifstream::in);
  411. if (!fs.is_open()) {
  412. GELOGW("Open %s failed.", file_path.c_str());
  413. return false;
  414. }
  415. std::string line;
  416. if (getline(fs, line)) {
  417. if (!ParseVersion(line, version)) {
  418. GELOGW("Parse version failed. content is [%s].", line.c_str());
  419. fs.close();
  420. return false;
  421. }
  422. } else {
  423. GELOGW("No version information found in the file path:%s", file_path.c_str());
  424. fs.close();
  425. return false;
  426. }
  427. fs.close(); // close the file
  428. return true;
  429. }
  430. // Set package version information in the model
  431. bool GeGenerator::Impl::SetAtcVersionInfo(AttrHolder &obj) {
  432. std::string path_base = ge::GELib::GetPath();
  433. path_base = path_base.substr(0, path_base.rfind('/'));
  434. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  435. std::string version_path = path_base + "version.info";
  436. std::string version;
  437. if (!GetVersionFromPath(version_path, version)) {
  438. GELOGW("Get atc version information failed!");
  439. return false;
  440. }
  441. // set version info
  442. if (!ge::AttrUtils::SetStr(obj, ATTR_MODEL_ATC_VERSION, version)) {
  443. GELOGW("Ge model set atc version failed!");
  444. return false;
  445. }
  446. return true;
  447. }
  448. // Set package version information in the model
  449. bool GeGenerator::Impl::SetOppVersionInfo(AttrHolder &obj) {
  450. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  451. if (path_env == nullptr) {
  452. GELOGW("Get environment variable ASCEND_OPP_PATH failed!");
  453. return false;
  454. }
  455. std::string version_path = path_env;
  456. version_path += "/version.info";
  457. std::string version;
  458. if (!GetVersionFromPath(version_path, version)) {
  459. GELOGW("Get opp version information failed!");
  460. return false;
  461. }
  462. // set version info
  463. if (!ge::AttrUtils::SetStr(obj, ATTR_MODEL_OPP_VERSION, version)) {
  464. GELOGW("Ge model set opp version failed!");
  465. return false;
  466. }
  467. return true;
  468. }
  469. bool GeGenerator::Impl::SetOmSystemInfo(AttrHolder &obj) {
  470. std::string soc_version;
  471. (void)ge::GetContext().GetOption(ge::SOC_VERSION, soc_version);
  472. GELOGI("SetOmSystemInfo soc_version: %s", soc_version.c_str());
  473. if (!ge::AttrUtils::SetStr(obj, "soc_version", soc_version)) {
  474. GELOGW("SetStr of soc_version failed.");
  475. return false;
  476. }
  477. std::string framework_type;
  478. (void)ge::GetContext().GetOption(ge::FRAMEWORK_TYPE, framework_type);
  479. GELOGI("SetOmSystemInfo framework_type: %s", framework_type.c_str());
  480. auto iter = ge::kFwkTypeToStr.find(framework_type);
  481. if (iter == ge::kFwkTypeToStr.end()) {
  482. GELOGW("Can not find framework_type in the map.");
  483. return false;
  484. }
  485. if (!ge::AttrUtils::SetStr(obj, "framework_type", iter->second)) {
  486. GELOGW("SetStr of framework_type failed.");
  487. return false;
  488. }
  489. return true;
  490. }
  491. Status GeGenerator::GenerateModel(const Graph &graph, const string &file_name_prefix, const vector<GeTensor> &inputs,
  492. ModelBufferData &model, bool is_offline) {
  493. rtContext_t ctx = nullptr;
  494. auto rt = rtCtxGetCurrent(&ctx);
  495. if (rt != RT_ERROR_NONE) {
  496. GELOGD("Current ctx is null.");
  497. ctx = nullptr;
  498. }
  499. GeRootModelPtr ge_root_model = nullptr;
  500. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  501. impl_->is_offline_ = is_offline;
  502. Status ret = impl_->BuildModel(graph, inputs, ge_root_model);
  503. if (ret != SUCCESS) {
  504. GELOGE(ret, "Build model failed.");
  505. if (impl_->graph_manager_.Finalize() != SUCCESS) {
  506. GELOGE(FAILED, "graph_manager finalize fail.");
  507. }
  508. return ret;
  509. }
  510. /// BUILD_MODE_TUNING with BUILD_STEP_BEFORE_UB_MATCH no need save model;
  511. /// BUILD_MODE_TUNING with BUILD_STEP_AFTER_BUILDER no need save model;
  512. /// BUILD_MODE_TUNING with BUILD_STEP_AFTER_BUILDER_SUB no need save model.
  513. if ((impl_->build_mode_ == BUILD_MODE_TUNING) &&
  514. (impl_->build_step_ == BUILD_STEP_BEFORE_UB_MATCH || impl_->build_step_ == BUILD_STEP_AFTER_BUILDER ||
  515. impl_->build_step_ == BUILD_STEP_AFTER_BUILDER_SUB)) {
  516. GELOGI("Build mode:%s with step:%s no need SaveModel.",
  517. impl_->build_mode_.c_str(),
  518. impl_->build_step_.c_str());
  519. return SUCCESS;
  520. }
  521. GE_CHECK_NOTNULL(ge_root_model);
  522. GE_CHECK_NOTNULL(ge_root_model->GetRootGraph());
  523. ModelHelper model_helper;
  524. string model_name = "";
  525. Status name_ret = model_helper.GetModelNameFromMergedGraphName(ge_root_model->GetRootGraph()->GetName(),
  526. model_name);
  527. if (name_ret != SUCCESS) {
  528. ErrorManager::GetInstance().ATCReportErrMessage("E10000", {"parameter"}, {"output"});
  529. GELOGE(FAILED, "Get model_name failed. Param --output is invalid.");
  530. return PARAM_INVALID;
  531. }
  532. map<string, GeModelPtr> name_to_ge_model = ge_root_model->GetSubgraphInstanceNameToModel();
  533. GeModelPtr &ge_model = name_to_ge_model[ge_root_model->GetRootGraph()->GetName()];
  534. GE_RETURN_WITH_LOG_IF_FALSE(ge_model != nullptr, "ge_model cannot be null");
  535. ge_model->SetName(model_name);
  536. ret = impl_->SaveRootModel(file_name_prefix, ge_root_model, model);
  537. if (ret != SUCCESS) {
  538. GELOGE(ret, "Save model failed");
  539. if (impl_->graph_manager_.Finalize() != SUCCESS) {
  540. GELOGE(FAILED, "graph_manager finalize fail.");
  541. }
  542. return ret;
  543. }
  544. if (ctx != nullptr) {
  545. (void)rtCtxSetCurrent(ctx);
  546. }
  547. return SUCCESS;
  548. }
  549. namespace {
  550. bool IsNeedConnectInputOpForSingleOp(GeTensorDesc &tensor_desc) {
  551. bool is_need = true;
  552. // format and dtype is all reserved, stand for Optional input. When singleop scene
  553. if (tensor_desc.GetFormat() == FORMAT_RESERVED && tensor_desc.GetDataType() == DT_UNDEFINED) {
  554. is_need = false;
  555. }
  556. return is_need;
  557. }
  558. Status CheckDynamicSupport(GeModelPtr &ge_model, const ComputeGraphPtr &graph) {
  559. bool support_dynamic = true;
  560. bool is_dynamic = false;
  561. for (const auto &node : graph->GetDirectNode()) {
  562. GE_CHECK_NOTNULL(node);
  563. auto op_desc = node->GetOpDesc();
  564. GE_CHECK_NOTNULL(op_desc);
  565. if (op_desc->GetOpEngineName() != kAIcoreEngine) {
  566. continue;
  567. }
  568. if (AttrUtils::HasAttr(op_desc, kAttrSupportDynamicShape)) {
  569. is_dynamic = true;
  570. (void) AttrUtils::GetBool(op_desc, kAttrSupportDynamicShape, support_dynamic);
  571. if (!support_dynamic) {
  572. GELOGW("Node[%s] doesn't support dynamic shape.", node->GetName().c_str());
  573. break;
  574. }
  575. }
  576. }
  577. if (is_dynamic) {
  578. (void) AttrUtils::SetBool(ge_model, kAttrSupportDynamicShape, support_dynamic);
  579. }
  580. return SUCCESS;
  581. }
  582. }
  583. Status GeGenerator::CheckForSingleOp(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  584. const vector<GeTensor> &outputs) {
  585. GE_CHECK_NOTNULL_EXEC(op_desc, return PARAM_INVALID);
  586. if (!inputs.empty() && (inputs.size() != op_desc->GetAllInputsSize())) {
  587. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  588. {op_desc->GetName(), op_desc->GetType(), "inputs size" + FmtToStr(op_desc->GetAllInputsSize()),
  589. "tensor size is " + FmtToStr(inputs.size())});
  590. GELOGE(PARAM_INVALID, "Tensor size: %zu, Inputs size: %zu", inputs.size(), op_desc->GetAllInputsSize());
  591. return PARAM_INVALID;
  592. }
  593. if (!outputs.empty() && (outputs.size() != op_desc->GetOutputsSize())) {
  594. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  595. {op_desc->GetName(), op_desc->GetType(), "outputs size" + FmtToStr(op_desc->GetOutputsSize()),
  596. "tensor size is " + FmtToStr(outputs.size())});
  597. GELOGE(PARAM_INVALID, "Tensor size: %zu, Outputs size: %zu", outputs.size(), op_desc->GetOutputsSize());
  598. return PARAM_INVALID;
  599. }
  600. return SUCCESS;
  601. }
  602. Status GeGenerator::BuildSingleOp(OpDescPtr &op_desc, const vector<GeTensor> &inputs, const vector<GeTensor> &outputs,
  603. const string &model_file_name, OpEngineType engine_type, ModelBufferData &model_buff,
  604. bool is_offline) {
  605. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  606. impl_->is_offline_ = is_offline;
  607. if (!is_offline) {
  608. (void)AttrUtils::SetBool(op_desc, ATTR_SINGLE_OP_SCENE, true);
  609. }
  610. if (CheckForSingleOp(op_desc, inputs, outputs) != SUCCESS) {
  611. GELOGE(PARAM_INVALID, "input param is invalid when build single op!");
  612. return PARAM_INVALID;
  613. }
  614. OmgContext &omg_context = (impl_ == nullptr) ? domi::GetContext() : impl_->omg_context_;
  615. omg_context.is_dynamic_input = ContainsDynamicInpus(*op_desc);
  616. if (op_desc->HasAttr(ATTR_NAME_UNREGST_OPPATH)) {
  617. impl_->is_singleop_unregistered_ = true;
  618. }
  619. // 0. Save original attributes.
  620. OpDescPtr op_desc_tmp = AttrUtils::CloneOpDesc(op_desc);
  621. GE_CHECK_NOTNULL(op_desc_tmp);
  622. // 1. check engine type when compile online
  623. if (model_file_name == kFileNameSuffix) {
  624. Status ret = CheckEngineTypeSupport(op_desc, engine_type);
  625. if (ret != SUCCESS) {
  626. GELOGE(ret, "check engine type failed.");
  627. return ret;
  628. }
  629. }
  630. // 2. Create ComputeGraph.
  631. string name = ge::CurrentTimeInStr() + "_" + model_file_name;
  632. Graph graph;
  633. if (BuildSingleOpGraph(op_desc, inputs, outputs, name, graph) != ge::SUCCESS) {
  634. GELOGE(GRAPH_FAILED, "make graph fail.");
  635. return GRAPH_FAILED;
  636. }
  637. GELOGI("ATC parser success in single op build.");
  638. GeRootModelPtr ge_root_model = nullptr;
  639. GE_CHK_STATUS_RET_NOLOG(impl_->BuildModel(graph, inputs, ge_root_model));
  640. map<string, GeAttrValue> op_attrs = op_desc_tmp->GetAllAttrs();
  641. GE_CHECK_NOTNULL(ge_root_model);
  642. GE_CHECK_NOTNULL(ge_root_model->GetRootGraph());
  643. map<string, GeModelPtr> name_to_ge_model = ge_root_model->GetSubgraphInstanceNameToModel();
  644. if (name_to_ge_model.empty()) {
  645. GELOGE(PARAM_INVALID, "GetSubgraphInstanceNameToModel is empty.");
  646. return PARAM_INVALID;
  647. }
  648. const ComputeGraphPtr root_graph = ge_root_model->GetRootGraph();
  649. GeModelPtr &ge_model = name_to_ge_model.begin()->second;
  650. GE_CHK_STATUS_RET_NOLOG(CheckDynamicSupport(ge_model, root_graph));
  651. GELOGI("After build model, The opType in op_desc_tmp is [%s]", op_desc_tmp->GetType().c_str());
  652. bool all_shape = false;
  653. (void)AttrUtils::GetBool(op_desc, kAicpuAllshape, all_shape);
  654. if (all_shape) {
  655. GELOGD("Get aicpu all_shape kernel!");
  656. vector<GeTensor> inputs_dynamic;
  657. vector<GeTensor> outputs_dynamic;
  658. GE_CHK_STATUS_RET_NOLOG(ResetTensorVecShape(inputs, inputs_dynamic));
  659. GE_CHK_STATUS_RET_NOLOG(ResetTensorVecShape(outputs, outputs_dynamic));
  660. GE_CHK_STATUS_RET_NOLOG(
  661. impl_->SaveParams(ge_model, op_desc_tmp->GetType(), op_attrs, inputs_dynamic, outputs_dynamic));
  662. } else {
  663. GE_CHK_STATUS_RET_NOLOG(impl_->SaveParams(ge_model, op_desc_tmp->GetType(), op_attrs, inputs, outputs));
  664. }
  665. GELOGI("Start save GeModel to Model buffer");
  666. GE_CHK_STATUS_RET_NOLOG(impl_->SaveModel(model_file_name, ge_model, model_buff));
  667. return SUCCESS;
  668. }
  669. /**
  670. * @ingroup ge
  671. * @brief Compiling a single operator into an offline model
  672. * @param [in] OpDescPtr &op_desc: Operator description info that needs to be compiled into an offline model file
  673. * @param [in] vector<GeTensor> &inputs: Operator input data description information.
  674. * @param [in] vector<GeTensor> &outputs: Operator output data description information.
  675. * @param [in] const string &model_file_name: Offline model filename.
  676. * @return SUCCESS handle successfully / others handle failed
  677. */
  678. Status GeGenerator::BuildSingleOpModel(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  679. const vector<GeTensor> &outputs, const string &model_file_name) {
  680. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  681. GELOGI("Start to build single op offline model, input size: %zu, output size: %zu", inputs.size(), outputs.size());
  682. ModelBufferData model_buff;
  683. OpEngineType engine_type = ENGINE_SYS;
  684. Status status = BuildSingleOp(op_desc, inputs, outputs, model_file_name, engine_type, model_buff, true);
  685. GELOGI("Finish build single offline model, status: %u", status);
  686. return status;
  687. }
  688. /**
  689. * @ingroup ge
  690. * @brief Compiling a single operator into online buffer
  691. * @param [in] OpDescPtr &op_desc: Operator description info that needs to be compiled into an offline model file
  692. * @param [in] vector<GeTensor> &inputs: Operator input data description information.
  693. * @param [in] vector<GeTensor> &outputs: Operator output data description information.
  694. * @param [in] engine_type: specific engine.
  695. * @param [out] ModelBufferData &Model_buff: Model_buff: model buffer of the op.
  696. * @return SUCCESS handle successfully / others handle failed
  697. */
  698. Status GeGenerator::BuildSingleOpModel(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  699. const vector<GeTensor> &outputs, OpEngineType engine_type,
  700. ModelBufferData &model_buff) {
  701. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  702. GELOGI("Start to build single op online, input size: %zu, output size: %zu", inputs.size(), outputs.size());
  703. Status status = BuildSingleOp(op_desc, inputs, outputs, kFileNameSuffix, engine_type, model_buff, false);
  704. GELOGI("Finish build single online model, status: %u", status);
  705. return status;
  706. }
  707. Status GeGenerator::BuildSingleOpGraph(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  708. const vector<GeTensor> &outputs, std::string graph_name, Graph &graph) {
  709. ge::ComputeGraphPtr compute_graph = MakeShared<ComputeGraph>(graph_name);
  710. GE_CHECK_NOTNULL_EXEC(compute_graph, return INTERNAL_ERROR);
  711. // 1. Add Node to ComputeGraph.
  712. NodePtr op_node = compute_graph->AddNode(op_desc);
  713. GE_CHECK_NOTNULL_EXEC(op_node, return INTERNAL_ERROR);
  714. // 2. Create InputData node.
  715. int32_t arg_index = 0;
  716. if (inputs.empty()) {
  717. for (const auto &input_desc : op_desc->GetAllInputsDescPtr()) {
  718. GE_CHECK_NOTNULL_EXEC(input_desc, return INTERNAL_ERROR);
  719. if (!IsNeedConnectInputOpForSingleOp(*input_desc)) {
  720. continue;
  721. }
  722. GE_CHK_STATUS_RET_NOLOG(AddInputs(compute_graph, op_node, *input_desc, arg_index, false));
  723. arg_index++;
  724. }
  725. } else {
  726. for (const auto &in_desc : inputs) {
  727. GE_CHK_STATUS_RET_NOLOG(AddInputs(compute_graph, op_node, in_desc.GetTensorDesc(), arg_index, true));
  728. arg_index++;
  729. }
  730. }
  731. // 3. Create Output node.
  732. if (!outputs.empty()) {
  733. GE_CHK_STATUS_RET_NOLOG(AddOutputs(compute_graph, op_node, outputs));
  734. }
  735. // dump ComputeGraph node.
  736. compute_graph->Dump();
  737. graph = ge::GraphUtils::CreateGraphFromComputeGraph(compute_graph);
  738. return SUCCESS;
  739. }
  740. Status GeGenerator::Impl::SaveParams(GeModelPtr &ge_model, const string &type, const map<string, GeAttrValue> &attrs,
  741. const vector<GeTensor> &inputs, const vector<GeTensor> &outputs) {
  742. GE_CHECK_NOTNULL_EXEC(ge_model, return PARAM_INVALID);
  743. GE_CHK_BOOL_EXEC_NOLOG(graph_manager_.SaveParams(*ge_model, type, attrs, inputs, outputs) == SUCCESS,
  744. (void)graph_manager_.Finalize();
  745. return FAILED);
  746. return SUCCESS;
  747. }
  748. Status GeGenerator::Impl::SaveModel(const string &file_name_prefix, GeModelPtr &model, ModelBufferData &model_buff) {
  749. // set atc version
  750. if (!SetAtcVersionInfo(*(model.get()))) {
  751. GELOGW("SetPackageVersionInfo of atc failed!");
  752. }
  753. // set opp version
  754. if (!SetOppVersionInfo(*(model.get()))) {
  755. GELOGW("SetPackageVersionInfo of ops failed!");
  756. }
  757. ModelHelper model_helper;
  758. model_helper.SetSaveMode(is_offline_);
  759. Status ret = model_helper.SaveToOmModel(model, save_param_, file_name_prefix, model_buff);
  760. if (ret != SUCCESS) {
  761. GELOGE(ret, "Save to om model failed");
  762. return ret;
  763. }
  764. return SUCCESS;
  765. }
  766. Status GeGenerator::Impl::SaveRootModel(const string &file_name_prefix, GeRootModelPtr &ge_root_model,
  767. ModelBufferData &model_buff) {
  768. bool is_unknown_shape = false;
  769. auto ret = ge_root_model->CheckIsUnknownShape(is_unknown_shape);
  770. if (ret != SUCCESS) {
  771. GELOGE(FAILED, "Check root model is unkonwn shape failed");
  772. return FAILED;
  773. }
  774. GELOGD("begin save root model, cur model is unkonwn shape model ? : %d", is_unknown_shape);
  775. GE_CHK_BOOL_EXEC(!ge_root_model->GetSubgraphInstanceNameToModel().empty(), return FAILED,
  776. "ge root model has no sub model")
  777. GeModelPtr model_root = nullptr;
  778. if (is_unknown_shape) {
  779. model_root = make_shared<GeModel>();
  780. model_root->SetGraph(GraphUtils::CreateGraphFromComputeGraph(ge_root_model->GetRootGraph()));
  781. ge_root_model->SetSubgraphInstanceNameToModel(ge_root_model->GetRootGraph()->GetName(), model_root);
  782. model_root->SetName(ge_root_model->GetRootGraph()->GetName());
  783. } else {
  784. model_root = ge_root_model->GetSubgraphInstanceNameToModel().begin()->second;
  785. }
  786. // set atc version
  787. if (!SetAtcVersionInfo(*(model_root.get()))) {
  788. GELOGW("SetPackageVersionInfo of atc failed!");
  789. }
  790. // set opp version
  791. if (!SetOppVersionInfo(*(model_root.get()))) {
  792. GELOGW("SetPackageVersionInfo of ops failed!");
  793. }
  794. if (!SetOmSystemInfo(*(model_root.get()))) {
  795. GELOGW("SetOmsystemInfo failed!");
  796. }
  797. ModelHelper model_helper;
  798. model_helper.SetSaveMode(is_offline_);
  799. ret = model_helper.SaveToOmRootModel(ge_root_model, save_param_, file_name_prefix, model_buff, is_unknown_shape);
  800. if (ret != SUCCESS) {
  801. GELOGE(ret, "Save to om model failed");
  802. return ret;
  803. }
  804. return SUCCESS;
  805. }
  806. Status GeGenerator::Impl::BuildModel(const Graph &graph, const vector<GeTensor> &inputs,
  807. GeRootModelPtr &ge_root_model) {
  808. static std::atomic<GraphId> atomic_graph_id(0);
  809. auto graph_id = atomic_graph_id.fetch_add(1);
  810. const std::map<std::string, std::string> options;
  811. Status ret = graph_manager_.AddGraph(graph_id, graph, options, omg_context_);
  812. if (ret != SUCCESS) {
  813. GELOGE(GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED, "GraphManager add graph fail, graph id: %u", graph_id);
  814. (void)graph_manager_.Finalize();
  815. return GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED;
  816. }
  817. graph_manager_.SetOptionsRunGraphFlag(false);
  818. static std::atomic<uint64_t> atomic_session_id(0);
  819. auto session_id = atomic_session_id.fetch_add(1);
  820. if (is_singleop_unregistered_) {
  821. ret = graph_manager_.BuildGraphForUnregisteredOp(graph_id, inputs, ge_root_model, session_id);
  822. } else {
  823. ret = graph_manager_.BuildGraph(graph_id, inputs, ge_root_model, session_id);
  824. }
  825. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  826. if (ret != SUCCESS) {
  827. GELOGE(GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED, "GraphManager build graph fail, graph id: %u", graph_id);
  828. VarManagerPool::Instance().RemoveVarManager(session_id);
  829. return GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED;
  830. }
  831. VarManagerPool::Instance().RemoveVarManager(session_id);
  832. return SUCCESS;
  833. }
  834. Status GeGenerator::Impl::GenerateInfershapeGraph(const Graph &graph) {
  835. static std::atomic<GraphId> atomic_graph_id(0);
  836. auto graph_id = atomic_graph_id.fetch_add(1);
  837. const std::map<std::string, std::string> options;
  838. Status ret = graph_manager_.AddGraph(graph_id, graph, options, omg_context_);
  839. if (ret != SUCCESS) {
  840. GELOGE(GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED, "GraphManager add graph failed, graph id: %u", graph_id);
  841. (void)graph_manager_.Finalize();
  842. return GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED;
  843. }
  844. ret = graph_manager_.GenerateInfershapeGraph(graph_id);
  845. if (ret != SUCCESS) {
  846. GELOGE(GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED, "GraphManager generate graph failed");
  847. return GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED;
  848. }
  849. return SUCCESS;
  850. }
  851. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,而用户对此并无感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。