You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ge_generator.cc 44 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "generator/ge_generator.h"
  17. #include <atomic>
  18. #include "common/ge/ge_util.h"
  19. #include "common/ge/plugin_manager.h"
  20. #include "common/helper/model_helper.h"
  21. #include "common/helper/om_file_helper.h"
  22. #include "common/util.h"
  23. #include "common/util/error_manager/error_manager.h"
  24. #include "framework/common/debug/ge_log.h"
  25. #include "framework/common/debug/log.h"
  26. #include "ge/ge_api.h"
  27. #include "graph/debug/ge_attr_define.h"
  28. #include "graph/ge_context.h"
  29. #include "graph/manager/graph_manager.h"
  30. #include "graph/manager/util/rt_context_util.h"
  31. #include "graph/opsproto_manager.h"
  32. #include "graph/utils/graph_utils.h"
  33. #include "graph/utils/type_utils.h"
  34. #include "init/gelib.h"
  35. #include "model/ge_model.h"
  36. #include "analyzer/analyzer.h"
  37. using std::map;
  38. using std::string;
  39. using std::vector;
  40. namespace {
  41. const char *const kAttrOpType = "op_type";
  42. const char *const kEngineNameDefault = "default";
  43. const char *const kVectorEngine = "VectorEngine";
  44. const char *const kAIcoreEngine = "AIcoreEngine";
  45. const char *const kFileNameSuffix = "online";
  46. const char *const kAicpuAllshape = "_AllShape";
  47. constexpr char const *kAttrSupportDynamicShape = "support_dynamicshape";
  48. const int64_t kDynamicDimValue = -2;
  49. const int kDefaultDeviceId = 0;
  50. const int kDefaultJobId = 0;
  51. const int32_t kFuzzBuildPattern = 1;
  52. std::map<ge::OpEngineType, std::string> engine_type_map{
  53. {ge::ENGINE_SYS, kEngineNameDefault},
  54. {ge::ENGINE_AICORE, kAIcoreEngine},
  55. {ge::ENGINE_VECTOR, kVectorEngine}};
  56. bool ContainsDynamicInpus(const ge::OpDesc &op_desc) {
  57. for (auto &tensor_desc : op_desc.GetAllInputsDescPtr()) {
  58. if (tensor_desc->MutableShape().IsUnknownShape()) {
  59. GELOGI("Contains unknown shape input. set is_dynamic_input to true.");
  60. return true;
  61. }
  62. }
  63. return false;
  64. }
  65. // if optional in/out, format is format_reserved and dtype is dt_undefined
  66. bool IsOptional(const ge::GeTensorDesc &tensor_desc) {
  67. return tensor_desc.GetFormat() == ge::FORMAT_RESERVED && tensor_desc.GetDataType() == ge::DT_UNDEFINED;
  68. }
  69. } // namespace
  70. namespace ge {
  71. static Status CheckEngineTypeSupport(const NodePtr &node, OpEngineType engine_type) {
  72. const OpDescPtr &op_desc = node->GetOpDesc();
  73. GE_CHECK_NOTNULL_EXEC(op_desc, return PARAM_INVALID);
  74. if (engine_type == ENGINE_SYS) {
  75. GELOGI("CheckEngineType: use default engine.");
  76. return SUCCESS;
  77. }
  78. // get op engine name
  79. string op_engine_name;
  80. auto iter = engine_type_map.find(engine_type);
  81. if (iter != engine_type_map.end()) {
  82. op_engine_name = iter->second;
  83. GELOGI("CheckEngineType: engine type: %d", static_cast<int>(engine_type));
  84. } else {
  85. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  86. {op_desc->GetName(), op_desc->GetType(), "engine type",
  87. "it only support default/AIcoreEngine/VectorEngine"});
  88. GELOGE(FAILED, "[Check][EngineType]value:%d not support, "
  89. "only support default/AIcoreEngine/VectorEngine now", static_cast<int>(engine_type));
  90. return FAILED;
  91. }
  92. if (op_desc->HasAttr(ATTR_NAME_UNREGST_OPPATH)) {
  93. op_desc->SetOpEngineName(op_engine_name);
  94. op_desc->SetOpKernelLibName(op_engine_name);
  95. return SUCCESS;
  96. }
  97. // set op engine name and opkernelLib. when engine support
  98. std::shared_ptr<GELib> instance_ptr = ge::GELib::GetInstance();
  99. if ((instance_ptr == nullptr) || (!instance_ptr->InitFlag())) {
  100. GELOGE(GE_CLI_GE_NOT_INITIALIZED, "CheckEngineType failed.");
  101. return FAILED;
  102. }
  103. OpsKernelManager &ops_kernel_manager = instance_ptr->OpsKernelManagerObj();
  104. std::vector<OpInfo> op_infos = ops_kernel_manager.GetOpsKernelInfo(op_desc->GetType());
  105. if (op_infos.empty()) {
  106. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  107. {op_desc->GetName(), op_desc->GetType(), "optype", "it can not find"});
  108. GELOGE(FAILED, "CheckEngineType: Can not get op info by op type %s", op_desc->GetType().c_str());
  109. return FAILED;
  110. }
  111. string kernel_name;
  112. for (const auto &it : op_infos) {
  113. if (it.engine == op_engine_name) {
  114. kernel_name = it.opKernelLib;
  115. break;
  116. }
  117. }
  118. if (kernel_name.empty()) {
  119. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  120. {op_desc->GetName(), op_desc->GetType(), "engine name" + FmtToStr(op_engine_name), "it can not find"});
  121. GELOGE(FAILED, "CheckEngineType:Can not find ops kernel, engine name: %s.", op_engine_name.c_str());
  122. return FAILED;
  123. }
  124. auto &kernel_map = ops_kernel_manager.GetAllOpsKernelInfoStores();
  125. auto kernel_info_store = kernel_map.find(kernel_name);
  126. if (kernel_info_store != kernel_map.end()) {
  127. std::string unsupported_reason;
  128. if (kernel_info_store->second->CheckSupported(node, unsupported_reason)) {
  129. op_desc->SetOpEngineName(op_engine_name);
  130. op_desc->SetOpKernelLibName(kernel_name);
  131. GELOGI("CheckEngineType:Set OpKernelLibName %s and engine name %s into op_desc %s", kernel_name.c_str(),
  132. op_engine_name.c_str(), op_desc->GetName().c_str());
  133. return SUCCESS;
  134. } else {
  135. ErrorManager::GetInstance().ATCReportErrMessage(
  136. "E13002", {"optype", "opskernel", "reason"}, {op_desc->GetType(), kernel_name, unsupported_reason});
  137. GELOGE(FAILED, "CheckEngineType: check support failed, Op type %s of ops kernel %s is unsupported, reason:%s",
  138. op_desc->GetType().c_str(), kernel_name.c_str(), unsupported_reason.c_str());
  139. return FAILED;
  140. }
  141. } else {
  142. ErrorManager::GetInstance().ATCReportErrMessage(
  143. "E13003", {"opname", "optype"}, {op_desc->GetName(), op_desc->GetType()});
  144. GELOGE(FAILED,
  145. "CheckEngineType:Can not find any supported ops kernel info store by kernel_name %s,"
  146. "op type is %s, op name is %s",
  147. kernel_name.c_str(), op_desc->GetType().c_str(), op_desc->GetName().c_str());
  148. }
  149. return FAILED;
  150. }
  151. static Status AddInputs(const ComputeGraphPtr &graph, const NodePtr &node, const GeTensorDesc &tensor, int32_t index,
  152. bool attr, int32_t &data_index) {
  153. GE_CHECK_NOTNULL_EXEC(graph, return PARAM_INVALID);
  154. GE_CHECK_NOTNULL_EXEC(node, return PARAM_INVALID);
  155. auto format = tensor.GetFormat();
  156. auto data_type = tensor.GetDataType();
  157. if (format == FORMAT_RESERVED && data_type == DT_UNDEFINED) {
  158. return SUCCESS;
  159. }
  160. string op_type;
  161. bool is_const = false;
  162. (void)AttrUtils::GetBool(tensor, CONST_ATTR_NAME_INPUT, is_const);
  163. if (is_const) {
  164. GELOGD("Get input[%d] is const", index);
  165. op_type = CONSTANTOP;
  166. } else if (!AttrUtils::GetStr(tensor, kAttrOpType, op_type) || op_type.empty()) {
  167. op_type = DATA;
  168. }
  169. string op_name = node->GetName() + "_in_" + std::to_string(index);
  170. OpDescPtr data_op = MakeShared<ge::OpDesc>(op_name, op_type);
  171. if (data_op == nullptr) {
  172. return FAILED;
  173. }
  174. if (is_const) {
  175. ConstGeTensorPtr tensor_value;
  176. if (!AttrUtils::GetTensor(tensor, ge::ATTR_NAME_WEIGHTS, tensor_value)) {
  177. GELOGE(FAILED, "Get value failed, node name:%s.", tensor.GetName().c_str());
  178. return FAILED;
  179. }
  180. if (!AttrUtils::SetTensor(data_op, ge::ATTR_NAME_WEIGHTS, tensor_value)) {
  181. GELOGE(FAILED, "Set attr ATTR_NAME_WEIGHTS fail.");
  182. return FAILED;
  183. }
  184. }
  185. (void)AttrUtils::SetBool(data_op, "_is_single_op", true);
  186. GE_CHK_BOOL_EXEC(data_op->AddInputDesc(tensor) == GRAPH_SUCCESS, return FAILED,
  187. "[Add][InputDesc]fail for node:%s", data_op->GetName().c_str());
  188. GE_CHK_BOOL_EXEC(data_op->AddOutputDesc(tensor) == GRAPH_SUCCESS, return FAILED,
  189. "[Add][OutputDesc]fail for node:%s", data_op->GetName().c_str());
  190. if (attr && !is_const) {
  191. GE_CHK_BOOL_EXEC(AttrUtils::SetInt(data_op, ATTR_NAME_INDEX, data_index), return FAILED,
  192. "[Set][Attr:%s]fail for node:%s", ATTR_NAME_INDEX.c_str(), data_op->GetName().c_str());
  193. ++data_index;
  194. }
  195. ge::NodePtr arg_node = graph->AddNode(data_op);
  196. GE_CHK_BOOL_EXEC(arg_node != nullptr, return FAILED, "Insert Data node fail");
  197. GE_CHK_STATUS(GraphUtils::AddEdge(arg_node->GetOutDataAnchor(0), node->GetInDataAnchor(index)),
  198. "[Add][Edge]fail from node:%s to node:%s", data_op->GetName().c_str(), node->GetName().c_str());
  199. return SUCCESS;
  200. }
  201. static Status AddOutputs(const ComputeGraphPtr &graph, const NodePtr &node, const vector<GeTensor> &outputs) {
  202. OpDescPtr op_desc = MakeShared<ge::OpDesc>(graph->GetName() + "_" + NODE_NAME_NET_OUTPUT, NETOUTPUT);
  203. if (op_desc == nullptr) {
  204. return FAILED;
  205. }
  206. (void)AttrUtils::SetBool(op_desc, "_is_single_op", true);
  207. int32_t count = 0;
  208. for (const auto &out_desc : outputs) {
  209. GeTensorDesc tensor = out_desc.GetTensorDesc();
  210. TensorUtils::SetInputTensor(tensor, true);
  211. GE_CHK_BOOL_EXEC(op_desc->AddInputDesc(tensor) == GRAPH_SUCCESS, return FAILED,
  212. "[Add][InputDesc]fail for node:%s", op_desc->GetName().c_str());
  213. TensorUtils::SetInputTensor(tensor, false);
  214. TensorUtils::SetOutputTensor(tensor, true);
  215. GE_CHK_BOOL_EXEC(op_desc->AddOutputDesc(tensor) == GRAPH_SUCCESS, return FAILED,
  216. "[Add][OutputDesc]fail for node:%s", op_desc->GetName().c_str());
  217. count++;
  218. }
  219. GE_CHECK_NOTNULL_EXEC(graph, return PARAM_INVALID);
  220. ge::NodePtr out_node = graph->AddNode(op_desc);
  221. GE_CHK_BOOL_EXEC(out_node != nullptr, return FAILED,
  222. "[Add][Node:%s]fail in graph:%u", op_desc->GetName().c_str(), graph->GetGraphID());
  223. GE_CHECK_NOTNULL_EXEC(node, return PARAM_INVALID);
  224. for (int32_t i = 0; i < count; ++i) {
  225. GE_CHK_STATUS(GraphUtils::AddEdge(node->GetOutDataAnchor(i), out_node->GetInDataAnchor(i)),
  226. "[Add][Edge]fail from node:%s to node:%s", node->GetName().c_str(), out_node->GetName().c_str());
  227. }
  228. return SUCCESS;
  229. }
  230. static void GetOpsProtoPath(string &opsproto_path) {
  231. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  232. if (path_env != nullptr) {
  233. string path = path_env;
  234. string file_path = RealPath(path.c_str());
  235. if (file_path.empty()) {
  236. GELOGE(FAILED, "File path %s is invalid.", path.c_str());
  237. return;
  238. }
  239. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  240. GELOGI("Get opsproto so path from env : %s", path.c_str());
  241. return;
  242. }
  243. string path_base = PluginManager::GetPath();
  244. GELOGI("path_base is %s", path_base.c_str());
  245. path_base = path_base.substr(0, path_base.rfind('/'));
  246. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  247. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  248. }
  249. static Status ResetTensorVecShape(const vector<GeTensor> &inputs, vector<GeTensor> &inputs_dynamic) {
  250. for (auto input : inputs) {
  251. auto input_desc = input.GetTensorDesc();
  252. GeShape shape_ori = input_desc.GetShape();
  253. std::vector<int64_t> dynamic_shape_dims = {kDynamicDimValue};
  254. GeShape dynamic_shape(dynamic_shape_dims);
  255. std::vector<std::pair<int64_t, int64_t>> dynamic_shape_range;
  256. ge::GeTensor inputTensor;
  257. ge::GeTensorDesc desc(input_desc);
  258. bool is_const = false;
  259. (void)AttrUtils::GetBool(input_desc, CONST_ATTR_NAME_INPUT, is_const);
  260. if (!is_const) {
  261. int64_t storage_format = FORMAT_NCHW;
  262. if (ge::AttrUtils::GetInt(desc, ge::ATTR_NAME_STORAGE_FORMAT, storage_format) &&
  263. !ge::AttrUtils::SetListInt(desc, ge::ATTR_NAME_STORAGE_SHAPE, dynamic_shape_dims)) {
  264. GELOGE(FAILED, "Set attr ATTR_NAME_STORAGE_SHAPE fail.");
  265. return FAILED;
  266. }
  267. desc.SetShape(dynamic_shape);
  268. desc.SetShapeRange(dynamic_shape_range);
  269. }
  270. inputTensor.SetTensorDesc(desc);
  271. inputs_dynamic.push_back(inputTensor);
  272. }
  273. return SUCCESS;
  274. }
  275. static Status GetFuzzBuildAttrs(const OpDescPtr &op_desc, const GeRootModelPtr &ge_root_model,
  276. GeAttrValue::LIST_NAMED_ATTRS &fuzz_build_attrs) {
  277. GELOGD("Start get fuzz build attrs of %s.", op_desc->GetName().c_str());
  278. GE_CHECK_NOTNULL(ge_root_model->GetRootGraph());
  279. for (const auto &node : ge_root_model->GetRootGraph()->GetAllNodes()) {
  280. GE_CHECK_NOTNULL(node);
  281. GE_CHECK_NOTNULL(node->GetOpDesc());
  282. GELOGD("Delete fuzz build attr of %s after build.", node->GetName().c_str());
  283. node->GetOpDesc()->DelAttr(ATTR_NAME_FUZZ_BUILD);
  284. }
  285. (void)AttrUtils::GetListNamedAttrs(op_desc, ATTR_NAME_FUZZ_BUILD_RES_ATTRS, fuzz_build_attrs);
  286. if (!fuzz_build_attrs.empty()) {
  287. GELOGD("%s has split, get ATTR_NAME_FUZZ_BUILD_RES_ATTRS directly.", op_desc->GetName().c_str());
  288. return SUCCESS;
  289. } else {
  290. GELOGW("%s build with fuzz build pattern, but not set ATTR_NAME_FUZZ_BUILD_RES_ATTRS.", op_desc->GetName().c_str());
  291. }
  292. return SUCCESS;
  293. }
  294. static bool HasShapeRange(const vector<GeTensor> &inputs) {
  295. for (const auto &input : inputs) {
  296. vector<pair<int64_t, int64_t>> shape_range;
  297. (void)input.GetTensorDesc().GetShapeRange(shape_range);
  298. if (!shape_range.empty()) {
  299. GELOGD("Has set shape range.");
  300. return true;
  301. }
  302. }
  303. return false;
  304. }
  305. class GeGenerator::Impl {
  306. public:
  307. Impl(OmgContext &omg_context) : omg_context_(omg_context) {}
  308. ~Impl() = default;
  309. Status BuildModel(const Graph &graph, const vector<GeTensor> &inputs, GeRootModelPtr &ge_models);
  310. Status SaveModel(const string &file_name_prefix, GeModelPtr &models, ModelBufferData &model);
  311. Status SaveRootModel(const string &file_name_prefix, GeRootModelPtr &model, ModelBufferData &model_buff);
  312. Status SaveParams(GeModelPtr &ge_model, const string &type, const map<string, GeAttrValue> &attrs,
  313. const vector<GeTensor> &inputs, const vector<GeTensor> &outputs);
  314. Status GenerateInfershapeGraph(const Graph &graph);
  315. OmgContext &omg_context_;
  316. GraphManager graph_manager_;
  317. SaveParam save_param_;
  318. bool is_offline_ = true;
  319. bool is_singleop_unregistered_ = false;
  320. std::string build_mode_;
  321. std::string build_step_;
  322. static std::mutex mutex_;
  323. private:
  324. static std::string Trim(const std::string &str);
  325. bool ParseVersion(const std::string &line, std::string &version);
  326. bool GetVersionFromPath(const std::string &file_path, std::string &version);
  327. bool SetAtcVersionInfo(AttrHolder &obj);
  328. bool SetOppVersionInfo(AttrHolder &obj);
  329. bool SetOmSystemInfo(AttrHolder &obj);
  330. };
  331. Status GeGenerator::Initialize(const map<string, string> &options) {
  332. return Initialize(options, domi::GetContext());
  333. }
  334. Status GeGenerator::Initialize(const map<string, string> &options, OmgContext &omg_context) {
  335. impl_ = ge::MakeShared<Impl>(omg_context);
  336. if (impl_ == nullptr) {
  337. GELOGE(MEMALLOC_FAILED, "Make shared failed");
  338. return MEMALLOC_FAILED;
  339. }
  340. ErrorManager::GetInstance().SetStage(ErrorMessage::kInitialize, ErrorMessage::kOpsProtoInit);
  341. string opsproto_path;
  342. GetOpsProtoPath(opsproto_path);
  343. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  344. OpsProtoManager *manager = OpsProtoManager::Instance();
  345. map<string, string> option_tmp;
  346. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  347. (void)manager->Initialize(option_tmp);
  348. Status ret = impl_->graph_manager_.Initialize(options);
  349. if (ret != SUCCESS) {
  350. GELOGE(GE_GENERATOR_GRAPH_MANAGER_INIT_FAILED, "Graph manager initialize failed.");
  351. return GE_GENERATOR_GRAPH_MANAGER_INIT_FAILED;
  352. }
  353. // get ek file
  354. auto iter = options.find(EK_FILE);
  355. if (iter != options.end()) {
  356. impl_->save_param_.ek_file = iter->second;
  357. }
  358. // get cert file
  359. iter = options.find(CERT_FILE);
  360. if (iter != options.end()) {
  361. impl_->save_param_.cert_file = iter->second;
  362. }
  363. // get hw key file
  364. iter = options.find(HW_KEY_FILE);
  365. if (iter != options.end()) {
  366. impl_->save_param_.hw_key_file = iter->second;
  367. }
  368. // get private file
  369. iter = options.find(PRIVATE_KEY_FILE);
  370. if (iter != options.end()) {
  371. impl_->save_param_.pri_key_file = iter->second;
  372. }
  373. // get build mode
  374. iter = options.find(BUILD_MODE);
  375. if (iter != options.end()) {
  376. impl_->build_mode_ = iter->second;
  377. }
  378. // get build step
  379. iter = options.find(BUILD_STEP);
  380. if (iter != options.end()) {
  381. impl_->build_step_ = iter->second;
  382. }
  383. return SUCCESS;
  384. }
  385. Status GeGenerator::Finalize() {
  386. ErrorManager::GetInstance().SetStage(ErrorMessage::kFinalize, ErrorMessage::kFinalize);
  387. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  388. Status ret = impl_->graph_manager_.Finalize();
  389. if (ret != SUCCESS) {
  390. GELOGE(GE_GENERATOR_GRAPH_MANAGER_FINALIZE_FAILED, "Graph manager finalize failed.");
  391. return GE_GENERATOR_GRAPH_MANAGER_FINALIZE_FAILED;
  392. }
  393. return SUCCESS;
  394. }
  395. Status GeGenerator::GenerateOfflineModel(const Graph &graph, const string &file_name_prefix,
  396. const vector<GeTensor> &inputs) {
  397. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  398. GELOGI("Start to generate offline model.");
  399. ModelBufferData model;
  400. return GenerateModel(graph, file_name_prefix, inputs, model, true);
  401. }
  402. Status GeGenerator::GenerateOnlineModel(const Graph &graph, const vector<GeTensor> &inputs, ModelBufferData &model) {
  403. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  404. return GenerateModel(graph, "online", inputs, model, false);
  405. }
  406. Status GeGenerator::GenerateInfershapeGraph(const Graph &graph) {
  407. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  408. Status ret = impl_->GenerateInfershapeGraph(graph);
  409. if (ret != SUCCESS) {
  410. GELOGE(ret, "Dump infershape json failed");
  411. if (impl_->graph_manager_.Finalize() != SUCCESS) {
  412. GELOGE(FAILED, "graph_manager finalize fail.");
  413. }
  414. return ret;
  415. }
  416. GELOGI("Generate infer shape graph success");
  417. return SUCCESS;
  418. }
  // Out-of-class definition of the static mutex declared in GeGenerator::Impl.
  std::mutex GeGenerator::Impl::mutex_;
  420. // Remove the space and tab before and after the string
  421. std::string GeGenerator::Impl::Trim(const std::string &str) {
  422. if (str.empty()) {
  423. return str;
  424. }
  425. std::string::size_type start = str.find_first_not_of(" \t\r\n");
  426. if (start == std::string::npos) {
  427. return str;
  428. }
  429. std::string::size_type end = str.find_last_not_of(" \t\r\n") + 1;
  430. return str.substr(start, end);
  431. }
  432. // Parsing the command line
  433. bool GeGenerator::Impl::ParseVersion(const std::string &line, std::string &version) {
  434. std::string flag = "Version=";
  435. std::string temp = Trim(line);
  436. if (temp.empty()) {
  437. GELOGW("line is empty.");
  438. return false;
  439. }
  440. std::string::size_type pos = temp.find(flag);
  441. if (pos == std::string::npos) {
  442. GELOGW("Incorrect line [%s], it must include [%s].", line.c_str(), flag.c_str());
  443. return false;
  444. }
  445. if (temp.size() == flag.size()) {
  446. GELOGW("version information is empty. %s", line.c_str());
  447. return false;
  448. }
  449. version = temp.substr(pos + flag.size());
  450. return true;
  451. }
  452. bool GeGenerator::Impl::GetVersionFromPath(const std::string &file_path, std::string &version) {
  453. // Normalize the path
  454. string resolved_file_path = RealPath(file_path.c_str());
  455. if (resolved_file_path.empty()) {
  456. GELOGW("Invalid input file path [%s], make sure that the file path is correct.", file_path.c_str());
  457. return false;
  458. }
  459. std::ifstream fs(resolved_file_path, std::ifstream::in);
  460. if (!fs.is_open()) {
  461. GELOGW("Open %s failed.", file_path.c_str());
  462. return false;
  463. }
  464. std::string line;
  465. if (getline(fs, line)) {
  466. if (!ParseVersion(line, version)) {
  467. GELOGW("Parse version failed. content is [%s].", line.c_str());
  468. fs.close();
  469. return false;
  470. }
  471. } else {
  472. GELOGW("No version information found in the file path:%s", file_path.c_str());
  473. fs.close();
  474. return false;
  475. }
  476. fs.close(); // close the file
  477. return true;
  478. }
  479. // Set package version information in the model
  480. bool GeGenerator::Impl::SetAtcVersionInfo(AttrHolder &obj) {
  481. std::string path_base = ge::GELib::GetPath();
  482. path_base = path_base.substr(0, path_base.rfind('/'));
  483. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  484. std::string version_path = path_base + "version.info";
  485. std::string version;
  486. if (!GetVersionFromPath(version_path, version)) {
  487. GELOGW("Get atc version information failed!");
  488. return false;
  489. }
  490. // set version info
  491. if (!ge::AttrUtils::SetStr(obj, ATTR_MODEL_ATC_VERSION, version)) {
  492. GELOGW("Ge model set atc version failed!");
  493. return false;
  494. }
  495. return true;
  496. }
  497. // Set package version information in the model
  498. bool GeGenerator::Impl::SetOppVersionInfo(AttrHolder &obj) {
  499. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  500. if (path_env == nullptr) {
  501. GELOGW("Get environment variable ASCEND_OPP_PATH failed!");
  502. return false;
  503. }
  504. std::string version_path = path_env;
  505. version_path += "/version.info";
  506. std::string version;
  507. if (!GetVersionFromPath(version_path, version)) {
  508. GELOGW("Get opp version information failed!");
  509. return false;
  510. }
  511. // set version info
  512. if (!ge::AttrUtils::SetStr(obj, ATTR_MODEL_OPP_VERSION, version)) {
  513. GELOGW("Ge model set opp version failed!");
  514. return false;
  515. }
  516. return true;
  517. }
  518. bool GeGenerator::Impl::SetOmSystemInfo(AttrHolder &obj) {
  519. std::string soc_version;
  520. (void)ge::GetContext().GetOption(ge::SOC_VERSION, soc_version);
  521. GELOGI("SetOmSystemInfo soc_version: %s", soc_version.c_str());
  522. if (!ge::AttrUtils::SetStr(obj, "soc_version", soc_version)) {
  523. GELOGW("SetStr of soc_version failed.");
  524. return false;
  525. }
  526. std::string framework_type;
  527. (void)ge::GetContext().GetOption(ge::FRAMEWORK_TYPE, framework_type);
  528. GELOGI("SetOmSystemInfo framework_type: %s", framework_type.c_str());
  529. auto iter = ge::kFwkTypeToStr.find(framework_type);
  530. if (iter == ge::kFwkTypeToStr.end()) {
  531. GELOGW("Can not find framework_type in the map.");
  532. return false;
  533. }
  534. if (!ge::AttrUtils::SetStr(obj, "framework_type", iter->second)) {
  535. GELOGW("SetStr of framework_type failed.");
  536. return false;
  537. }
  538. return true;
  539. }
  540. Status GeGenerator::SetModelNameForDump(const GeRootModelPtr &ge_root_model) {
  541. bool is_unknown_shape = false;
  542. Status ret = ge_root_model->CheckIsUnknownShape(is_unknown_shape);
  543. if (ret != SUCCESS) {
  544. GELOGE(FAILED, "[Check][IsUnknownShape]Check root model is unknown shape failed, model id:%u",
  545. ge_root_model->GetModelId());
  546. REPORT_CALL_ERROR("E19999", "Check root model is unknown shape failed, model id:%u",
  547. ge_root_model->GetModelId());
  548. return FAILED;
  549. }
  550. GeModelPtr model_root = nullptr;
  551. if (is_unknown_shape) {
  552. model_root = MakeShared<GeModel>();
  553. GE_CHECK_NOTNULL(model_root);
  554. model_root->SetGraph(GraphUtils::CreateGraphFromComputeGraph(ge_root_model->GetRootGraph()));
  555. ge_root_model->SetSubgraphInstanceNameToModel(ge_root_model->GetRootGraph()->GetName(), model_root);
  556. }
  557. ModelHelper model_helper;
  558. string model_name;
  559. GE_CHECK_NOTNULL(ge_root_model->GetRootGraph());
  560. Status name_ret = model_helper.GetModelNameFromMergedGraphName(ge_root_model->GetRootGraph()->GetName(),
  561. model_name);
  562. if (name_ret != SUCCESS) {
  563. ErrorManager::GetInstance().ATCReportErrMessage("E10000", {"parameter"}, {"output"});
  564. GELOGE(FAILED, "[Check][GetModelNameStep]Get model_name failed. Param --output is invalid, root graph name: %s",
  565. ge_root_model->GetRootGraph()->GetName().c_str());
  566. return PARAM_INVALID;
  567. }
  568. map<string, GeModelPtr> name_to_ge_model = ge_root_model->GetSubgraphInstanceNameToModel();
  569. GeModelPtr &ge_model = name_to_ge_model[ge_root_model->GetRootGraph()->GetName()];
  570. GE_CHECK_NOTNULL(ge_model);
  571. ge_model->SetName(model_name);
  572. return SUCCESS;
  573. }
  574. Status GeGenerator::GenerateModel(const Graph &graph, const string &file_name_prefix, const vector<GeTensor> &inputs,
  575. ModelBufferData &model, bool is_offline) {
  576. rtContext_t ctx = nullptr;
  577. auto rt = rtCtxGetCurrent(&ctx);
  578. if (rt != RT_ERROR_NONE) {
  579. GELOGD("Current ctx is null.");
  580. ctx = nullptr;
  581. }
  582. GeRootModelPtr ge_root_model = nullptr;
  583. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  584. impl_->is_offline_ = is_offline;
  585. Status ret = impl_->BuildModel(graph, inputs, ge_root_model);
  586. if (ret != SUCCESS) {
  587. GELOGE(ret, "Build model failed.");
  588. if (impl_->graph_manager_.Finalize() != SUCCESS) {
  589. GELOGE(FAILED, "graph_manager finalize fail.");
  590. }
  591. return ret;
  592. }
  593. /// BUILD_MODE_TUNING with BUILD_STEP_BEFORE_UB_MATCH no need save model;
  594. /// BUILD_MODE_TUNING with BUILD_STEP_AFTER_BUILDER no need save model;
  595. /// BUILD_MODE_TUNING with BUILD_STEP_AFTER_BUILDER_SUB no need save model.
  596. if ((impl_->build_mode_ == BUILD_MODE_TUNING) &&
  597. (impl_->build_step_ == BUILD_STEP_BEFORE_UB_MATCH || impl_->build_step_ == BUILD_STEP_AFTER_BUILDER ||
  598. impl_->build_step_ == BUILD_STEP_AFTER_BUILDER_SUB)) {
  599. GELOGI("Build mode:%s with step:%s no need SaveModel.",
  600. impl_->build_mode_.c_str(),
  601. impl_->build_step_.c_str());
  602. return SUCCESS;
  603. }
  604. GE_CHECK_NOTNULL(ge_root_model);
  605. ret = SetModelNameForDump(ge_root_model);
  606. if (ret != SUCCESS) {
  607. return ret;
  608. }
  609. ret = impl_->SaveRootModel(file_name_prefix, ge_root_model, model);
  610. if (ret != SUCCESS) {
  611. GELOGE(ret, "Save model failed");
  612. if (impl_->graph_manager_.Finalize() != SUCCESS) {
  613. GELOGE(FAILED, "graph_manager finalize fail.");
  614. }
  615. return ret;
  616. }
  617. if (ctx != nullptr) {
  618. (void)rtCtxSetCurrent(ctx);
  619. }
  620. return SUCCESS;
  621. }
  622. namespace {
  623. bool IsNeedConnectInputOpForSingleOp(GeTensorDesc &tensor_desc) {
  624. bool is_need = true;
  625. // format and dtype is all reserved, stand for Optional input. When singleop scene
  626. if (tensor_desc.GetFormat() == FORMAT_RESERVED && tensor_desc.GetDataType() == DT_UNDEFINED) {
  627. is_need = false;
  628. }
  629. return is_need;
  630. }
  631. Status CheckDynamicSupport(GeModelPtr &ge_model, const ComputeGraphPtr &graph) {
  632. bool support_dynamic = true;
  633. bool is_dynamic = false;
  634. for (const auto &node : graph->GetDirectNode()) {
  635. GE_CHECK_NOTNULL(node);
  636. auto op_desc = node->GetOpDesc();
  637. GE_CHECK_NOTNULL(op_desc);
  638. if (op_desc->GetOpEngineName() != kAIcoreEngine) {
  639. continue;
  640. }
  641. if (AttrUtils::HasAttr(op_desc, kAttrSupportDynamicShape)) {
  642. is_dynamic = true;
  643. (void) AttrUtils::GetBool(op_desc, kAttrSupportDynamicShape, support_dynamic);
  644. if (!support_dynamic) {
  645. GELOGW("Node[%s] doesn't support dynamic shape.", node->GetName().c_str());
  646. break;
  647. }
  648. }
  649. }
  650. if (is_dynamic) {
  651. (void) AttrUtils::SetBool(ge_model, kAttrSupportDynamicShape, support_dynamic);
  652. }
  653. return SUCCESS;
  654. }
  655. }
  656. bool GeGenerator::CheckNoAicore(const ComputeGraphPtr &graph) {
  657. for (const auto &node : graph->GetDirectNode()) {
  658. if (node == nullptr) {
  659. continue;
  660. }
  661. auto op_desc = node->GetOpDesc();
  662. if (op_desc == nullptr) {
  663. continue;
  664. }
  665. if (op_desc->GetOpEngineName() == kAIcoreEngine) {
  666. return false;
  667. }
  668. }
  669. return true;
  670. }
  671. void GeGenerator::RemoveConst(const vector<GeTensor> &inputs, vector<GeTensor> &outputs) {
  672. for (auto &input : inputs) {
  673. GeTensorDesc input_desc = input.GetTensorDesc();
  674. bool is_const = false;
  675. (void)AttrUtils::GetBool(input_desc, CONST_ATTR_NAME_INPUT, is_const);
  676. bool is_optional = IsOptional(input_desc);
  677. if (!is_optional && !is_const) {
  678. outputs.emplace_back(input);
  679. }
  680. }
  681. }
  682. Status GeGenerator::CheckForSingleOp(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  683. const vector<GeTensor> &outputs) {
  684. GE_CHECK_NOTNULL_EXEC(op_desc, return PARAM_INVALID);
  685. if (!inputs.empty() && (inputs.size() != op_desc->GetAllInputsSize())) {
  686. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  687. {op_desc->GetName(), op_desc->GetType(), "inputs size" + FmtToStr(op_desc->GetAllInputsSize()),
  688. "tensor size is " + FmtToStr(inputs.size())});
  689. GELOGE(PARAM_INVALID, "Tensor size: %zu, Inputs size: %zu", inputs.size(), op_desc->GetAllInputsSize());
  690. return PARAM_INVALID;
  691. }
  692. if (!outputs.empty() && (outputs.size() != op_desc->GetOutputsSize())) {
  693. ErrorManager::GetInstance().ATCReportErrMessage("E14001", {"opname", "optype", "value", "reason"},
  694. {op_desc->GetName(), op_desc->GetType(), "outputs size" + FmtToStr(op_desc->GetOutputsSize()),
  695. "tensor size is " + FmtToStr(outputs.size())});
  696. GELOGE(PARAM_INVALID, "Tensor size: %zu, Outputs size: %zu", outputs.size(), op_desc->GetOutputsSize());
  697. return PARAM_INVALID;
  698. }
  699. return SUCCESS;
  700. }
  701. Status GeGenerator::BuildSingleOp(OpDescPtr &op_desc, const vector<GeTensor> &inputs, const vector<GeTensor> &outputs,
  702. const string &model_file_name, OpEngineType engine_type, ModelBufferData &model_buff,
  703. bool is_offline, int32_t compile_flag) {
  704. GELOGD("Inputs size is %zu, outputs size is %zu.", inputs.size(), outputs.size());
  705. GE_CHECK_NOTNULL_EXEC(impl_, return PARAM_INVALID);
  706. impl_->is_offline_ = is_offline;
  707. (void)AttrUtils::SetBool(op_desc, ATTR_SINGLE_OP_SCENE, true);
  708. if (CheckForSingleOp(op_desc, inputs, outputs) != SUCCESS) {
  709. GELOGE(PARAM_INVALID, "input param is invalid when build single op!");
  710. return PARAM_INVALID;
  711. }
  712. OmgContext &omg_context = (impl_ == nullptr) ? domi::GetContext() : impl_->omg_context_;
  713. omg_context.is_dynamic_input = ContainsDynamicInpus(*op_desc);
  714. if (op_desc->HasAttr(ATTR_NAME_UNREGST_OPPATH)) {
  715. impl_->is_singleop_unregistered_ = true;
  716. }
  717. // 0. Save original attributes.
  718. OpDescPtr op_desc_tmp = AttrUtils::CloneOpDesc(op_desc);
  719. GE_CHECK_NOTNULL(op_desc_tmp);
  720. bool fuzz_compile_flag = false;
  721. if (!HasShapeRange(inputs) && compile_flag == kFuzzBuildPattern) {
  722. fuzz_compile_flag = true;
  723. }
  724. if (!AttrUtils::SetBool(op_desc, ATTR_NAME_FUZZ_BUILD, fuzz_compile_flag)) {
  725. GELOGE(FAILED, "[Set][ATTR_NAME_FUZZ_BUILD] Failed to set attr for %s.", op_desc->GetName().c_str());
  726. return FAILED;
  727. }
  728. impl_->omg_context_.fuzz_compile_flag = fuzz_compile_flag;
  729. // 1. Create ComputeGraph.
  730. string name = ge::CurrentTimeInStr() + "_" + model_file_name;
  731. Graph graph;
  732. GE_CHK_STATUS(BuildSingleOpGraph(op_desc, inputs, outputs, name, graph), "make graph fail.");
  733. // 2. check engine type when compile online
  734. if (model_file_name == kFileNameSuffix) {
  735. auto comp_graph = GraphUtils::GetComputeGraph(graph);
  736. GE_CHECK_NOTNULL(comp_graph);
  737. auto node = comp_graph->FindNode(op_desc->GetName());
  738. Status ret = CheckEngineTypeSupport(node, engine_type);
  739. if (ret != SUCCESS) {
  740. GELOGE(ret, "[Check][EngineType]value:%d for node:%s not support", engine_type, node->GetName().c_str());
  741. return ret;
  742. }
  743. }
  744. GELOGI("ATC parser success in single op build.");
  745. GeRootModelPtr ge_root_model = nullptr;
  746. vector<GeTensor> data_inputs;
  747. RemoveConst(inputs, data_inputs);
  748. GE_CHK_STATUS_RET_NOLOG(impl_->BuildModel(graph, data_inputs, ge_root_model));
  749. map<string, GeAttrValue> op_attrs = op_desc_tmp->GetAllAttrs();
  750. GE_CHECK_NOTNULL(ge_root_model);
  751. GE_CHECK_NOTNULL(ge_root_model->GetRootGraph());
  752. map<string, GeModelPtr> name_to_ge_model = ge_root_model->GetSubgraphInstanceNameToModel();
  753. if (name_to_ge_model.empty()) {
  754. GELOGE(PARAM_INVALID, "GetSubgraphInstanceNameToModel is empty.");
  755. return PARAM_INVALID;
  756. }
  757. const ComputeGraphPtr root_graph = ge_root_model->GetRootGraph();
  758. GeModelPtr &ge_model = name_to_ge_model.begin()->second;
  759. GE_CHK_STATUS_RET_NOLOG(CheckDynamicSupport(ge_model, root_graph));
  760. GELOGI("After build model, The opType in op_desc_tmp is [%s]", op_desc_tmp->GetType().c_str());
  761. bool all_shape = false;
  762. (void)AttrUtils::GetBool(op_desc, kAicpuAllshape, all_shape);
  763. if (all_shape && CheckNoAicore(root_graph)) {
  764. GELOGD("Get aicpu all_shape kernel!");
  765. vector<GeTensor> inputs_dynamic;
  766. vector<GeTensor> outputs_dynamic;
  767. GE_CHK_STATUS_RET_NOLOG(ResetTensorVecShape(inputs, inputs_dynamic));
  768. GE_CHK_STATUS_RET_NOLOG(ResetTensorVecShape(outputs, outputs_dynamic));
  769. GE_CHK_STATUS_RET_NOLOG(
  770. impl_->SaveParams(ge_model, op_desc_tmp->GetType(), op_attrs, inputs_dynamic, outputs_dynamic));
  771. } else if (fuzz_compile_flag) {
  772. GELOGD("Get fuzz build result of %s.", op_desc->GetName().c_str());
  773. (void)AttrUtils::SetInt(ge_model, ATTR_NAME_BUILD_MODE, fuzz_compile_flag);
  774. GeAttrValue::LIST_NAMED_ATTRS fuzz_build_attrs;
  775. if (GetFuzzBuildAttrs(op_desc, ge_root_model, fuzz_build_attrs) != SUCCESS) {
  776. GELOGE(FAILED, "[Get][FuzzRet]Failed to get fuzz build result of %s.", op_desc->GetName().c_str());
  777. return FAILED;
  778. }
  779. if (!fuzz_build_attrs.empty()) {
  780. GE_CHK_BOOL_EXEC(AttrUtils::SetListNamedAttrs(ge_model, ATTR_NAME_FUZZ_BUILD_RES_ATTRS, fuzz_build_attrs),
  781. return FAILED, "Set ATTR_NAME_FUZZ_BUILD_RES_ATTRS failed.");
  782. }
  783. GE_CHK_STATUS_RET_NOLOG(impl_->SaveParams(ge_model, op_desc_tmp->GetType(), op_attrs, inputs, outputs));
  784. } else {
  785. GE_CHK_STATUS_RET_NOLOG(impl_->SaveParams(ge_model, op_desc_tmp->GetType(), op_attrs, inputs, outputs));
  786. }
  787. GELOGI("Start save GeModel to Model buffer");
  788. GE_CHK_STATUS_RET_NOLOG(impl_->SaveModel(model_file_name, ge_model, model_buff));
  789. return SUCCESS;
  790. }
  791. /**
  792. * @ingroup ge
  793. * @brief Compiling a single operator into an offline model
  794. * @param [in] OpDescPtr &op_desc: Operator description info that needs to be compiled into an offline model file
  795. * @param [in] vector<GeTensor> &inputs: Operator input data description information.
  796. * @param [in] vector<GeTensor> &outputs: Operator output data description information.
  797. * @param [in] const string &model_file_name: Offline model filename.
  798. * @param [in] compile_flag: op build flag from atc
  799. * @return SUCCESS handle successfully / others handle failed
  800. */
  801. Status GeGenerator::BuildSingleOpModel(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  802. const vector<GeTensor> &outputs, const string &model_file_name,
  803. int32_t compile_flag) {
  804. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  805. GELOGI("Start to build single op offline model, input size: %zu, output size: %zu", inputs.size(), outputs.size());
  806. ModelBufferData model_buff;
  807. OpEngineType engine_type = ENGINE_SYS;
  808. Status status = BuildSingleOp(op_desc, inputs, outputs, model_file_name, engine_type, model_buff, true, compile_flag);
  809. GELOGI("Finish build single offline model, status: %u", status);
  810. return status;
  811. }
  812. /**
  813. * @ingroup ge
  814. * @brief Compiling a single operator into online buffer
  815. * @param [in] OpDescPtr &op_desc: Operator description info that needs to be compiled into an offline model file
  816. * @param [in] vector<GeTensor> &inputs: Operator input data description information.
  817. * @param [in] vector<GeTensor> &outputs: Operator output data description information.
  818. * @param [in] engine_type: specific engine.
  819. * @param [in] compile_flag: op build flag, compile flag by acl
  820. * @param [out] ModelBufferData &Model_buff: Model_buff: model buffer of the op.
  821. * @return SUCCESS handle successfully / others handle failed
  822. */
  823. Status GeGenerator::BuildSingleOpModel(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  824. const vector<GeTensor> &outputs, OpEngineType engine_type,
  825. ModelBufferData &model_buff) {
  826. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  827. GELOGI("Start to build single op online, input size: %zu, output size: %zu", inputs.size(), outputs.size());
  828. Status status = BuildSingleOp(op_desc, inputs, outputs, kFileNameSuffix, engine_type, model_buff, false);
  829. GELOGI("Finish build single online model, status: %u", status);
  830. return status;
  831. }
  832. Status GeGenerator::BuildSingleOpModel(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  833. const vector<GeTensor> &outputs, OpEngineType engine_type, int32_t compile_flag,
  834. ModelBufferData &model_buff) {
  835. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  836. GELOGI("Start to build single op online, input size: %zu, output size: %zu", inputs.size(), outputs.size());
  837. Status status = BuildSingleOp(op_desc, inputs, outputs, kFileNameSuffix, engine_type, model_buff, false,
  838. compile_flag);
  839. GELOGI("Finish build single online model, status: %u", status);
  840. return status;
  841. }
  842. Status GeGenerator::BuildSingleOpGraph(OpDescPtr &op_desc, const vector<GeTensor> &inputs,
  843. const vector<GeTensor> &outputs, std::string graph_name, Graph &graph) {
  844. ge::ComputeGraphPtr compute_graph = MakeShared<ComputeGraph>(graph_name);
  845. GE_CHECK_NOTNULL_EXEC(compute_graph, return INTERNAL_ERROR);
  846. // 1. Add Node to ComputeGraph.
  847. NodePtr op_node = compute_graph->AddNode(op_desc);
  848. GE_CHECK_NOTNULL_EXEC(op_node, return INTERNAL_ERROR);
  849. // 2. Create InputData node.
  850. int32_t arg_index = 0;
  851. int32_t data_index = 0;
  852. if (inputs.empty()) {
  853. for (const auto &input_desc : op_desc->GetAllInputsDescPtr()) {
  854. GE_CHECK_NOTNULL_EXEC(input_desc, return INTERNAL_ERROR);
  855. if (!IsNeedConnectInputOpForSingleOp(*input_desc)) {
  856. continue;
  857. }
  858. GE_CHK_STATUS_RET_NOLOG(AddInputs(compute_graph, op_node, *input_desc, arg_index, false, data_index));
  859. arg_index++;
  860. }
  861. } else {
  862. for (const auto &in_desc : inputs) {
  863. GE_CHK_STATUS_RET_NOLOG(AddInputs(compute_graph, op_node, in_desc.GetTensorDesc(), arg_index, true, data_index));
  864. arg_index++;
  865. }
  866. }
  867. // 3. Create Output node.
  868. if (!outputs.empty()) {
  869. GE_CHK_STATUS_RET_NOLOG(AddOutputs(compute_graph, op_node, outputs));
  870. }
  871. // dump ComputeGraph node.
  872. compute_graph->Dump();
  873. graph = ge::GraphUtils::CreateGraphFromComputeGraph(compute_graph);
  874. return SUCCESS;
  875. }
  876. Status GeGenerator::Impl::SaveParams(GeModelPtr &ge_model, const string &type, const map<string, GeAttrValue> &attrs,
  877. const vector<GeTensor> &inputs, const vector<GeTensor> &outputs) {
  878. GE_CHECK_NOTNULL_EXEC(ge_model, return PARAM_INVALID);
  879. GE_CHK_BOOL_EXEC_NOLOG(graph_manager_.SaveParams(*ge_model, type, attrs, inputs, outputs) == SUCCESS,
  880. (void)graph_manager_.Finalize();
  881. return FAILED);
  882. return SUCCESS;
  883. }
  884. Status GeGenerator::Impl::SaveModel(const string &file_name_prefix, GeModelPtr &model, ModelBufferData &model_buff) {
  885. // set atc version
  886. if (!SetAtcVersionInfo(*(model.get()))) {
  887. GELOGW("SetPackageVersionInfo of atc failed!");
  888. }
  889. // set opp version
  890. if (!SetOppVersionInfo(*(model.get()))) {
  891. GELOGW("SetPackageVersionInfo of ops failed!");
  892. }
  893. ModelHelper model_helper;
  894. model_helper.SetSaveMode(is_offline_);
  895. Status ret = model_helper.SaveToOmModel(model, save_param_, file_name_prefix, model_buff);
  896. if (ret != SUCCESS) {
  897. GELOGE(ret, "Save to om model failed");
  898. return ret;
  899. }
  900. return SUCCESS;
  901. }
  902. Status GeGenerator::Impl::SaveRootModel(const string &file_name_prefix, GeRootModelPtr &ge_root_model,
  903. ModelBufferData &model_buff) {
  904. bool is_unknown_shape = false;
  905. auto ret = ge_root_model->CheckIsUnknownShape(is_unknown_shape);
  906. if (ret != SUCCESS) {
  907. GELOGE(FAILED, "Check root model is unkonwn shape failed");
  908. return FAILED;
  909. }
  910. GELOGD("begin save root model, cur model is unkonwn shape model ? : %d", is_unknown_shape);
  911. GE_CHK_BOOL_EXEC(!ge_root_model->GetSubgraphInstanceNameToModel().empty(), return FAILED,
  912. "ge root model has no sub model")
  913. GeModelPtr model_root = nullptr;
  914. if (is_unknown_shape) {
  915. auto name_to_ge_model = ge_root_model->GetSubgraphInstanceNameToModel();
  916. model_root = name_to_ge_model[ge_root_model->GetRootGraph()->GetName()];
  917. } else {
  918. model_root = ge_root_model->GetSubgraphInstanceNameToModel().begin()->second;
  919. }
  920. GE_CHECK_NOTNULL(model_root);
  921. // set atc version
  922. if (!SetAtcVersionInfo(*(model_root.get()))) {
  923. GELOGW("SetPackageVersionInfo of atc failed!");
  924. }
  925. // set opp version
  926. if (!SetOppVersionInfo(*(model_root.get()))) {
  927. GELOGW("SetPackageVersionInfo of ops failed!");
  928. }
  929. if (!SetOmSystemInfo(*(model_root.get()))) {
  930. GELOGW("SetOmsystemInfo failed!");
  931. }
  932. ModelHelper model_helper;
  933. model_helper.SetSaveMode(is_offline_);
  934. ret = model_helper.SaveToOmRootModel(ge_root_model, save_param_, file_name_prefix, model_buff, is_unknown_shape);
  935. if (ret != SUCCESS) {
  936. GELOGE(ret, "Save to om model failed");
  937. return ret;
  938. }
  939. return SUCCESS;
  940. }
  941. Status GeGenerator::Impl::BuildModel(const Graph &graph, const vector<GeTensor> &inputs,
  942. GeRootModelPtr &ge_root_model) {
  943. static std::atomic<GraphId> atomic_graph_id(0);
  944. auto graph_id = atomic_graph_id.fetch_add(1);
  945. const std::map<std::string, std::string> options;
  946. Status ret = graph_manager_.AddGraph(graph_id, graph, options, omg_context_);
  947. if (ret != SUCCESS) {
  948. GELOGE(GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED, "GraphManager add graph fail, graph id: %u", graph_id);
  949. (void)graph_manager_.Finalize();
  950. return GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED;
  951. }
  952. graph_manager_.SetOptionsRunGraphFlag(false);
  953. static std::atomic<uint64_t> atomic_session_id(0);
  954. auto session_id = atomic_session_id.fetch_add(1);
  955. // This is a temporary add for graph with variable
  956. auto version = static_cast<int32_t>(SessionVersion::ClOUD_VERSION);
  957. ret = VarManager::Instance(session_id)->Init(version, session_id, kDefaultDeviceId, kDefaultJobId);
  958. GELOGI("Start init var instance, session_id %lu", session_id);
  959. if (ret != SUCCESS) {
  960. GELOGW("Failed init var instance, session_id %lu", session_id);
  961. }
  962. if (is_singleop_unregistered_) {
  963. ret = graph_manager_.BuildGraphForUnregisteredOp(graph_id, inputs, ge_root_model, session_id);
  964. } else {
  965. ret = graph_manager_.BuildGraph(graph_id, inputs, ge_root_model, session_id);
  966. }
  967. ErrorManager::GetInstance().SetStage(ErrorMessage::kModelCompile, ErrorMessage::kOther);
  968. if (ret != SUCCESS) {
  969. GELOGE(GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED, "GraphManager build graph fail, graph id: %u", graph_id);
  970. ret = GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED;
  971. }
  972. RtContextUtil::GetInstance().DestroyRtContexts(session_id);
  973. Analyzer::GetInstance()->DestroySessionJsonObject(session_id);
  974. VarManagerPool::Instance().RemoveVarManager(session_id);
  975. return ret;
  976. }
  977. Status GeGenerator::Impl::GenerateInfershapeGraph(const Graph &graph) {
  978. static std::atomic<GraphId> atomic_graph_id(0);
  979. auto graph_id = atomic_graph_id.fetch_add(1);
  980. const std::map<std::string, std::string> options;
  981. Status ret = graph_manager_.AddGraph(graph_id, graph, options, omg_context_);
  982. if (ret != SUCCESS) {
  983. GELOGE(GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED, "GraphManager add graph failed, graph id: %u", graph_id);
  984. (void)graph_manager_.Finalize();
  985. return GE_GENERATOR_GRAPH_MANAGER_ADD_GRAPH_FAILED;
  986. }
  987. ret = graph_manager_.GenerateInfershapeGraph(graph_id);
  988. if (ret != SUCCESS) {
  989. GELOGE(GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED, "GraphManager generate graph failed");
  990. return GE_GENERATOR_GRAPH_MANAGER_BUILD_GRAPH_FAILED;
  991. }
  992. return SUCCESS;
  993. }
  994. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。