You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ge_ir_build.cc 30 kB

5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "external/ge/ge_ir_build.h"
  17. #include <vector>
  18. #include "common/auth/file_saver.h"
  19. #include "external/register/register_types.h"
  20. #include "framework/common/debug/ge_log.h"
  21. #include "framework/common/ge_inner_error_codes.h"
  22. #include "framework/common/string_util.h"
  23. #include "framework/common/types.h"
  24. #include "framework/common/util.h"
  25. #include "framework/omg/omg_inner_types.h"
  26. #include "framework/omg/omg_inner_types.h"
  27. #include "ge/ge_api_types.h"
  28. #include "generator/ge_generator.h"
  29. #include "graph/compute_graph.h"
  30. #include "graph/ge_tensor.h"
  31. #include "graph/utils/type_utils.h"
  32. #include "graph/ge_global_options.h"
  33. #include "init/gelib.h"
  34. #include "ir_build/atc_ir_common.h"
  35. #include "model/ge_model.h"
  36. #include "graph/shape_refiner.h"
  37. #include "graph/opsproto_manager.h"
  38. #include "inc/pass_manager.h"
  39. #include "graph/passes/net_output_pass.h"
  40. #include "graph/passes/data_pass.h"
  41. using std::string;
  42. using namespace std;
  43. namespace ge {
  namespace {
  // Option keys that Impl::Init adds to the build options with fixed values.
  const std::string IR_OPTION_TARGET{"target"};
  const std::string IR_OPTION_MODE{"mode"};
  // NOTE(review): no use of this delimiter is visible in this part of the file.
  const std::string IR_OP_CONF_DELIMITER{":"};
  // Fallback values applied when the caller leaves the matching option unset.
  const std::string IR_OPTION_LOG_LEVEL_DEFAULT{"default"};
  const std::string IR_OPTION_BUFFER_OPTIMIZE_DEFAULT{"l2_optimize"};
  const std::string IR_OPTION_DISABLE_REUSE_MEMORY_DEFAULT{"0"};
  const std::string IR_OPTION_ENABLE_COMPRESS_WEIGHT_DEFAULT{"false"};
  // Build-option keys consulted by Impl::UpdateDataOpAttr and Impl::CheckOptions.
  const std::string kInputShape{"input_shape"};
  const std::string kInputFormat{"input_format"};
  }  // namespace
  55. static graphStatus CheckGlobalOptions(std::map<std::string, std::string> &global_options) {
  56. // check param disable_reuse_memory
  57. std::string disable_reuse_memory = global_options.find(ge::ir_option::EXEC_DISABLE_REUSED_MEMORY) ==
  58. global_options.end()
  59. ? IR_OPTION_DISABLE_REUSE_MEMORY_DEFAULT
  60. : global_options[ge::ir_option::EXEC_DISABLE_REUSED_MEMORY];
  61. GE_CHK_BOOL_EXEC(ge::CheckDisableReuseMemoryParamValid(disable_reuse_memory) == ge::SUCCESS,
  62. return ge::GRAPH_PARAM_INVALID, "check disable_reuse_memory failed!");
  63. global_options[ge::ir_option::EXEC_DISABLE_REUSED_MEMORY] = disable_reuse_memory;
  64. // check buffer_optimize
  65. std::string buffer_optimize = global_options.find(ge::ir_option::BUFFER_OPTIMIZE) == global_options.end()
  66. ? IR_OPTION_BUFFER_OPTIMIZE_DEFAULT
  67. : global_options[ge::ir_option::BUFFER_OPTIMIZE];
  68. GE_CHK_BOOL_EXEC(ge::CheckBufferOptimizeParamValid(buffer_optimize) == ge::SUCCESS,
  69. return ge::GRAPH_PARAM_INVALID, "check buffer optimize failed!");
  70. global_options[ge::ir_option::BUFFER_OPTIMIZE] = buffer_optimize;
  71. // check enable_single_stream
  72. std::string enable_single_stream = global_options.find(ge::ir_option::ENABLE_SINGLE_STREAM) == global_options.end()
  73. ? ""
  74. : global_options[ge::ir_option::ENABLE_SINGLE_STREAM];
  75. GE_CHK_BOOL_EXEC(ge::CheckEnableSingleStreamParamValid(enable_single_stream) == ge::SUCCESS,
  76. return ge::GRAPH_PARAM_INVALID, "check enable single stream failed!");
  77. // check compress_weight
  78. std::string enable_compress_weight = global_options.find(ge::ir_option::ENABLE_COMPRESS_WEIGHT) ==
  79. global_options.end()
  80. ? IR_OPTION_ENABLE_COMPRESS_WEIGHT_DEFAULT
  81. : global_options[ge::ir_option::ENABLE_COMPRESS_WEIGHT];
  82. std::string compress_weight_conf = global_options.find(ge::ir_option::COMPRESS_WEIGHT_CONF) == global_options.end()
  83. ? ""
  84. : global_options[ge::ir_option::COMPRESS_WEIGHT_CONF];
  85. GE_CHK_BOOL_EXEC(ge::CheckCompressWeightParamValid(enable_compress_weight, compress_weight_conf) == ge::SUCCESS,
  86. return ge::GRAPH_PARAM_INVALID, "check compress weight failed!");
  87. global_options[ge::ir_option::ENABLE_COMPRESS_WEIGHT] = (enable_compress_weight == "true") ?
  88. ge::kEnableCompressWeightTrue :
  89. ge::kEnableCompressWeightFalse;
  90. // check optypelist_for_implmode and op_select_implmode
  91. std::string optypelist_for_implmode = global_options.find(ge::ir_option::OPTYPELIST_FOR_IMPLMODE) ==
  92. global_options.end()
  93. ? ""
  94. : global_options[ge::ir_option::OPTYPELIST_FOR_IMPLMODE];
  95. std::string op_select_implmode = global_options.find(ge::ir_option::OP_SELECT_IMPL_MODE) ==
  96. global_options.end()
  97. ? ""
  98. : global_options[ge::ir_option::OP_SELECT_IMPL_MODE];
  99. GE_CHK_BOOL_EXEC(
  100. ge::CheckImplmodeParamValid(optypelist_for_implmode, op_select_implmode) == ge::SUCCESS,
  101. return ge::GRAPH_PARAM_INVALID, "check optypelist_for_implmode and op_select_implmode failed!");
  102. global_options[ge::ir_option::OP_SELECT_IMPL_MODE] = op_select_implmode;
  103. // set precision mode default value
  104. std::string precision_mode = global_options.find(ge::ir_option::PRECISION_MODE) ==
  105. global_options.end()
  106. ? "force_fp16"
  107. : global_options[ge::ir_option::PRECISION_MODE];
  108. global_options[ge::ir_option::PRECISION_MODE] = precision_mode;
  109. return GRAPH_SUCCESS;
  110. }
  111. static void GetOpsProtoPath(string &opsproto_path) {
  112. GELOGI("Start to get ops proto path schedule.");
  113. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  114. if (path_env != nullptr) {
  115. string path = path_env;
  116. string file_path = RealPath(path.c_str());
  117. if (file_path.empty()) {
  118. GELOGE(FAILED, "File path %s is invalid.", path.c_str());
  119. return;
  120. }
  121. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  122. GELOGI("Get opsproto so path from env : %s", path.c_str());
  123. return;
  124. }
  125. string path_base = PluginManager::GetPath();
  126. GELOGI("path_base is %s", path_base.c_str());
  127. path_base = path_base.substr(0, path_base.rfind('/'));
  128. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  129. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  130. }
  131. static void LoadOpsProto() {
  132. string opsproto_path;
  133. GetOpsProtoPath(opsproto_path);
  134. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  135. OpsProtoManager *manager = OpsProtoManager::Instance();
  136. map<string, string> option_tmp;
  137. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  138. (void)manager->Initialize(option_tmp);
  139. }
  140. graphStatus aclgrphBuildInitializeImpl(std::map<std::string, std::string> &global_options) {
  141. GELOGD("Enter aclgrphInitialize start!");
  142. // check global options
  143. if (CheckGlobalOptions(global_options) != GRAPH_SUCCESS) {
  144. GELOGE(GRAPH_PARAM_INVALID, "Check global options falied!");
  145. return GRAPH_PARAM_INVALID;
  146. }
  147. // print global option map
  148. ge::PrintOptionMap(global_options, "global option");
  149. LoadOpsProto();
  150. std::shared_ptr<ge::GELib> instance_ptr = ge::GELib::GetInstance();
  151. if (instance_ptr == nullptr || !instance_ptr->InitFlag()) {
  152. GELOGI("aclgrphInitialize start!");
  153. auto ret = ge::GELib::Initialize(global_options);
  154. if (ret != ge::SUCCESS) {
  155. GELOGE(ret, "GE initialize failed!");
  156. return GRAPH_FAILED;
  157. }
  158. }
  159. GELOGW("gelib has been initialized!");
  160. std::string path_base = ge::GELib::GetPath();
  161. int ret = ErrorManager::GetInstance().Init(path_base);
  162. if (ret != 0) {
  163. DOMI_LOGE("ErrorManager init fail !");
  164. return GRAPH_FAILED;
  165. }
  166. return GRAPH_SUCCESS;
  167. }
  168. graphStatus aclgrphBuildInitialize(std::map<std::string, std::string> global_options) {
  169. return aclgrphBuildInitializeImpl(global_options);
  170. }
  171. graphStatus aclgrphBuildInitialize(std::map<AscendString, AscendString> &global_options) {
  172. std::map<std::string, std::string> tmp_global_options;
  173. for (auto &option : global_options) {
  174. if (option.first.GetString() == nullptr || option.second.GetString() == nullptr) {
  175. GELOGE(GRAPH_FAILED, "AclgrphBuildInitialize option is nullptr.");
  176. return GRAPH_FAILED;
  177. }
  178. std::string key = option.first.GetString();
  179. std::string val = option.second.GetString();
  180. tmp_global_options[key] = val;
  181. }
  182. return aclgrphBuildInitializeImpl(tmp_global_options);
  183. }
  184. void aclgrphBuildFinalize() {
  185. if (ge::GELib::GetInstance() != nullptr && ge::GELib::GetInstance()->InitFlag()) {
  186. (void)ge::GELib::GetInstance()->Finalize();
  187. return;
  188. }
  189. GELOGW("[Notice] gelib has not been initialized!do nothing!");
  190. }
  191. class Impl {
  192. public:
  193. Impl() {
  194. omg_context_ = domi::GetContext();
  195. omg_context_.format = domi::DOMI_TENSOR_ND;
  196. omg_context_.input_nodes_format_map.clear();
  197. omg_context_.output_formats.clear();
  198. omg_context_.user_input_dims.clear();
  199. omg_context_.input_dims.clear();
  200. omg_context_.op_conf_map.clear();
  201. omg_context_.out_nodes_map.clear();
  202. omg_context_.user_out_nodes.clear();
  203. omg_context_.net_format = domi::DOMI_TENSOR_RESERVED;
  204. omg_context_.type = domi::FRAMEWORK_RESERVED;
  205. omg_context_.run_mode = ONLY_PRE_CHECK;
  206. omg_context_.train_flag = false;
  207. omg_context_.output_type.clear();
  208. omg_context_.is_dynamic_input = false;
  209. omg_context_.dynamic_batch_size.clear();
  210. omg_context_.dynamic_image_size.clear();
  211. omg_context_.dynamic_dims.clear();
  212. };
  213. ~Impl() { (void)generator_.Finalize(); };
  214. graphStatus CheckOptions(const std::map<std::string, std::string> &options);
  215. graphStatus CreateInputsForIRBuild(const ge::Graph &graph, vector<ge::GeTensor> &inputs);
  216. graphStatus UpdateDataOpAttr(const Graph &graph);
  217. graphStatus Init(const Graph &graph, const std::map<std::string, std::string> &options);
  218. graphStatus BuildModel(const Graph &graph, const std::map<std::string, std::string> &options,
  219. ModelBufferData &ge_models);
  220. graphStatus InitDomiOmgContext(const string &input_shape, const string &input_format, const string &net_format,
  221. bool is_dynamic_input);
  222. static graphStatus InferShapePrepare(const ComputeGraphPtr &compute_graph);
  223. void SetRtSocVersion();
  224. void UpdateThreadContext();
  225. void LoadOpsProto();
  226. public:
  227. ge::GeGenerator generator_;
  228. std::map<std::string, std::string> options_;
  229. bool is_dynamic_input_ = false;
  230. OmgContext omg_context_;
  231. };
  232. graphStatus Impl::InferShapePrepare(const ComputeGraphPtr &compute_graph) {
  233. GE_CHECK_NOTNULL(compute_graph);
  234. PassManager prepare_infershape;
  235. prepare_infershape.AddPass("PrepareNetoutput", new(std::nothrow) NetOutputPass);
  236. prepare_infershape.AddPass("PrepareSubGraphReflection", new (std::nothrow) DataPass);
  237. auto ret = prepare_infershape.Run(compute_graph);
  238. if ((ret != SUCCESS) && (ret != NOT_CHANGED)) {
  239. GELOGE(ret, "Prepair for infershape failed, ret:%d", ret);
  240. return ret;
  241. }
  242. GELOGD("Prepair for infershape success!");
  243. return GRAPH_SUCCESS;
  244. }
  245. graphStatus Impl::UpdateDataOpAttr(const Graph &graph) {
  246. GELOGD("Enter Update Data Attr Process!");
  247. if (options_.find(kInputShape) == options_.end()) {
  248. return GRAPH_SUCCESS;
  249. }
  250. unordered_map<string, vector<int64_t>> shape_map;
  251. vector<pair<string, vector<int64_t>>> user_shape_map;
  252. GE_CHK_BOOL_EXEC(ParseInputShape(options_[kInputShape], shape_map, user_shape_map, true),
  253. return GRAPH_PARAM_INVALID, "parse input shape failed!");
  254. auto compute_graph = ge::GraphUtils::GetComputeGraph(graph);
  255. GE_CHECK_NOTNULL(compute_graph);
  256. for (ge::NodePtr &input_node : compute_graph->GetDirectNode()) {
  257. GE_CHECK_NOTNULL(input_node);
  258. ge::OpDescPtr op = input_node->GetOpDesc();
  259. GE_CHECK_NOTNULL(op);
  260. if (op->GetType() == DATA) {
  261. auto tensor_input = op->MutableInputDesc(0);
  262. auto tensor_output = op->MutableOutputDesc(0);
  263. GE_CHECK_NOTNULL(tensor_input);
  264. GE_CHECK_NOTNULL(tensor_output);
  265. string data_op_name = op->GetName();
  266. auto iter = shape_map.find(data_op_name);
  267. if (iter != shape_map.end()) {
  268. tensor_input->SetShape(ge::GeShape(iter->second));
  269. tensor_output->SetShape(ge::GeShape(iter->second));
  270. GELOGD("update input [%s] shape info", data_op_name.c_str());
  271. } else {
  272. GELOGI("no need update input [%s] attr because not found from input_shape.", data_op_name.c_str());
  273. }
  274. }
  275. }
  276. return GRAPH_SUCCESS;
  277. }
  278. graphStatus Impl::CheckOptions(const std::map<std::string, std::string> &options) {
  279. for (auto &ele : options) {
  280. auto it = ge::ir_option::ir_builder_suppported_options.find(ele.first);
  281. if (it == ge::ir_option::ir_builder_suppported_options.end()) {
  282. auto it_lx_fusion = ir_builder_supported_options_for_lx_fusion.find(ele.first);
  283. if (it_lx_fusion == ir_builder_supported_options_for_lx_fusion.end()) {
  284. GELOGE(GRAPH_PARAM_INVALID, "input options include unsupported option(%s).Please check!",
  285. ele.first.c_str());
  286. return GRAPH_PARAM_INVALID;
  287. }
  288. }
  289. options_.insert(ele);
  290. }
  291. // Check options build_mode and build_step.
  292. std::string build_mode;
  293. auto it = options_.find(BUILD_MODE);
  294. if (it != options_.end() && !(it->second.empty())) {
  295. if (build_mode_options.find(it->second) == build_mode_options.end()) {
  296. GELOGE(GRAPH_PARAM_INVALID, "Build mode:%s is unsupported. Please check!", it->second.c_str());
  297. return GRAPH_PARAM_INVALID;
  298. }
  299. build_mode = it->second;
  300. }
  301. it = options_.find(BUILD_STEP);
  302. if (it != options_.end() && !(it->second.empty())) {
  303. if (build_step_options.find(it->second) == build_step_options.end()) {
  304. GELOGE(GRAPH_PARAM_INVALID, "Build step:%s is unsupported. Please check!", it->second.c_str());
  305. return GRAPH_PARAM_INVALID;
  306. }
  307. } else {
  308. if (build_mode == BUILD_MODE_TUNING) {
  309. GELOGE(GRAPH_PARAM_INVALID, "Build mode tuning must specify build step. Please check!");
  310. return GRAPH_PARAM_INVALID;
  311. }
  312. }
  313. // Check option EXEC_DISABLE_REUSED_MEMORY
  314. it = options_.find(ge::ir_option::EXEC_DISABLE_REUSED_MEMORY);
  315. if (it != options_.end() && (CheckDisableReuseMemoryParamValid(it->second) != GRAPH_SUCCESS)) {
  316. return GRAPH_PARAM_INVALID;
  317. }
  318. // Check Input Format
  319. if (options_.find(kInputFormat) != options_.end()) {
  320. return CheckInputFormat(options_[kInputFormat]);
  321. }
  322. return GRAPH_SUCCESS;
  323. }
  324. graphStatus Impl::Init(const Graph &graph, const std::map<std::string, std::string> &options) {
  325. // 1. check options
  326. graphStatus ret = CheckOptions(options);
  327. if (ret != GRAPH_SUCCESS) {
  328. GELOGE(ret, "User input options are illegal! Please check!");
  329. return ret;
  330. }
  331. ret = UpdateDataOpAttr(graph);
  332. if (ret != GRAPH_SUCCESS) {
  333. return ret;
  334. }
  335. std::string build_mode = (options_.find(BUILD_MODE) == options_.end() || options_[BUILD_MODE] == BUILD_MODE_NORMAL)
  336. ? "" : options_[BUILD_MODE];
  337. options_[BUILD_MODE] = build_mode;
  338. // set log level
  339. std::string log = options_.find(ge::ir_option::LOG_LEVEL) == options_.end()
  340. ? IR_OPTION_LOG_LEVEL_DEFAULT
  341. : options_[ge::ir_option::LOG_LEVEL];
  342. GE_CHK_BOOL_RET_STATUS_NOLOG(ge::CheckLogParamValidAndSetLogLevel(log) == 0, GRAPH_PARAM_INVALID);
  343. options_[ge::ir_option::LOG_LEVEL] = log;
  344. string input_shape = options_.find("input_shape") == options_.end() ? "" : options_["input_shape"];
  345. string input_format = options_.find("input_format") == options_.end() ? "" : options_["input_format"];
  346. string net_format = options_.find("net_format") == options_.end() ? "" : options_["net_format"];
  347. string dynamic_batch_size = options_.find(ge::ir_option::DYNAMIC_BATCH_SIZE) == options_.end()
  348. ? ""
  349. : options_[ge::ir_option::DYNAMIC_BATCH_SIZE];
  350. string dynamic_image_size = options_.find(ge::ir_option::DYNAMIC_IMAGE_SIZE) == options_.end()
  351. ? ""
  352. : options_[ge::ir_option::DYNAMIC_IMAGE_SIZE];
  353. string dynamic_dims =
  354. options_.find(ge::ir_option::DYNAMIC_DIMS) == options_.end() ? "" : options_[ge::ir_option::DYNAMIC_DIMS];
  355. auto status = CheckDynamicInputParamValid(dynamic_batch_size, dynamic_image_size, dynamic_dims, input_shape,
  356. input_format, is_dynamic_input_);
  357. if (status != ge::SUCCESS) {
  358. GELOGE(GRAPH_PARAM_INVALID, "Check dynamic input size failed!");
  359. return GRAPH_PARAM_INVALID;
  360. }
  361. GELOGD("User input dynamic_batch_size:%s, dynamic_image_size:%s, dynamic_dims:%s.", dynamic_batch_size.c_str(),
  362. dynamic_image_size.c_str(), dynamic_dims.c_str());
  363. omg_context_.dynamic_batch_size = dynamic_batch_size;
  364. omg_context_.dynamic_image_size = dynamic_image_size;
  365. omg_context_.dynamic_dims = dynamic_dims;
  366. // check output_type
  367. std::string output_type = options_.find(ge::ir_option::OUTPUT_TYPE) == options_.end()
  368. ? ""
  369. : options_[ge::ir_option::OUTPUT_TYPE];
  370. GE_CHK_BOOL_EXEC(ge::CheckOutputTypeParamValid(output_type) == ge::SUCCESS,
  371. return ge::GRAPH_PARAM_INVALID, "check output type failed!");
  372. // check insert_op_conf
  373. std::string insert_op_conf = options_.find(ge::ir_option::INSERT_OP_FILE) == options_.end()
  374. ? ""
  375. : options_[ge::ir_option::INSERT_OP_FILE];
  376. GE_CHK_BOOL_EXEC(ge::CheckInsertOpConfParamValid(std::string(insert_op_conf)) == ge::SUCCESS,
  377. return ge::GRAPH_PARAM_INVALID, "check insert op conf failed!");
  378. GE_CHK_BOOL_EXEC(insert_op_conf.empty() || dynamic_dims.empty(),
  379. return ge::GRAPH_PARAM_INVALID, "dynamic dims function does not support aipp");
  380. // for IR builder.Only support om mode, so here fixed;
  381. options_.insert(std::pair<string, string>(string(IR_OPTION_MODE), to_string(0)));
  382. options_.insert(std::pair<string, string>(string(IR_OPTION_TARGET), "mini"));
  383. options_.insert(std::pair<string, string>(string(ge::RUN_FLAG), to_string(0)));
  384. options_.insert(std::pair<string, string>(string(ge::TRAIN_FLAG), to_string(0)));
  385. options_.insert(std::pair<string, string>(string(ge::SAVE_ORIGINAL_MODEL), to_string(0)));
  386. // print ge option map
  387. ge::PrintOptionMap(options_, "ge option");
  388. SetRtSocVersion();
  389. UpdateThreadContext();
  390. // 3. init generator with options_
  391. ret = generator_.Initialize(options_, omg_context_);
  392. if (ret != GRAPH_SUCCESS) {
  393. GELOGE(ret, "generator Initialize failed!");
  394. return ret;
  395. }
  396. // 4.parse and init Context with input shape format and net format info
  397. return this->InitDomiOmgContext(input_shape, input_format, net_format, is_dynamic_input_);
  398. }
  399. void Impl::SetRtSocVersion() {
  400. const auto &global_options = GetMutableGlobalOptions();
  401. auto it = global_options.find(ge::SOC_VERSION);
  402. if (it != global_options.end()) {
  403. const char *soc_version = it->second.c_str();
  404. rtError_t rt_ret = rtSetSocVersion(soc_version);
  405. if (rt_ret != RT_ERROR_NONE) {
  406. GELOGW("Set soc version %s failed. ret:0x%X", soc_version, rt_ret);
  407. }
  408. GELOGD("Set soc version %s success.", soc_version);
  409. }
  410. }
  411. void Impl::UpdateThreadContext() {
  412. GetThreadLocalContext().SetGlobalOption(GetMutableGlobalOptions());
  413. GetThreadLocalContext().SetGraphOption(options_);
  414. }
  415. graphStatus Impl::CreateInputsForIRBuild(const ge::Graph &graph, vector<ge::GeTensor> &inputs) {
  416. auto compute_graph = ge::GraphUtils::GetComputeGraph(graph);
  417. GE_CHECK_NOTNULL(compute_graph);
  418. int64_t index = 0;
  419. for (ge::NodePtr &input_node : compute_graph->GetDirectNode()) {
  420. GE_CHECK_NOTNULL(input_node);
  421. ge::OpDescPtr op = input_node->GetOpDesc();
  422. GE_CHECK_NOTNULL(op);
  423. if (op->GetType() == DATA) {
  424. (void)AttrUtils::SetInt(op, ATTR_NAME_INDEX, index++);
  425. GELOGD("Data op inputDesc size: %zu", op->GetAllInputsDesc().size());
  426. ge::GeTensorDesc tensor = op->GetInputDesc(0);
  427. string data_op_name = op->GetName();
  428. GELOGD("Data op name: %s", data_op_name.c_str());
  429. ge::GeShape data_shape;
  430. auto iter = omg_context_.input_dims.find(data_op_name);
  431. if (iter != omg_context_.input_dims.end()) {
  432. data_shape = ge::GeShape(iter->second);
  433. GELOGD("Data op get shape from Context.");
  434. } else {
  435. data_shape = tensor.GetShape();
  436. GELOGD("Data op get shape from InputDesc in ge ir graph.");
  437. }
  438. // If user point input format, do work for all data ops; else do according to tensor_desc
  439. auto data_format = omg_context_.format != domi::DOMI_TENSOR_ND ?
  440. ge::TypeUtils::DomiFormatToFormat(omg_context_.format) : tensor.GetFormat();
  441. ge::DataType data_type = tensor.GetDataType();
  442. string data_type_str = ge::TypeUtils::DataTypeToSerialString(data_type);
  443. GELOGD("Data op get data type:%s from InputDesc in ge ir graph.", data_type_str.c_str());
  444. ge::GeTensor inputTensor;
  445. ge::GeTensorDesc desc(data_shape, ge::Format(data_format), data_type);
  446. inputTensor.SetTensorDesc(desc);
  447. inputs.push_back(inputTensor);
  448. }
  449. }
  450. GELOGD("CreateInputsForIRBuild, inputs size: %zu", inputs.size());
  451. return GRAPH_SUCCESS;
  452. }
  453. graphStatus Impl::BuildModel(const Graph &graph, const std::map<std::string, std::string> &options,
  454. ModelBufferData &model) {
  455. // 1. init GeGenerator with user optios
  456. graphStatus ret = Init(graph, options);
  457. if (ret != GRAPH_SUCCESS) {
  458. GELOGE(ret, "Build ir model Init failed!");
  459. return ret;
  460. }
  461. // 2. construct input
  462. std::vector<GeTensor> inputs;
  463. if (!omg_context_.is_dynamic_input) { // if dynamic input , no need to creat inputs
  464. ret = CreateInputsForIRBuild(graph, inputs);
  465. if (ret != GRAPH_SUCCESS) {
  466. GELOGE(ret, "CreateInputsForIRBuild failed!");
  467. return ret;
  468. }
  469. }
  470. // 3. build IR model
  471. ret = generator_.GenerateOnlineModel(graph, inputs, model);
  472. if (ret != GRAPH_SUCCESS) {
  473. GELOGE(ret, "GenerateOnlineModel failed!");
  474. return ret;
  475. }
  476. return GRAPH_SUCCESS;
  477. }
  478. graphStatus Impl::InitDomiOmgContext(const string &input_shape, const string &input_format, const string &net_format,
  479. bool is_dynamic_input) {
  480. // Clear omgcontext data first
  481. omg_context_.input_dims.clear();
  482. omg_context_.user_input_dims.clear();
  483. omg_context_.is_dynamic_input = is_dynamic_input;
  484. // the default value is ND
  485. omg_context_.format = domi::DOMI_TENSOR_ND;
  486. if (!input_format.empty()) {
  487. auto iter = ge::input_format_str_to_geformat.find(input_format);
  488. if (iter != ge::input_format_str_to_geformat.end()) {
  489. omg_context_.format = iter->second;
  490. } else {
  491. GELOGE(GRAPH_PARAM_INVALID, "Input format %s not support , expect ND/NCHW/NHWC/CHWN/NC1HWC0/NHWC1C0.",
  492. input_format.c_str());
  493. return GRAPH_PARAM_INVALID;
  494. }
  495. }
  496. // Input is empty, do not process
  497. if (input_shape.empty()) {
  498. return GRAPH_SUCCESS;
  499. }
  500. if (!ParseInputShape(input_shape, omg_context_.input_dims, omg_context_.user_input_dims, is_dynamic_input)) {
  501. GELOGE(GRAPH_PARAM_INVALID, "Failed to parse input shape: %s", input_shape.c_str());
  502. return GRAPH_PARAM_INVALID;
  503. }
  504. return GRAPH_SUCCESS;
  505. }
  506. graphStatus aclgrphBuildModel(const ge::Graph &graph, const std::map<std::string, std::string> &build_options,
  507. ModelBufferData &model) {
  508. GELOGD("Enter aclmdlBuildModel process!");
  509. Impl builder;
  510. return builder.BuildModel(graph, build_options, model);
  511. }
  512. graphStatus aclgrphBuildModel(const ge::Graph &graph, const std::map<AscendString, AscendString> &build_options,
  513. ModelBufferData &model) {
  514. GELOGD("Enter aclmdlBuildModel process!");
  515. std::map<std::string, std::string> tmp_build_options;
  516. for (auto &option : build_options) {
  517. if (option.first.GetString() == nullptr || option.second.GetString() == nullptr) {
  518. GELOGE(GRAPH_FAILED, "AclgrphBuildInitialize option is nullptr.");
  519. return GRAPH_FAILED;
  520. }
  521. std::string key = option.first.GetString();
  522. std::string val = option.second.GetString();
  523. tmp_build_options[key] = val;
  524. }
  525. Impl builder;
  526. return builder.BuildModel(graph, tmp_build_options, model);
  527. }
  528. graphStatus aclgrphSaveModel(const string &output_file, const ModelBufferData &model) {
  529. GELOGD("Enter aclmdlSaveModel process!");
  530. if (model.data.get() == nullptr || model.length == 0) {
  531. GELOGE(GRAPH_PARAM_INVALID, "input model is illegal");
  532. return GRAPH_PARAM_INVALID;
  533. }
  534. return FileSaver::SaveToFile((output_file + ".om"), reinterpret_cast<void *>(model.data.get()),
  535. static_cast<uint32_t>(model.length));
  536. }
  537. graphStatus aclgrphSaveModel(const char *output_file, const ModelBufferData &model) {
  538. GELOGD("Enter aclmdlSaveModel process!");
  539. if (model.data.get() == nullptr || model.length == 0) {
  540. GELOGE(GRAPH_PARAM_INVALID, "Input model is illegal");
  541. return GRAPH_PARAM_INVALID;
  542. }
  543. if (output_file == nullptr) {
  544. GELOGE(GRAPH_PARAM_INVALID, "Output file is nullptr.");
  545. return GRAPH_PARAM_INVALID;
  546. }
  547. std::string str_output_file = output_file;
  548. return FileSaver::SaveToFile((str_output_file + ".om"), reinterpret_cast<void *>(model.data.get()),
  549. static_cast<uint32_t>(model.length));
  550. }
  551. graphStatus aclgrphGetIRVersion(int *major_version, int *minor_version, int *patch_version) {
  552. GELOGD("Enter aclgrphGetIRVersion process!");
  553. GE_CHECK_NOTNULL(major_version);
  554. GE_CHECK_NOTNULL(minor_version);
  555. GE_CHECK_NOTNULL(patch_version);
  556. *major_version = IR_MAJOR_VERSION;
  557. *minor_version = IR_MINOR_VERSION;
  558. *patch_version = IR_PATCH_VERSION;
  559. return GRAPH_SUCCESS;
  560. }
  561. graphStatus aclgrphDumpGraph(const ge::Graph &graph, const char *file, const size_t len) {
  562. GE_CHECK_NOTNULL(file);
  563. if (len > PATH_MAX || len != strlen(file) || strlen(file) == 0) {
  564. GELOGE(GRAPH_PARAM_INVALID, "File path invalid.");
  565. return GRAPH_PARAM_INVALID;
  566. }
  567. auto compute_graph = GraphUtils::GetComputeGraph(graph);
  568. GE_CHECK_NOTNULL(compute_graph);
  569. string full_path(file, len);
  570. for (size_t i = 0; i < len; i++) {
  571. if (full_path[i] == '\\') {
  572. full_path.replace(i, 1, "/");
  573. }
  574. }
  575. string suffix;
  576. string file_path;
  577. int pos = full_path.rfind("/");
  578. if (pos != -1) {
  579. suffix = full_path.substr(pos + 1, -1);
  580. file_path = full_path.substr(0, pos);
  581. } else {
  582. suffix = full_path;
  583. file_path = "./";
  584. }
  585. if (suffix.empty()) {
  586. suffix = compute_graph->GetName();
  587. if (suffix.empty()) {
  588. suffix = "graph";
  589. }
  590. }
  591. char path[PATH_MAX] = {0};
  592. if (realpath(file_path.c_str(), path) == nullptr) {
  593. GELOGE(GRAPH_PARAM_INVALID, "Dump file path:%s is invalid.", file);
  594. return GRAPH_PARAM_INVALID;
  595. }
  596. GraphUtils::DumpGEGrph(compute_graph, string(path), suffix);
  597. GraphUtils::DumpGrphToOnnx(*compute_graph, string(path), suffix);
  598. uint64_t i = 0;
  599. for (const auto &sub_graph_func : compute_graph->GetAllSubgraphs()) {
  600. auto sub_graph_func_name = suffix + std::string("_sub_graph_") + std::to_string(i++);
  601. GraphUtils::DumpGEGrph(sub_graph_func, string(path), sub_graph_func_name);
  602. GraphUtils::DumpGrphToOnnx(*sub_graph_func, string(path), sub_graph_func_name);
  603. }
  604. return GRAPH_SUCCESS;
  605. }
  606. graphStatus aclgrphGenerateForOp(const AscendString &op_type, const vector<TensorDesc> &inputs,
  607. const vector<TensorDesc> &outputs, Graph &graph) {
  608. auto op_type_str = std::string(op_type.GetString());
  609. auto op_name = op_type_str + "_" + std::to_string(ge::GetCurrentTimestamp());
  610. auto op_desc = ge::MakeShared<ge::OpDesc>(op_name, op_type_str);
  611. GE_CHECK_NOTNULL(op_desc);
  612. // convert input tensordesc to getensor
  613. std::vector<ge::GeTensor> input_tensors;
  614. for (const auto &input : inputs) {
  615. ge::GeTensorDesc tensor_desc(ge::GeShape(input.GetShape().GetDims()), input.GetFormat(), input.GetDataType());
  616. tensor_desc.SetOriginFormat(input.GetFormat());
  617. ge::TensorUtils::SetRealDimCnt(tensor_desc, static_cast<uint32_t>(input.GetShape().GetDims().size()));
  618. ge::TensorUtils::SetInputTensor(tensor_desc, true);
  619. ge::TensorUtils::SetOutputTensor(tensor_desc, false);
  620. if (op_desc->AddInputDesc(tensor_desc) != ge::GRAPH_SUCCESS) {
  621. GELOGE(ge::FAILED, "AddInputDesc fail.");
  622. return ge::FAILED;
  623. }
  624. input_tensors.emplace_back(tensor_desc);
  625. }
  626. // convert output tensordesc to getensor
  627. std::vector<ge::GeTensor> output_tensors;
  628. for (const auto &output : outputs) {
  629. ge::GeTensorDesc tensor_desc(ge::GeShape(output.GetShape().GetDims()), output.GetFormat(), output.GetDataType());
  630. tensor_desc.SetOriginFormat(output.GetFormat());
  631. ge::TensorUtils::SetRealDimCnt(tensor_desc, static_cast<uint32_t>(output.GetShape().GetDims().size()));
  632. ge::TensorUtils::SetInputTensor(tensor_desc, false);
  633. ge::TensorUtils::SetOutputTensor(tensor_desc, true);
  634. (void)op_desc->AddOutputDesc(tensor_desc);
  635. output_tensors.emplace_back(tensor_desc);
  636. }
  637. // call api to get graph
  638. ge::GeGenerator generator;
  639. std::string graph_name = ge::CurrentTimeInStr() + "_graph";
  640. if (generator.BuildSingleOpGraph(op_desc, input_tensors, output_tensors, graph_name, graph) != ge::SUCCESS) {
  641. GELOGE(GRAPH_FAILED, "make graph fail.");
  642. return GRAPH_FAILED;
  643. }
  644. return GRAPH_SUCCESS;
  645. }
  646. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,而用户对此并无感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示: