You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

ge_executor.cc 52 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "framework/executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <ctime>
  19. #include <iostream>
  20. #include "framework/common/debug/log.h"
  21. #include "common/ge/ge_util.h"
  22. #include "framework/common/helper/model_helper.h"
  23. #include "common/profiling/profiling_manager.h"
  24. #include "common/dump/dump_manager.h"
  25. #include "graph/execute/graph_execute.h"
  26. #include "graph/load/graph_loader.h"
  27. #include "graph/load/model_manager/model_manager.h"
  28. #include "graph/manager/graph_mem_manager.h"
  29. #include "graph/manager/graph_var_manager.h"
  30. #include "graph/manager/host_mem_manager.h"
  31. #include "single_op/single_op_manager.h"
  32. #include "graph/load/model_manager/davinci_model.h"
  33. #include "opskernel_manager/ops_kernel_builder_manager.h"
  34. #include "graph/opsproto_manager.h"
  35. #include "ge_local_engine/engine/host_cpu_engine.h"
  36. using std::string;
  37. using std::vector;
  38. namespace {
  // Number of values in one gear when only the batch size is dynamic.
  constexpr size_t kDynamicBatchSizeVecSize = 1;
  // Not referenced in the visible part of this file; presumably the size of static batch info - TODO confirm.
  constexpr size_t kStaticBatchInfoSize = 1;
  // Number of values (height, width) in one gear when the image size is dynamic.
  constexpr size_t kDynamicImageSizeVecSize = 2;
  // Number of values (height, width) written to the dynamic image size input buffer.
  constexpr size_t kDynamicImageSizeInputSize = 2;
  // Prefix of the batch label; the index of the matched gear is appended to it.
  constexpr const char *kBatchLabel = "Batch_";
  44. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  45. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  46. const std::vector<uint32_t> &formats) {
  47. uint32_t idx = 0;
  48. for (auto desc_item : domi_descs) {
  49. ge::TensorDesc ge_desc;
  50. ge_desc.SetName(desc_item.name.c_str());
  51. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  52. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  53. std::vector<int64_t> shape_dims;
  54. for (auto dim : desc_item.shape_info.dims) {
  55. shape_dims.push_back(dim);
  56. }
  57. ge::Shape ge_shape(shape_dims);
  58. ge_desc.SetShape(ge_shape);
  59. ge_desc.SetSize(desc_item.size);
  60. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  61. ge_descs.emplace_back(ge_desc);
  62. ++idx;
  63. }
  64. }
  65. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  66. inputs.index = input_data.index;
  67. inputs.model_id = input_data.modelId;
  68. inputs.timestamp = input_data.timestamp;
  69. inputs.timeout = input_data.timeout;
  70. inputs.request_id = input_data.request_id;
  71. for (const auto &data_item : input_data.blobs) {
  72. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  73. inputs.blobs.emplace_back(dataBuf);
  74. }
  75. }
  76. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  77. outputs.index = output_data.index;
  78. outputs.model_id = output_data.modelId;
  79. for (const auto &data_item : output_data.blobs) {
  80. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  81. outputs.blobs.emplace_back(dataBuf);
  82. }
  83. }
  84. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  85. ge::InputData &inputs) {
  86. inputs.is_dynamic_batch = true;
  87. std::string batch_label;
  88. size_t match_idx = 0;
  89. for (size_t i = 0; i < batch_info.size(); ++i) {
  90. // dynamic_dims
  91. if (input_data.dynamic_dims.size() != 0) {
  92. bool is_match = true;
  93. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  94. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  95. is_match = false;
  96. break;
  97. }
  98. }
  99. if (is_match) {
  100. match_idx = i;
  101. break;
  102. }
  103. // dynamic_batch_size
  104. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  105. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  106. match_idx = i;
  107. break;
  108. // dynamic_image_size
  109. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  110. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  111. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  112. match_idx = i;
  113. break;
  114. }
  115. }
  116. batch_label = kBatchLabel + std::to_string(match_idx);
  117. inputs.batch_label = batch_label;
  118. GELOGI("current batch label:%s", batch_label.c_str());
  119. }
  120. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  121. if (batch_info.empty()) {
  122. REPORT_INNER_ERROR("E19999", "param Dynamic batch info is empty, check invalid.");
  123. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch info is empty.");
  124. return false;
  125. }
  126. for (auto batch : batch_info) {
  127. if (batch.size() != kDynamicBatchSizeVecSize) {
  128. REPORT_INNER_ERROR("E19999", "Dynamic batch param num is %zu, current batch size is %zu.",
  129. kDynamicBatchSizeVecSize, batch.size());
  130. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch param num is %zu, current batch size is %zu.",
  131. kDynamicBatchSizeVecSize, batch.size());
  132. return false;
  133. }
  134. if (batch[0] == static_cast<int64_t>(batch_size)) {
  135. return true;
  136. }
  137. }
  138. REPORT_INNER_ERROR("E19999", "Dynamic batch %lu can not match the gear of model.", batch_size);
  139. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch %lu can not match the gear of model.", batch_size);
  140. return false;
  141. }
  142. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  143. const vector<std::vector<int64_t>> &batch_info) {
  144. if (batch_info.empty()) {
  145. REPORT_INNER_ERROR("E19999", "ParamDynamic batch info is empty. check invalid");
  146. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch info is empty.");
  147. return false;
  148. }
  149. for (auto resolution : batch_info) {
  150. if (resolution.size() != kDynamicImageSizeVecSize) {
  151. REPORT_INNER_ERROR("E19999", "Dynamic resolution param num is %zu, current resolution size is %zu.",
  152. kDynamicImageSizeVecSize, resolution.size());
  153. GELOGE(ge::FAILED, "[Check][Param] Dynamic resolution param num is %zu, current resolution size is %zu.",
  154. kDynamicImageSizeVecSize, resolution.size());
  155. return false;
  156. }
  157. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  158. return true;
  159. }
  160. }
  161. REPORT_INNER_ERROR("E19999", "Dynamic resolution (%lu,%lu) can not match the gear of model.",
  162. image_height, image_width);
  163. GELOGE(ge::FAILED, "[Check][Param]Dynamic resolution (%lu,%lu) can not match the gear of model.",
  164. image_height, image_width);
  165. return false;
  166. }
  167. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims,
  168. const vector<vector<int64_t>> &batch_info) {
  169. if (batch_info.empty()) {
  170. REPORT_INNER_ERROR("E19999", "param batch_info is empty, check invalid");
  171. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "[Check][Param] Dynamic batch info is empty.");
  172. return false;
  173. }
  174. bool find_match = false;
  175. for (auto resolution : batch_info) {
  176. if (cur_dynamic_dims.size() != resolution.size()) {
  177. REPORT_INNER_ERROR("E19999", "Cur dynamic dims param num is %zu, current resolution size is %zu.",
  178. cur_dynamic_dims.size(), resolution.size());
  179. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  180. "[Check][Param] Cur dynamic dims param num is %zu, current resolution size is %zu.",
  181. cur_dynamic_dims.size(), resolution.size());
  182. return false;
  183. }
  184. bool flag = true;
  185. for (std::size_t i = 0; i < resolution.size(); ++i) {
  186. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  187. flag = false;
  188. break;
  189. }
  190. }
  191. if (flag) {
  192. find_match = true;
  193. break;
  194. }
  195. }
  196. if (!find_match) {
  197. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "[Check][Param] choose dynamic dims can not match the gear of model.");
  198. }
  199. return find_match;
  200. }
  201. } // namespace
  202. namespace ge {
  203. bool GeExecutor::isInit_ = false;
  204. static void InitOpsProtoManager() {
  205. string opsproto_path;
  206. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  207. if (path_env != nullptr) {
  208. string path = path_env;
  209. string file_path = RealPath(path.c_str());
  210. if (file_path.empty()) {
  211. GELOGE(FAILED, "[Check][EnvPath]ASCEND_OPP_PATH path [%s] is invalid.", path.c_str());
  212. REPORT_INPUT_ERROR("E68016", {"ASCEND_OPP_PATH", path});
  213. return;
  214. }
  215. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  216. GELOGI("Get opsproto so path from env : %s", path.c_str());
  217. } else {
  218. string path_base = PluginManager::GetPath();
  219. GELOGI("path_base is %s", path_base.c_str());
  220. path_base = path_base.substr(0, path_base.rfind('/'));
  221. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  222. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  223. }
  224. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  225. OpsProtoManager *manager = OpsProtoManager::Instance();
  226. map<string, string> option_tmp;
  227. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  228. (void)manager->Initialize(option_tmp);
  229. }
  230. GeExecutor::GeExecutor() {}
  231. Status GeExecutor::Initialize(const std::map<string, string> &options) {
  232. if (isInit_) {
  233. GELOGW("Already initialized, no need to be initialized again.");
  234. return ge::SUCCESS;
  235. }
  236. GELOGI("Init GeExecutor begin.");
  237. OpTilingManager::GetInstance().LoadSo();
  238. Status init_hostcpu_engine_status = HostCpuEngine::GetInstance().Initialize();
  239. if (init_hostcpu_engine_status != SUCCESS) {
  240. GELOGE(init_hostcpu_engine_status, "[initialize][HostCpuEngine] failed");
  241. return init_hostcpu_engine_status;
  242. }
  243. InitOpsProtoManager();
  244. GE_CHK_STATUS_RET(HostMemManager::Instance().Initialize());
  245. const std::vector<rtMemType_t> mem_type({1, RT_MEMORY_HBM, RT_MEMORY_P2P_DDR});
  246. Status status = MemManager::Instance().Initialize(mem_type);
  247. if (status != SUCCESS) {
  248. GELOGE(status, "[Init][MemManager] MemoryAllocatorManager initialize failed.");
  249. REPORT_CALL_ERROR("E19999", "MemManager initialize failed.");
  250. return status;
  251. }
  252. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  253. "[Initialize][OpsKernelBuilderManager] failed.");
  254. const auto &model_manager = ModelManager::GetInstance();
  255. GE_CHECK_NOTNULL(model_manager);
  256. status = model_manager->EnableExceptionDump(options);
  257. if (status != SUCCESS) {
  258. GELOGW("[Init][ModelManager] Enable exception dump failed.");
  259. }
  260. ProfilingManager::Instance().Initialize(options);
  261. isInit_ = true;
  262. GELOGI("Init GeExecutor over.");
  263. return SUCCESS;
  264. }
  265. Status GeExecutor::FinalizeEx() {
  266. if (isInit_ == false) {
  267. GELOGW("GeExecutor has not been initialized.");
  268. return ge::SUCCESS;
  269. }
  270. GELOGI("Uninit GeExecutor begin.");
  271. (void)OpsKernelBuilderManager::Instance().Finalize();
  272. HostMemManager::Instance().Finalize();
  273. ProfilingManager::Instance().Finalize();
  274. GELOGI("Uninit GeExecutor over.");
  275. return SUCCESS;
  276. }
  277. Status GeExecutor::Initialize() {
  278. // job id need to be set, the value is meaningless;
  279. const std::map<string, string> options({
  280. {OPTION_EXEC_JOB_ID, "1"}, {OPTION_EXEC_PROFILING_MODE, ""}, {OPTION_EXEC_PROFILING_OPTIONS, ""}
  281. });
  282. return GeExecutor::Initialize(options);
  283. }
  284. Status GeExecutor::Finalize() {
  285. return GeExecutor::FinalizeEx();
  286. }
  287. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  288. uint64_t batch_size) {
  289. if (dynamic_input_addr == nullptr) {
  290. REPORT_INNER_ERROR("E19999", "param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  291. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  292. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  293. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  294. }
  295. uint64_t size = sizeof(uint32_t);
  296. if (length < size) {
  297. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is less than [%lu], check invalid, model id:%u",
  298. length, size, model_id);
  299. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  300. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u", length, size, model_id);
  301. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  302. }
  303. if (length >= sizeof(uint64_t)) {
  304. size = sizeof(uint64_t);
  305. }
  306. // Verify whether the input dynamic batch matches the model gear
  307. std::vector<std::vector<int64_t>> batch_info;
  308. std::vector<uint64_t> batch_num{batch_size};
  309. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  310. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  311. if (ret != SUCCESS) {
  312. REPORT_CALL_ERROR("E19999", "get dynamic batch info failed, model id:%u", model_id);
  313. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  314. return ret;
  315. }
  316. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  317. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  318. "[Check][Param] The current dynamic input does not match the gear of the model(id:%u).", model_id);
  319. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  320. }
  321. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  322. if (ret != SUCCESS) {
  323. REPORT_CALL_ERROR("E19999", "set dynamic size failed, model id:%u, dynamic_type:1", model_id);
  324. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u, dynamic_type:1", model_id);
  325. return ret;
  326. }
  327. // memcpy dynamic_batch_size from host to device
  328. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  329. if (rt_ret != RT_ERROR_NONE) {
  330. REPORT_CALL_ERROR("E19999", "Call rtMemcpy, size:%lu ret:0x%X", length, rt_ret);
  331. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic batch input data failed! size:%lu ret:0x%X", length, rt_ret);
  332. return RT_ERROR_TO_GE_STATUS(rt_ret);
  333. }
  334. return SUCCESS;
  335. }
  336. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  337. uint64_t image_height, uint64_t image_width) {
  338. if (dynamic_input_addr == nullptr) {
  339. REPORT_INNER_ERROR("E19999", "param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  340. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  341. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  342. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  343. }
  344. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  345. if (length < dynamic_input_size) {
  346. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is less than [%lu], check invalid, model id:%u",
  347. length, dynamic_input_size, model_id);
  348. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  349. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u",
  350. length, dynamic_input_size, model_id);
  351. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  352. }
  353. uint64_t size = sizeof(uint32_t);
  354. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  355. size = sizeof(uint64_t);
  356. }
  357. // Verify whether the input dynamic resolution matches the model gear
  358. std::vector<std::vector<int64_t>> batch_info;
  359. std::vector<uint64_t> batch_num{image_height, image_width};
  360. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  361. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  362. if (ret != SUCCESS) {
  363. REPORT_CALL_ERROR("E19999", "Get dynamic input info failed, model id:%u.", model_id);
  364. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  365. return ret;
  366. }
  367. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  368. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  369. "[Check][Param] The current dynamic input does not match the gear of the model, "
  370. "image_height:%lu, image_width:%lu.", image_height, image_width);
  371. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  372. }
  373. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  374. if (ret != SUCCESS) {
  375. REPORT_CALL_ERROR("E19999", "Set dynamic size failed, model id:%u,", model_id);
  376. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u", model_id);
  377. return ret;
  378. }
  379. // Memcpy dynamic resolution height from host to device
  380. rtError_t rt_ret =
  381. rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  382. if (rt_ret != RT_ERROR_NONE) {
  383. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed! size:%lu, ret:0x%X, model id:%u", size, rt_ret, model_id);
  384. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X, model id:%u",
  385. size, rt_ret, model_id);
  386. return RT_ERROR_TO_GE_STATUS(rt_ret);
  387. }
  388. uint64_t remain_size = length - size;
  389. // Memcpy dynamic resolution width from host to device
  390. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size),
  391. remain_size, &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  392. if (rt_ret != RT_ERROR_NONE) {
  393. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed! size:%lu, ret:0x%X, model id:%u",
  394. remain_size, rt_ret, model_id);
  395. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X, model id:%u",
  396. remain_size, rt_ret, model_id);
  397. return RT_ERROR_TO_GE_STATUS(rt_ret);
  398. }
  399. return SUCCESS;
  400. }
  401. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  402. const vector<uint64_t> &dynamic_dims) {
  403. if (dynamic_input_addr == nullptr) {
  404. REPORT_INNER_ERROR("E19999", "Param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  405. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  406. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  407. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  408. }
  409. vector<uint64_t> cur_dynamic_dims;
  410. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  411. if (ret != SUCCESS) {
  412. GELOGE(ret, "[Get][CurDynamicDims] failed, model id:%u", model_id);
  413. return ret;
  414. }
  415. std::vector<std::vector<int64_t>> batch_info;
  416. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  417. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  418. if (ret != SUCCESS) {
  419. REPORT_CALL_ERROR("E19999", "Get dynamic input info failed, model id:%u.", model_id);
  420. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  421. return ret;
  422. }
  423. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  424. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  425. "[Check][Param] The current dynamic input does not match the gear of the model, id:%u.", model_id);
  426. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  427. }
  428. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  429. if (ret != SUCCESS) {
  430. REPORT_CALL_ERROR("E19999", "Set dynamic size failed, model id:%u", model_id);
  431. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u", model_id);
  432. return ret;
  433. }
  434. size_t dynamic_dim_num = cur_dynamic_dims.size();
  435. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  436. if (length < dynamic_input_size) {
  437. REPORT_INNER_ERROR("E19999", "input dynamic size [%lu] is less than [%lu], model id:%u",
  438. length, dynamic_input_size, model_id);
  439. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  440. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u",
  441. length, dynamic_input_size, model_id);
  442. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  443. }
  444. uint64_t size = sizeof(uint32_t);
  445. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  446. size = sizeof(uint64_t);
  447. }
  448. rtError_t rt_ret;
  449. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  450. // Memcpy dynamic dim[i] from host to device
  451. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  452. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  453. if (rt_ret != RT_ERROR_NONE) {
  454. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, size:%lu, ret:0x%X", (length - size * i), rt_ret);
  455. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X",
  456. length - size * i, rt_ret);
  457. return RT_ERROR_TO_GE_STATUS(rt_ret);
  458. }
  459. }
  460. return SUCCESS;
  461. }
  462. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  463. vector<uint64_t> &cur_dynamic_dims) {
  464. cur_dynamic_dims.clear();
  465. vector<ge::TensorDesc> input_desc;
  466. vector<ge::TensorDesc> output_desc;
  467. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  468. if (ret != ge::SUCCESS) {
  469. GELOGE(ret, "[Get][ModelDescInfo] failed, model id:%u.", model_id);
  470. return ret;
  471. }
  472. vector<string> user_designate_shape_order;
  473. vector<int64_t> all_data_dims;
  474. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  475. if (ret != ge::SUCCESS) {
  476. GELOGE(ret, "[Call][GetUserDesignateShapeOrder] failed, model id:%u.", model_id);
  477. return ret;
  478. }
  479. for (auto &data_name : user_designate_shape_order) {
  480. for (auto &desc : input_desc) {
  481. if (desc.GetName() == data_name) {
  482. for (auto dim : desc.GetShape().GetDims()) {
  483. all_data_dims.push_back(dim);
  484. }
  485. break;
  486. }
  487. }
  488. }
  489. if (dynamic_dims.size() != all_data_dims.size()){
  490. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  491. dynamic_dims.size(), all_data_dims.size());
  492. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  493. "[Check][Param] Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  494. dynamic_dims.size(), all_data_dims.size());
  495. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  496. }
  497. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  498. if (all_data_dims[i] < 0) {
  499. cur_dynamic_dims.push_back(dynamic_dims[i]);
  500. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  501. REPORT_INNER_ERROR("E19999", "Static dims should be same, index:%zu value:%lu should be %ld",
  502. i, dynamic_dims[i], all_data_dims[i]);
  503. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  504. "[Check][Param] Static dims should be same, index:%zu value:%lu should be %ld",
  505. i, dynamic_dims[i], all_data_dims[i]);
  506. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  507. }
  508. }
  509. return SUCCESS;
  510. }
  511. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  512. GELOGI("Begin to get current shape");
  513. if (!isInit_) {
  514. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized, model id:%u", model_id);
  515. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized, model id:%u", model_id);
  516. return ACL_ERROR_GE_EXEC_NOT_INIT;
  517. }
  518. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  519. if (ret != SUCCESS) {
  520. REPORT_CALL_ERROR("E19999", "Get Cur Shape failed, model id:%u", model_id);
  521. GELOGE(ret, "[Get][CurShape] failed, model id:%u", model_id);
  522. return ret;
  523. }
  524. return SUCCESS;
  525. }
  526. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  527. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  528. const kAippDynamicPara &aippParms) {
  529. GELOGI("Enter to SetDynamicAippData.");
  530. if (dynamic_input_addr == nullptr) {
  531. REPORT_INNER_ERROR("E19999", "Param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  532. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  533. "[Check][Param] Dynamic aipp input addr is nullptr, model id:%u", model_id);
  534. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  535. }
  536. if (aippBatchPara.empty()) {
  537. REPORT_INNER_ERROR("E19999", "Param aippBatchPara is empty, check invalid, model id:%u", model_id);
  538. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "[Check][Param] aippBatchPara is empty, model id:%u", model_id);
  539. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  540. }
  541. uint64_t batch_num = aippBatchPara.size();
  542. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  543. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  544. GELOGI(
  545. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  546. "batch num is %lu, struct_len is %lu",
  547. model_id, length, batch_num, struct_len);
  548. if (struct_len > length) {
  549. REPORT_INNER_ERROR("E19999", "input dynamic aipp param len:%lu is larger than aipp_data size:%lu",
  550. struct_len, length);
  551. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  552. "[Check][Param] input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]",
  553. struct_len, length);
  554. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  555. }
  556. // Memcpy real kAippDynamicBatchPara from host to device
  557. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  558. if (rt_ret != RT_ERROR_NONE) {
  559. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, size:%lu, ret:0x%X", length, rt_ret);
  560. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy aippParms failed! size:%lu, ret:0x%X", length, rt_ret);
  561. return RT_ERROR_TO_GE_STATUS(rt_ret);
  562. }
  563. uint64_t remain_len = length - real_aippParms_size;
  564. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  565. for (uint64_t i = 0; i < batch_num; ++i) {
  566. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  567. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  568. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  569. if (rt_ret != RT_ERROR_NONE) {
  570. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, ret:0x%X", rt_ret);
  571. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy kAippDynamicBatchPara input data failed! ret:0x%X", rt_ret);
  572. return RT_ERROR_TO_GE_STATUS(rt_ret);
  573. }
  574. }
  575. return SUCCESS;
  576. }
  577. Status GeExecutor::UnloadModel(uint32_t model_id) {
  578. GELOGD("unload model %u begin.", model_id);
  579. if (!isInit_) {
  580. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized");
  581. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  582. return ACL_ERROR_GE_EXEC_NOT_INIT;
  583. }
  584. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  585. if (ret != SUCCESS) {
  586. REPORT_CALL_ERROR("E19999", "Destroy Aicpu Session For Infer failed, model id:%u", model_id);
  587. GELOGE(ret, "[Destroy][AicpuSession] For Infer failed. model id:%u", model_id);
  588. return ret;
  589. }
  590. std::shared_ptr<hybrid::HybridDavinciModel> hybrid_davinci_model =
  591. ModelManager::GetInstance()->GetHybridModel(model_id);
  592. if (hybrid_davinci_model != nullptr) {
  593. uint64_t session_id = hybrid_davinci_model->GetSessionId();
  594. VarManagerPool::Instance().RemoveVarManager(session_id);
  595. } else {
  596. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  597. if (davinci_model != nullptr) {
  598. uint64_t session_id = davinci_model->GetSessionId();
  599. VarManagerPool::Instance().RemoveVarManager(session_id);
  600. }
  601. }
  602. ret = GraphLoader::UnloadModel(model_id);
  603. if (ret != SUCCESS) {
  604. REPORT_CALL_ERROR("E19999", "unload model failed, model id:%u", model_id);
  605. GELOGE(ret, "[Unload][Model] failed. model id:%u", model_id);
  606. return ret;
  607. }
  608. return SUCCESS;
  609. }
  610. // Get input and output descriptor
  611. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  612. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  613. if (!isInit_) {
  614. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized, model id:%u", model_id);
  615. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized, model id:%u", model_id);
  616. return ACL_ERROR_GE_EXEC_NOT_INIT;
  617. }
  618. std::vector<InputOutputDescInfo> input_desc_infos;
  619. std::vector<InputOutputDescInfo> output_desc_infos;
  620. std::vector<uint32_t> input_formats;
  621. std::vector<uint32_t> output_formats;
  622. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  623. output_formats, new_model_desc);
  624. if (ret != domi::SUCCESS) {
  625. REPORT_CALL_ERROR("E19999", "get input output desc info failed, ret = %u, model id:%u", ret, model_id);
  626. GELOGE(ret, "[Get][InputOutputDescInfo] failed. ret = %u, model id:%u", ret, model_id);
  627. return ACL_ERROR_GE_GET_TENSOR_INFO;
  628. }
  629. if (input_formats.size() != input_desc_infos.size()) {
  630. REPORT_INNER_ERROR("E19999", "input_formats size %zu is not equal to input_desc_infos size %zu, model id:%u.",
  631. input_formats.size(), input_desc_infos.size(), model_id);
  632. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  633. "[Check][Param] input_formats size %zu is not equal to input_desc_infos size %zu, model id:%u.",
  634. input_formats.size(), input_desc_infos.size(), model_id);
  635. return ACL_ERROR_GE_PARAM_INVALID;
  636. }
  637. if (output_formats.size() != output_desc_infos.size()) {
  638. REPORT_INNER_ERROR("E19999", "output_formats size %zu is not equal to output_desc_infos size %zu, model id:%u.",
  639. output_formats.size(), output_desc_infos.size(), model_id);
  640. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  641. "[Check][Param] output_formats size %zu is not equal to output_desc_infos size %zu, model id:%u.",
  642. output_formats.size(), output_desc_infos.size(), model_id);
  643. return ACL_ERROR_GE_PARAM_INVALID;
  644. }
  645. // Transfer data to TensorDesc
  646. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  647. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  648. return ge::SUCCESS;
  649. }
  650. ///
  651. /// @ingroup ge
  652. /// @brief Get dynamic batch_info
  653. /// @param [in] model_id
  654. /// @param [out] batch_info
  655. /// @param [out] dynamic_type
  656. /// @return execute result
  657. ///
  658. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  659. int32_t &dynamic_type) {
  660. if (!isInit_) {
  661. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  662. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  663. return ACL_ERROR_GE_EXEC_NOT_INIT;
  664. }
  665. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  666. if (ret != SUCCESS) {
  667. REPORT_CALL_ERROR("E19999", "Get Dynamic BatchInfo failed, model id:%u.", model_id);
  668. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  669. return ret;
  670. }
  671. return SUCCESS;
  672. }
  673. ///
  674. /// @ingroup ge
  675. /// @brief Get combined dynamic dims info
  676. /// @param [in] model_id
  677. /// @param [out] batch_info
  678. /// @return execute result
  679. ///
  680. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  681. GELOGI("Begin to get combined dynamic dims info.");
  682. if (!isInit_) {
  683. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  684. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  685. return ACL_ERROR_GE_EXEC_NOT_INIT;
  686. }
  687. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  688. if (ret != SUCCESS) {
  689. REPORT_CALL_ERROR("E19999", "Get Combined DynamicDims failed, model id:%u.", model_id);
  690. GELOGE(ret, "[Get][CombinedDynamicDims] failed, model id:%u.", model_id);
  691. return ret;
  692. }
  693. GELOGI("Get combined dynamic dims succ.");
  694. return SUCCESS;
  695. }
  696. ///
  697. /// @ingroup ge
  698. /// @brief Get user designeate shape order
  699. /// @param [in] model_id
  700. /// @param [out] user_designate_shape_order
  701. /// @return execute result
  702. ///
  703. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  704. if (!isInit_) {
  705. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  706. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  707. return ACL_ERROR_GE_EXEC_NOT_INIT;
  708. }
  709. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  710. if (ret != SUCCESS) {
  711. REPORT_CALL_ERROR("E19999", "GetUserDesignateShapeOrder failed, model id:%u.", model_id);
  712. GELOGE(ret, "[Call][GetUserDesignateShapeOrder] failed, model id:%u.", model_id);
  713. return ret;
  714. }
  715. return SUCCESS;
  716. }
  717. ///
  718. /// @ingroup ge
  719. /// @brief Get AIPP input format
  720. /// @param [in] model_id
  721. /// @param [in] index
  722. /// @param [out] input_format
  723. /// @return execute result
  724. ///
  725. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  726. GELOGI("Begin to GetAIPPInfo.");
  727. if (!isInit_) {
  728. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  729. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor not inited yet!");
  730. return ACL_ERROR_GE_EXEC_NOT_INIT;
  731. }
  732. Status ret = GraphExecutor::GetAippInfo(model_id, index, aipp_info);
  733. if (ret != SUCCESS) {
  734. GELOGW("GetAIPPInfo is not success.");
  735. return ret;
  736. }
  737. GELOGI("GetAIPPInfo succ.");
  738. return SUCCESS;
  739. }
  740. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  741. GELOGI("Begin to get aipp type.");
  742. if (!isInit_) {
  743. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  744. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not inited yet!");
  745. return ACL_ERROR_GE_EXEC_NOT_INIT;
  746. }
  747. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  748. if (ret != SUCCESS) {
  749. GELOGW("Get aipp type is not success.");
  750. return ret;
  751. }
  752. GELOGI("Get aipp type success.");
  753. return SUCCESS;
  754. }
  755. Status GeExecutor::GetOpAttr(uint32_t model_id, const std::string &op_name, const std::string &attr_name,
  756. std::string &attr_value) {
  757. GELOGI("Begin to get op attr.");
  758. if (!isInit_) {
  759. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Init][GeExecutor]Ge executor not inited yet!");
  760. REPORT_INNER_ERROR("E19999", "Ge executor not inited yet!");
  761. return ACL_ERROR_GE_EXEC_NOT_INIT;
  762. }
  763. Status ret = GraphExecutor::GetOpAttr(model_id, op_name, attr_name, attr_value);
  764. if (ret != SUCCESS) {
  765. GELOGE(ret, "[Get][OpAttr]Get op:%s attr:%s failed, model id:%u.",
  766. op_name.c_str(), attr_name.c_str(), model_id);
  767. REPORT_CALL_ERROR("E19999", "Get op:%s attr:%s failed, model id:%u",
  768. op_name.c_str(), attr_name.c_str(), model_id);
  769. return ret;
  770. }
  771. return SUCCESS;
  772. }
  773. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  774. if (!isInit_) {
  775. REPORT_INNER_ERROR("E19999", "GeExecutor has not inited yet!");
  776. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not inited yet!");
  777. return ACL_ERROR_GE_EXEC_NOT_INIT;
  778. }
  779. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  780. if (ret != SUCCESS) {
  781. REPORT_CALL_ERROR("E19999", "Get Model Attr failed, model id:%u.", model_id);
  782. GELOGE(ret, "[Get][ModelAttr] failed, model id:%u.", model_id);
  783. return ret;
  784. }
  785. return SUCCESS;
  786. }
  787. Status GeExecutor::CommandHandle(const Command &command) {
  788. Status ret = GraphLoader::CommandHandle(command);
  789. if (ret != SUCCESS) {
  790. REPORT_CALL_ERROR("E19999", "call CommandHandle failed, ret:%u", ret);
  791. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "[Call][CommandHandle] failed, ret:%u", ret);
  792. return ACL_ERROR_GE_COMMAND_HANDLE;
  793. }
  794. return SUCCESS;
  795. }
  796. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  797. GELOGI("Get max used memory begin.");
  798. if (!isInit_) {
  799. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  800. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  801. return ACL_ERROR_GE_EXEC_NOT_INIT;
  802. }
  803. uint64_t max_mem_size = 0;
  804. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  805. max_size = static_cast<uint32_t>(max_mem_size);
  806. return ret;
  807. }
  808. /**
  809. * @ingroup ge
  810. * @brief Load data from model file to memory
  811. * @param [in] const std::string &path: Offline model file path
  812. * @param [out] domi::ModelData &model_data: Offline model memory data
  813. * @return SUCCESS handle successfully / others handle failed
  814. */
  815. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  816. GELOGI("Load data from file begin.");
  817. if (!isInit_) {
  818. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  819. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  820. return ACL_ERROR_GE_EXEC_NOT_INIT;
  821. }
  822. string filePath = RealPath(path.c_str());
  823. if (filePath.empty()) {
  824. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  825. "[Call][RealPath] File path is invalid. please check your text file '%s'.", path.c_str());
  826. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  827. }
  828. GELOGI("load modelData from file: %s.", path.c_str());
  829. int32_t priority = 0;
  830. Status ret = GraphLoader::LoadDataFromFile(path, priority, model_data);
  831. if (ret != SUCCESS) {
  832. if (model_data.model_data != nullptr) {
  833. delete[] static_cast<char *>(model_data.model_data);
  834. model_data.model_data = nullptr;
  835. }
  836. }
  837. return ret;
  838. }
  839. /**
  840. * @ingroup ge
  841. * @brief Load model from offline model memory data
  842. * @param [in] domi::ModelData &model_data: Offline model data
  843. void *dev_ptr: Input/Output memory start address
  844. size_t memsize: Input/Output memory length
  845. void *weight_ptr: Weight memory start address
  846. size_t weightsize: Weight memory length
  847. * @param [out] uint32_t &model_id: identification after model loading
  848. * @return SUCCESS handle successfully / others handle failed
  849. */
  850. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  851. void *weight_ptr, size_t weight_size) {
  852. if (!isInit_) {
  853. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  854. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not inited yet!");
  855. return ACL_ERROR_GE_EXEC_NOT_INIT;
  856. }
  857. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  858. }
  859. /**
  860. * @ingroup ge
  861. * @brief Load task list from ModelData with queue.
  862. * @param [out] model_id: model id allocate from manager.
  863. * @param [in] ge_model_data: Model data load from offline model.
  864. * @param [in] input_queue_ids: input queue ids create from user.
  865. * @param [in] output_queue_ids: input queue ids create from user.
  866. * @return: 0 for success / others for fail
  867. */
  868. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  869. const std::vector<uint32_t> &input_queue_ids,
  870. const std::vector<uint32_t> &output_queue_ids) {
  871. GELOGI("Load model with queue begin.");
  872. if (!isInit_) {
  873. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  874. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  875. return ACL_ERROR_GE_EXEC_NOT_INIT;
  876. }
  877. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  878. }
  879. /**
  880. * @ingroup ge
  881. * @brief Synchronous execution of offline model(Do not create thread)
  882. * @param [in] uint32_t model_id: Model ID to execute
  883. void* stream: stream to execute
  884. const domi::InputData *input_data: Model input data
  885. bool async_mode: is asynchronize mode.
  886. * @param [out] domi::OutputData *output_data: Model output data
  887. * @return SUCCESS handle successfully / others handle failed
  888. */
  889. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  890. ge::RunModelData &run_output_data, bool async_mode) {
  891. std::vector<GeTensorDesc> input_desc = {};
  892. std::vector<GeTensorDesc> output_desc = {};
  893. return ExecModel(model_id, stream, run_input_data, input_desc, run_output_data, output_desc, async_mode);
  894. }
  895. /**
  896. * @ingroup ge
  897. * @brief Synchronous execution of offline model(Do not create thread)
  898. * @param [in] uint32_t model_id: Model ID to execute
  899. void* stream: stream to execute
  900. const domi::InputData *input_data: Model input data
  901. const std::vector<GeTensorDesc> &input_desc: Description of model input data
  902. bool async_mode: is asynchronize mode
  903. * @param [out] domi::OutputData *output_data: Model output data
  904. * @param [out] std::vector<GeTensorDesc> &output_desc: Description of model output data
  905. * @return SUCCESS handle successfully / others handle failed
  906. */
  907. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  908. const std::vector<GeTensorDesc> &input_desc, ge::RunModelData &run_output_data,
  909. std::vector<GeTensorDesc> &output_desc, bool async_mode) {
  910. if (!isInit_) {
  911. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  912. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  913. return ACL_ERROR_GE_EXEC_NOT_INIT;
  914. }
  915. InputData input_data;
  916. OutputData output_data;
  917. GetDomiInputData(run_input_data, input_data);
  918. GetDomiOutputData(run_output_data, output_data);
  919. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  920. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  921. std::vector<std::vector<int64_t>> batch_info;
  922. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  923. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  924. if (ret != SUCCESS) {
  925. REPORT_CALL_ERROR("E19999", "get dynamic batch info failed, model id:%u.", model_id);
  926. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  927. return ret;
  928. }
  929. if (!batch_info.empty()) {
  930. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  931. }
  932. }
  933. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, input_desc, output_data, output_desc);
  934. }
  935. /**
  936. * @ingroup ge
  937. * @brief Get weight memory size from model file
  938. * @param [in] const std::string &path: Offline model file path
  939. * @param [out] size_t &mem_size Execution memory size
  940. size_t &weight_size Weight memory space size
  941. * @return SUCCESS handle successfully / others handle failed
  942. */
  943. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  944. GELOGI("Get memory and weight size from file begin.");
  945. if (!isInit_) {
  946. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  947. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  948. return ACL_ERROR_GE_EXEC_NOT_INIT;
  949. }
  950. ModelData model;
  951. Status ret = ge::GraphLoader::LoadDataFromFile(path, 0, model);
  952. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  953. REPORT_CALL_ERROR("E19999", "load data from file failed, ret = %d", ret);
  954. GELOGE(ret, "[Load][Data] from file failed. ret = %d", ret);
  955. return ret;
  956. }
  957. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  958. delete[] static_cast<char *>(model.model_data);
  959. model.model_data = nullptr;
  960. return ret;
  961. }
  962. /**
  963. * @ingroup ge
  964. * @brief Get weight memory size from model file
  965. * @param [in] const void *model_data Offline model buffer
  966. size_t model_size Offline model buffer length
  967. * @param [out] size_t &mem_size Execution memory size
  968. size_t &weight_size Weight memory space size
  969. * @return SUCCESS handle successfully / others handle failed
  970. */
  971. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  972. size_t &weight_size) {
  973. GELOGI("Get memory and weight size from data begin.");
  974. if (!isInit_) {
  975. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  976. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  977. return ACL_ERROR_GE_EXEC_NOT_INIT;
  978. }
  979. if (model_data == nullptr) {
  980. REPORT_INNER_ERROR("E19999", "param model_data is nullptr, check invalid!");
  981. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "[Check][Param] invalid model data!");
  982. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  983. }
  984. ModelData model;
  985. model.model_data = const_cast<void *>(model_data);
  986. model.model_len = static_cast<uint32_t>(model_size);
  987. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  988. }
  989. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  990. SingleOp **single_op) {
  991. return LoadSingleOpV2(model_name, modelData, stream, single_op, 0);
  992. }
  993. Status GeExecutor::LoadSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  994. SingleOp **single_op, const uint64_t model_id) {
  995. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op, model_id);
  996. }
  997. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  998. DynamicSingleOp **single_op) {
  999. return LoadDynamicSingleOpV2(model_name, modelData, stream, single_op, 0);
  1000. }
  1001. Status GeExecutor::LoadDynamicSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  1002. DynamicSingleOp **single_op, const uint64_t model_id) {
  1003. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op, model_id);
  1004. }
  1005. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  1006. std::vector<DataBuffer> &outputs) {
  1007. if (executor == nullptr) {
  1008. REPORT_INNER_ERROR("E19999", "Param executor is nullptr, check invalid");
  1009. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] param executor is nullptr");
  1010. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1011. }
  1012. return executor->ExecuteAsync(inputs, outputs);
  1013. }
  1014. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  1015. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  1016. vector<DataBuffer> &outputs) {
  1017. GE_CHECK_NOTNULL(executor);
  1018. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  1019. }
  1020. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  1021. ModelManager::GetInstance()->ClearAicpuSo();
  1022. return SingleOpManager::GetInstance().ReleaseResource(stream);
  1023. }
  1024. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  1025. auto model_manager = ModelManager::GetInstance();
  1026. GE_CHECK_NOTNULL(model_manager);
  1027. auto davinci_model = model_manager->GetModel(model_id);
  1028. if (davinci_model == nullptr) {
  1029. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID,
  1030. "[Get][Model] failed, Model id:%u is invaild or model is not loaded.", model_id);
  1031. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  1032. }
  1033. device_id = davinci_model->GetDeviceId();
  1034. return SUCCESS;
  1035. }
  1036. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  1037. std::vector<std::vector<int64_t>> batch_info;
  1038. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  1039. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  1040. if (ret != SUCCESS) {
  1041. GELOGE(ret, "[Get][DynamicBatchInfo] failed. ret = %d, model id:%u", ret, model_id);
  1042. return ret;
  1043. }
  1044. if (batch_info.empty()) {
  1045. shape_count = kStaticBatchInfoSize;
  1046. } else {
  1047. shape_count = batch_info.size();
  1048. }
  1049. return SUCCESS;
  1050. }
  1051. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  1052. GELOGI("Begin to GetOrigInputInfo.");
  1053. if (!isInit_) {
  1054. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  1055. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  1056. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1057. }
  1058. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  1059. if (ret != SUCCESS) {
  1060. REPORT_CALL_ERROR("E19999", "Get Orig Input Info failed, model id:%u.", model_id);
  1061. GELOGE(ret, "[Get][OrigInputInfo] failed, model id:%u.", model_id);
  1062. return ret;
  1063. }
  1064. GELOGI("GetOrigInputInfo succ.");
  1065. return SUCCESS;
  1066. }
  1067. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  1068. std::vector<InputOutputDims> &input_dims,
  1069. std::vector<InputOutputDims> &output_dims) {
  1070. GELOGI("Begin to GetAllAippInputOutputDims.");
  1071. if (!isInit_) {
  1072. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  1073. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  1074. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1075. }
  1076. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  1077. if (ret != SUCCESS) {
  1078. REPORT_CALL_ERROR("E19999", "Get All Aipp Input Output Dims failed, model id:%u.", model_id);
  1079. GELOGE(ret, "[Get][AllAippInputOutputDims] failed, model id:%u.", model_id);
  1080. return ret;
  1081. }
  1082. GELOGI("GetAllAippInputOutputDims succ.");
  1083. return SUCCESS;
  1084. }
  1085. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  1086. GELOGI("Begin to GetOpDescInfo.");
  1087. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  1088. if (ret != SUCCESS) {
  1089. REPORT_CALL_ERROR("E19999", "get opdesc info failed, device_id:%u, stream_id:%u, task_id:%u.",
  1090. device_id, stream_id, task_id);
  1091. GELOGE(ret, "[Get][OpDescInfo] failed, device_id:%u, stream_id:%u, task_id:%u.",
  1092. device_id, stream_id, task_id);
  1093. return ret;
  1094. }
  1095. GELOGI("GetOpDescInfo succ.");
  1096. return SUCCESS;
  1097. }
  1098. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  1099. GELOGI("Start to set dump config");
  1100. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  1101. if (ret != SUCCESS) {
  1102. GELOGE(ret, "[Set][DumpConf] failed, ret:%d", ret);
  1103. return ret;
  1104. }
  1105. GELOGI("Set dump config successfully");
  1106. return SUCCESS;
  1107. }
  1108. } // namespace ge

图引擎模块（GE）是MindSpore的一个子模块，其代码由C++实现，位于前端模块ME和底层硬件之间，起到承接作用。图引擎模块以ME下发的图作为输入，然后进行一系列的深度图优化操作，最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点，做了特定的优化工作，以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时，GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成，详细的架构图如下所示。