You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

ge_executor.cc 42 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <cce/compiler_stub.h>
  19. #include <ctime>
  20. #include <iostream>
  21. #include "common/debug/log.h"
  22. #include "common/ge/ge_util.h"
  23. #include "common/helper/model_helper.h"
  24. #include "common/profiling/profiling_manager.h"
  25. #include "common/dump/dump_manager.h"
  26. #include "common/util.h"
  27. #include "framework/common/debug/ge_log.h"
  28. #include "framework/common/util.h"
  29. #include "graph/execute/graph_execute.h"
  30. #include "graph/load/graph_loader.h"
  31. #include "graph/load/new_model_manager/davinci_model_parser.h"
  32. #include "graph/load/new_model_manager/model_manager.h"
  33. #include "graph/manager/graph_mem_allocator.h"
  34. #include "graph/model.h"
  35. #include "graph/utils/graph_utils.h"
  36. #include "mmpa/mmpa_api.h"
  37. #include "single_op/single_op_manager.h"
  38. #include "graph/manager/graph_var_manager.h"
  39. #include "graph/load/new_model_manager/davinci_model.h"
  40. #include "opskernel_manager/ops_kernel_builder_manager.h"
  41. using std::string;
  42. using std::vector;
  43. namespace {
  44. const size_t kDynamicBatchSizeVecSize = 1;
  45. const size_t kStaticBatchInfoSize = 1;
  46. const size_t kDynamicImageSizeVecSize = 2;
  47. const size_t kDynamicImageSizeInputSize = 2;
  48. const char *const kBatchLabel = "Batch_";
  49. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  50. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  51. const std::vector<uint32_t> &formats) {
  52. uint32_t idx = 0;
  53. for (auto desc_item : domi_descs) {
  54. ge::TensorDesc ge_desc;
  55. ge_desc.SetName(desc_item.name);
  56. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  57. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  58. std::vector<int64_t> shape_dims;
  59. for (auto dim : desc_item.shape_info.dims) {
  60. shape_dims.push_back(dim);
  61. }
  62. ge::Shape ge_shape(shape_dims);
  63. ge_desc.SetShape(ge_shape);
  64. ge_desc.SetSize(desc_item.size);
  65. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  66. ge_descs.emplace_back(ge_desc);
  67. ++idx;
  68. }
  69. }
  70. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  71. inputs.index = input_data.index;
  72. inputs.model_id = input_data.modelId;
  73. inputs.timestamp = input_data.timestamp;
  74. inputs.timeout = input_data.timeout;
  75. inputs.request_id = input_data.request_id;
  76. for (const auto &data_item : input_data.blobs) {
  77. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  78. inputs.blobs.emplace_back(dataBuf);
  79. }
  80. }
  81. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  82. outputs.index = output_data.index;
  83. outputs.model_id = output_data.modelId;
  84. for (const auto &data_item : output_data.blobs) {
  85. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  86. outputs.blobs.emplace_back(dataBuf);
  87. }
  88. }
  89. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  90. ge::InputData &inputs) {
  91. inputs.is_dynamic_batch = true;
  92. std::string batch_label;
  93. size_t match_idx = 0;
  94. for (size_t i = 0; i < batch_info.size(); ++i) {
  95. // dynamic_dims
  96. if (input_data.dynamic_dims.size() != 0) {
  97. bool is_match = true;
  98. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  99. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  100. is_match = false;
  101. break;
  102. }
  103. }
  104. if (is_match) {
  105. match_idx = i;
  106. break;
  107. }
  108. // dynamic_batch_size
  109. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  110. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  111. match_idx = i;
  112. break;
  113. // dynamic_image_size
  114. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  115. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  116. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  117. match_idx = i;
  118. break;
  119. }
  120. }
  121. batch_label = kBatchLabel + std::to_string(match_idx);
  122. inputs.batch_label = batch_label;
  123. GELOGI("current batch label:%s", batch_label.c_str());
  124. }
  125. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  126. if (batch_info.empty()) {
  127. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  128. return false;
  129. }
  130. for (auto batch : batch_info) {
  131. if (batch.size() != kDynamicBatchSizeVecSize) {
  132. GELOGE(ge::FAILED, "Dynamic batch param num is %zu, current batch size is %zu.", kDynamicBatchSizeVecSize,
  133. batch.size());
  134. return false;
  135. }
  136. if (batch[0] == static_cast<int64_t>(batch_size)) {
  137. return true;
  138. }
  139. }
  140. GELOGE(ge::FAILED, "Dynamic batch %lu can not match the gear of model.", batch_size);
  141. return false;
  142. }
  143. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  144. const vector<std::vector<int64_t>> &batch_info) {
  145. if (batch_info.empty()) {
  146. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  147. return false;
  148. }
  149. for (auto resolution : batch_info) {
  150. if (resolution.size() != kDynamicImageSizeVecSize) {
  151. GELOGE(ge::FAILED, "Dynamic resolution param num is %zu, current resolution size is %zu.",
  152. kDynamicImageSizeVecSize, resolution.size());
  153. return false;
  154. }
  155. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  156. return true;
  157. }
  158. }
  159. GELOGE(ge::FAILED, "Dynamic resolution (%lu,%lu) can not match the gear of model.", image_height, image_width);
  160. return false;
  161. }
  162. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims, const vector<vector<int64_t>> &batch_info) {
  163. if (batch_info.empty()) {
  164. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  165. return false;
  166. }
  167. bool find_match = false;
  168. for (auto resolution : batch_info) {
  169. if (cur_dynamic_dims.size() != resolution.size()) {
  170. GELOGE(ge::FAILED, "Cur dynamic dims param num is %zu, current resolution size is %zu.", cur_dynamic_dims.size(),
  171. resolution.size());
  172. return false;
  173. }
  174. bool flag = true;
  175. for (std::size_t i = 0; i < resolution.size(); ++i) {
  176. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  177. flag = false;
  178. break;
  179. }
  180. }
  181. if (flag) {
  182. find_match = true;
  183. break;
  184. }
  185. }
  186. if (!find_match) {
  187. GELOGE(ge::FAILED, "choose dynamic dims can not match the gear of model.");
  188. }
  189. return find_match;
  190. }
  191. } // namespace
  192. namespace ge {
// Definition of the static initialization flag; GeExecutor::Initialize() sets it to true on success
// and the other entry points check it before doing any work.
bool GeExecutor::isInit_ = false;
  194. class ModelListenerAdapter : public ModelListener {
  195. public:
  196. domi::Status OnComputeDone(uint32_t model_id, uint32_t dataIndex, uint32_t resultCode,
  197. std::vector<ge::OutputTensorInfo> &outputs) {
  198. if (listener == nullptr) {
  199. GELOGE(ge::FAILED, "listener is null.");
  200. return FAILED;
  201. }
  202. return listener->OnComputeDone(model_id, dataIndex, resultCode, outputs);
  203. }
  204. std::shared_ptr<ge::ModelListener> listener;
  205. };
  206. GeExecutor::GeExecutor() {}
  207. Status GeExecutor::Initialize() {
  208. GELOGI("Init GeExecutor begin.");
  209. if (isInit_) {
  210. GELOGW("Already initialized, no need to be initialized again.");
  211. return ge::SUCCESS;
  212. }
  213. std::vector<rtMemType_t> mem_type(1, RT_MEMORY_HBM);
  214. mem_type.push_back(RT_MEMORY_P2P_DDR);
  215. auto ret = MemManager::Instance().Initialize(mem_type);
  216. if (ret != SUCCESS) {
  217. GELOGE(ret, "Memory Manager init failed.");
  218. return ret;
  219. }
  220. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  221. "Failed to initialize OpsKernelBuilders");
  222. // Start profiling
  223. Options profiling_options;
  224. profiling_options.device_id = 0;
  225. profiling_options.job_id = "";
  226. ProfilingManager::Instance().Init(profiling_options);
  227. isInit_ = true;
  228. GELOGI("Init GeExecutor over.");
  229. return ge::SUCCESS;
  230. }
  231. Status GeExecutor::Finalize() {
  232. GELOGI("Uninit GeExecutor begin.");
  233. if (isInit_ == false) {
  234. GELOGW("GeExecutor has not been initialized.");
  235. return ge::SUCCESS;
  236. }
  237. (void)OpsKernelBuilderManager::Instance().Finalize();
  238. // Stop profiling
  239. if (ProfilingManager::Instance().ProfilingOn()) {
  240. ProfilingManager::Instance().StopProfiling();
  241. ProfilingManager::Instance().PluginUnInit(GE_PROFILING_MODULE);
  242. }
  243. GELOGI("Uninit GeExecutor over.");
  244. return ge::SUCCESS;
  245. }
  246. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  247. uint64_t batch_size) {
  248. if (dynamic_input_addr == nullptr) {
  249. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  250. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  251. }
  252. uint64_t size = sizeof(uint32_t);
  253. if (length < size) {
  254. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size [%lu] is less than [%lu]!", length, size);
  255. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  256. }
  257. if (length >= sizeof(uint64_t)) {
  258. size = sizeof(uint64_t);
  259. }
  260. // Verify whether the input dynamic batch matches the model gear
  261. std::vector<std::vector<int64_t>> batch_info;
  262. std::vector<uint64_t> batch_num{batch_size};
  263. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  264. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  265. if (ret != SUCCESS) {
  266. GELOGE(ret, "Get dynamic input info failed.");
  267. return ret;
  268. }
  269. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  270. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  271. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  272. }
  273. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  274. if (ret != SUCCESS) {
  275. GELOGE(ret, "Set dynamic size failed");
  276. return ret;
  277. }
  278. // memcpy dynamic_batch_size from host to device
  279. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  280. if (rt_ret != RT_ERROR_NONE) {
  281. GELOGE(rt_ret, "memcpy dynamic batch input data failed! ret: 0x%X", rt_ret);
  282. return RT_ERROR_TO_GE_STATUS(rt_ret);
  283. }
  284. return SUCCESS;
  285. }
  286. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  287. uint64_t image_height, uint64_t image_width) {
  288. if (dynamic_input_addr == nullptr) {
  289. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  290. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  291. }
  292. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  293. if (length < dynamic_input_size) {
  294. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size [%lu] is less than [%lu]!", length,
  295. dynamic_input_size);
  296. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  297. }
  298. uint64_t size = sizeof(uint32_t);
  299. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  300. size = sizeof(uint64_t);
  301. }
  302. // Verify whether the input dynamic resolution matches the model gear
  303. std::vector<std::vector<int64_t>> batch_info;
  304. std::vector<uint64_t> batch_num{image_height, image_width};
  305. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  306. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  307. if (ret != SUCCESS) {
  308. GELOGE(ret, "Get dynamic input info failed.");
  309. return ret;
  310. }
  311. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  312. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  313. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  314. }
  315. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  316. if (ret != SUCCESS) {
  317. GELOGE(ret, "Set dynamic size failed");
  318. return ret;
  319. }
  320. // Memcpy dynamic resolution height from host to device
  321. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  322. if (rt_ret != RT_ERROR_NONE) {
  323. GELOGE(rt_ret, "memcpy dynamic resolution input data failed! ret: 0x%X", rt_ret);
  324. return RT_ERROR_TO_GE_STATUS(rt_ret);
  325. }
  326. uint64_t remain_size = length - size;
  327. // Memcpy dynamic resolution width from host to device
  328. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size), remain_size,
  329. &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  330. if (rt_ret != RT_ERROR_NONE) {
  331. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  332. return RT_ERROR_TO_GE_STATUS(rt_ret);
  333. }
  334. return SUCCESS;
  335. }
  336. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  337. const vector<uint64_t> &dynamic_dims) {
  338. if (dynamic_input_addr == nullptr) {
  339. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  340. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  341. }
  342. vector<uint64_t> cur_dynamic_dims;
  343. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  344. if (ret != SUCCESS) {
  345. GELOGE(ret, "Set cur gear dynamic dims failed");
  346. return ret;
  347. }
  348. std::vector<std::vector<int64_t>> batch_info;
  349. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  350. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  351. if (ret != SUCCESS) {
  352. GELOGE(ret, "Get dynamic input info failed.");
  353. return ret;
  354. }
  355. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  356. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  357. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  358. }
  359. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  360. if (ret != SUCCESS) {
  361. GELOGE(ret, "Set dynamic size failed");
  362. return ret;
  363. }
  364. size_t dynamic_dim_num = cur_dynamic_dims.size();
  365. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  366. if (length < dynamic_input_size) {
  367. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size [%lu] is less than [%lu]!", length,
  368. dynamic_input_size);
  369. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  370. }
  371. uint64_t size = sizeof(uint32_t);
  372. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  373. size = sizeof(uint64_t);
  374. }
  375. rtError_t rt_ret;
  376. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  377. // Memcpy dynamic dim[i] from host to device
  378. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  379. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  380. if (rt_ret != RT_ERROR_NONE) {
  381. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  382. return RT_ERROR_TO_GE_STATUS(rt_ret);
  383. }
  384. }
  385. return SUCCESS;
  386. }
  387. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  388. vector<uint64_t> &cur_dynamic_dims) {
  389. cur_dynamic_dims.clear();
  390. vector<ge::TensorDesc> input_desc;
  391. vector<ge::TensorDesc> output_desc;
  392. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  393. if (ret != ge::SUCCESS) {
  394. GELOGE(ret, "GetModelDescInfo failed.");
  395. return ret;
  396. }
  397. vector<string> user_designate_shape_order;
  398. vector<int64_t> all_data_dims;
  399. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  400. if (ret != ge::SUCCESS) {
  401. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  402. return ret;
  403. }
  404. for (auto &data_name : user_designate_shape_order) {
  405. for (auto &desc : input_desc) {
  406. if (desc.GetName() == data_name) {
  407. for (auto dim : desc.GetShape().GetDims()) {
  408. all_data_dims.push_back(dim);
  409. }
  410. break;
  411. }
  412. }
  413. }
  414. if (dynamic_dims.size() != all_data_dims.size()) {
  415. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  416. "Dynamic input size [%lu] is not equal with all data dims size [%lu]!", dynamic_dims.size(),
  417. all_data_dims.size());
  418. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  419. }
  420. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  421. if (all_data_dims[i] < 0) {
  422. cur_dynamic_dims.push_back(dynamic_dims[i]);
  423. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  424. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Static dims should be same, index: %zu value: %d should be %d",
  425. i, dynamic_dims[i], all_data_dims[i]);
  426. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  427. }
  428. }
  429. return SUCCESS;
  430. }
  431. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  432. GELOGI("Begin to get current shape");
  433. if (!isInit_) {
  434. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  435. return ACL_ERROR_GE_EXEC_NOT_INIT;
  436. }
  437. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  438. if (ret != SUCCESS) {
  439. GELOGE(ret, "Get current shape failed");
  440. return ret;
  441. }
  442. return SUCCESS;
  443. }
  444. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  445. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  446. const kAippDynamicPara &aippParms) {
  447. GELOGI("Enter to SetDynamicAippData.");
  448. if (dynamic_input_addr == nullptr) {
  449. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic aipp input addr is nullptr!");
  450. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  451. }
  452. if (aippBatchPara.empty()) {
  453. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "aippBatchPara is empty.");
  454. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  455. }
  456. uint64_t batch_num = aippBatchPara.size();
  457. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  458. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  459. GELOGI(
  460. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  461. "batch num is %lu, struct_len is %lu",
  462. model_id, length, batch_num, struct_len);
  463. if (struct_len > length) {
  464. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  465. "input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]", struct_len, length);
  466. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  467. }
  468. // Memcpy real kAippDynamicBatchPara from host to device
  469. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  470. if (rt_ret != RT_ERROR_NONE) {
  471. GELOGE(rt_ret, "memcpy real_aippParms_size failed! ret: 0x%X", rt_ret);
  472. return RT_ERROR_TO_GE_STATUS(rt_ret);
  473. }
  474. uint64_t remain_len = length - real_aippParms_size;
  475. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  476. for (uint64_t i = 0; i < batch_num; ++i) {
  477. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  478. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  479. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  480. if (rt_ret != RT_ERROR_NONE) {
  481. GELOGE(rt_ret, "memcpy kAippDynamicBatchPara input data failed! ret: 0x%X", rt_ret);
  482. return RT_ERROR_TO_GE_STATUS(rt_ret);
  483. }
  484. }
  485. return SUCCESS;
  486. }
  487. // Load model
  488. Status GeExecutor::LoadModelOffline(uint32_t &model_id, const std::string &path, const std::string &key,
  489. int32_t priority, std::shared_ptr<ge::ModelListener> listener) {
  490. GELOGI("load model offline begin.");
  491. if (!isInit_) {
  492. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  493. return ACL_ERROR_GE_EXEC_NOT_INIT;
  494. }
  495. string filePath = RealPath(path.c_str());
  496. if (filePath.empty()) {
  497. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID, "File path is invalid. please check your text file '%s'.",
  498. path.c_str());
  499. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  500. }
  501. std::shared_ptr<ModelListenerAdapter> listener_adapter = MakeShared<ModelListenerAdapter>();
  502. if (listener_adapter == nullptr) {
  503. GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "ModelListenerAdapter make shared failed!");
  504. return ACL_ERROR_GE_MEMORY_ALLOCATION;
  505. }
  506. listener_adapter->listener = listener;
  507. Status ret = GraphLoader::LoadModelFromFile(path, key, priority, listener_adapter, model_id);
  508. if (ret != SUCCESS) {
  509. GELOGE(ret, "[GeExecutor] LoadModelFromFile failed");
  510. return ACL_ERROR_GE_LOAD_MODEL;
  511. }
  512. return SUCCESS;
  513. }
  514. Status GeExecutor::LoadModel(uint32_t &model_id, const ModelData &model_data,
  515. std::shared_ptr<ge::ModelListener> listener) {
  516. GELOGI("Load model begin.");
  517. if (!isInit_) {
  518. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  519. return ACL_ERROR_GE_EXEC_NOT_INIT;
  520. }
  521. std::shared_ptr<ModelListenerAdapter> listener_adapter = MakeShared<ModelListenerAdapter>();
  522. if (listener_adapter == nullptr) {
  523. GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "ModelListenerAdapter make shared failed!");
  524. return ACL_ERROR_GE_MEMORY_ALLOCATION;
  525. }
  526. listener_adapter->listener = listener;
  527. Status ret = GraphLoader::LoadModel(model_data, listener_adapter, model_id);
  528. if (ret != SUCCESS) {
  529. GELOGE(ret, "[GeExecutor] LoadModel failed.");
  530. return ACL_ERROR_GE_LOAD_MODEL;
  531. }
  532. return ret;
  533. }
  534. Status GeExecutor::UnloadModel(uint32_t model_id) {
  535. GELOGD("unload model %u begin.", model_id);
  536. if (!isInit_) {
  537. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  538. return ACL_ERROR_GE_EXEC_NOT_INIT;
  539. }
  540. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  541. if (ret != SUCCESS) {
  542. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  543. return ACL_ERROR_GE_INTERNAL_ERROR;
  544. }
  545. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  546. if (davinci_model != nullptr) {
  547. uint64_t session_id = davinci_model->GetSessionId();
  548. VarManagerPool::Instance().RemoveVarManager(session_id);
  549. }
  550. ret = GraphLoader::UnloadModel(model_id);
  551. if (ret != SUCCESS) {
  552. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  553. return ACL_ERROR_GE_UNLOAD_MODEL;
  554. }
  555. return SUCCESS;
  556. }
  557. Status GeExecutor::RunModel(const ge::RunModelData &input_data, ge::RunModelData &output_data) {
  558. GELOGI("run model begin.");
  559. if (!isInit_) {
  560. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  561. return ACL_ERROR_GE_EXEC_NOT_INIT;
  562. }
  563. InputData inputs;
  564. GetDomiInputData(input_data, inputs);
  565. OutputData outputs;
  566. GetDomiOutputData(output_data, outputs);
  567. return GraphExecutor::DataInput(inputs, outputs);
  568. }
  569. // Get input and output descriptor
  570. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  571. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  572. if (!isInit_) {
  573. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  574. return ACL_ERROR_GE_EXEC_NOT_INIT;
  575. }
  576. std::vector<InputOutputDescInfo> input_desc_infos;
  577. std::vector<InputOutputDescInfo> output_desc_infos;
  578. std::vector<uint32_t> input_formats;
  579. std::vector<uint32_t> output_formats;
  580. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  581. output_formats, new_model_desc);
  582. if (ret != domi::SUCCESS) {
  583. GELOGE(ret, "GetInputOutputDescInfo failed. ret = %u", ret);
  584. return ACL_ERROR_GE_GET_TENSOR_INFO;
  585. }
  586. if (input_formats.size() != input_desc_infos.size()) {
  587. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "input_formats size %zu is not equal to input_desc_infos size %zu.",
  588. input_formats.size(), input_desc_infos.size());
  589. return ACL_ERROR_GE_PARAM_INVALID;
  590. }
  591. if (output_formats.size() != output_desc_infos.size()) {
  592. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "output_formats size %zu is not equal to output_desc_infos size %zu.",
  593. output_formats.size(), output_desc_infos.size());
  594. return ACL_ERROR_GE_PARAM_INVALID;
  595. }
  596. // Transfer data to TensorDesc
  597. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  598. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  599. return ge::SUCCESS;
  600. }
  601. ///
  602. /// @ingroup ge
  603. /// @brief Get dynamic batch_info
  604. /// @param [in] model_id
  605. /// @param [out] batch_info
  606. /// @param [out] dynamic_type
  607. /// @return execute result
  608. ///
  609. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  610. int32_t &dynamic_type) {
  611. if (!isInit_) {
  612. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  613. return ACL_ERROR_GE_EXEC_NOT_INIT;
  614. }
  615. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  616. if (ret != SUCCESS) {
  617. GELOGE(ret, "GetDynamicBatchInfo failed.");
  618. return ret;
  619. }
  620. return SUCCESS;
  621. }
  622. ///
  623. /// @ingroup ge
  624. /// @brief Get combined dynamic dims info
  625. /// @param [in] model_id
  626. /// @param [out] batch_info
  627. /// @return execute result
  628. ///
  629. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  630. GELOGI("Begin to get combined dynamic dims info.");
  631. if (!isInit_) {
  632. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  633. return ACL_ERROR_GE_EXEC_NOT_INIT;
  634. }
  635. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  636. if (ret != SUCCESS) {
  637. GELOGE(ret, "GetCombinedDynamicDims failed.");
  638. return ret;
  639. }
  640. GELOGI("Get combined dynamic dims succ.");
  641. return SUCCESS;
  642. }
  643. ///
  644. /// @ingroup ge
  645. /// @brief Get user designeate shape order
  646. /// @param [in] model_id
  647. /// @param [out] user_designate_shape_order
  648. /// @return execute result
  649. ///
  650. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  651. if (!isInit_) {
  652. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  653. return ACL_ERROR_GE_EXEC_NOT_INIT;
  654. }
  655. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  656. if (ret != SUCCESS) {
  657. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  658. return ret;
  659. }
  660. return SUCCESS;
  661. }
  662. ///
  663. /// @ingroup ge
  664. /// @brief Get AIPP input format
  665. /// @param [in] model_id
  666. /// @param [in] index
  667. /// @param [out] input_format
  668. /// @return execute result
  669. ///
  670. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  671. GELOGI("Begin to GetAIPPInfo.");
  672. if (!isInit_) {
  673. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  674. return ACL_ERROR_GE_EXEC_NOT_INIT;
  675. }
  676. Status ret = GraphExecutor::GetAIPPInfo(model_id, index, aipp_info);
  677. if (ret != SUCCESS) {
  678. GELOGW("GetAIPPInfo is not success.");
  679. return ret;
  680. }
  681. GELOGI("GetAIPPInfo succ.");
  682. return SUCCESS;
  683. }
  684. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  685. GELOGI("Begin to get aipp type.");
  686. if (!isInit_) {
  687. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  688. return ACL_ERROR_GE_EXEC_NOT_INIT;
  689. }
  690. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  691. if (ret != SUCCESS) {
  692. GELOGW("Get aipp type is not success.");
  693. return ret;
  694. }
  695. GELOGI("Get aipp type success.");
  696. return SUCCESS;
  697. }
  698. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  699. if (!isInit_) {
  700. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  701. return ACL_ERROR_GE_EXEC_NOT_INIT;
  702. }
  703. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  704. if (ret != SUCCESS) {
  705. GELOGE(ret, "Get dynamic batch output shape info failed.");
  706. return ret;
  707. }
  708. return SUCCESS;
  709. }
  710. Status GeExecutor::GetModelDescInfoForZeroCopy(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  711. std::vector<TensorDesc> &output_desc) {
  712. GELOGI("get model desc info for zero copy begin.");
  713. if (!isInit_) {
  714. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  715. return ACL_ERROR_GE_EXEC_NOT_INIT;
  716. }
  717. std::vector<InputOutputDescInfo> input_desc_infos;
  718. std::vector<InputOutputDescInfo> output_desc_infos;
  719. std::vector<uint32_t> input_formats;
  720. std::vector<uint32_t> output_formats;
  721. Status ret = GraphExecutor::GetInputOutputDescInfoForZeroCopy(model_id, input_desc_infos, output_desc_infos,
  722. input_formats, output_formats);
  723. if (ret != domi::SUCCESS) {
  724. GELOGE(ret, "Get DescInfo from zero copy failed. ret = %u", ret);
  725. return ACL_ERROR_GE_GET_TENSOR_INFO;
  726. }
  727. if (input_formats.size() != input_desc_infos.size()) {
  728. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "input_formats.size() != input_desc_infos.size().");
  729. return ACL_ERROR_GE_PARAM_INVALID;
  730. }
  731. if (output_formats.size() != output_desc_infos.size()) {
  732. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "output_formats.size() != output_desc_infos.size().");
  733. return ACL_ERROR_GE_PARAM_INVALID;
  734. }
  735. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  736. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  737. GELOGI("get model desc info from zero copy end.");
  738. return ge::SUCCESS;
  739. }
  740. Status GeExecutor::CommandHandle(const Command &command) {
  741. Status ret = GraphLoader::CommandHandle(command);
  742. if (ret != SUCCESS) {
  743. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "CommandHandle: Command Handle failed.");
  744. return ACL_ERROR_GE_COMMAND_HANDLE;
  745. }
  746. return SUCCESS;
  747. }
  748. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  749. GELOGI("Get max used memory begin.");
  750. if (!isInit_) {
  751. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  752. return ACL_ERROR_GE_EXEC_NOT_INIT;
  753. }
  754. uint64_t max_mem_size = 0;
  755. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  756. max_size = static_cast<uint32_t>(max_mem_size);
  757. return ret;
  758. }
  759. /**
  760. * @ingroup ge
  761. * @brief Load data from model file to memory
  762. * @param [in] const std::string &path: Offline model file path
  763. * @param [out] domi::ModelData &model_data: Offline model memory data
  764. * @return SUCCESS handle successfully / others handle failed
  765. */
  766. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  767. GELOGI("Load data from file begin.");
  768. if (!isInit_) {
  769. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  770. return ACL_ERROR_GE_EXEC_NOT_INIT;
  771. }
  772. string filePath = RealPath(path.c_str());
  773. if (filePath.empty()) {
  774. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID, "File path is invalid. please check your text file '%s'.",
  775. path.c_str());
  776. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  777. }
  778. GELOGI("load modelData from file: %s.", path.c_str());
  779. std::string key_path;
  780. int32_t priority = 0;
  781. Status ret = GraphLoader::LoadDataFromFile(path, key_path, priority, model_data);
  782. if (ret != SUCCESS) {
  783. if (model_data.model_data != nullptr) {
  784. delete[] static_cast<char *>(model_data.model_data);
  785. model_data.model_data = nullptr;
  786. }
  787. }
  788. return ret;
  789. }
  790. /**
  791. * @ingroup ge
  792. * @brief Load model from offline model memory data
  793. * @param [in] domi::ModelData &model_data: Offline model data
  794. void *dev_ptr: Input/Output memory start address
  795. size_t memsize: Input/Output memory length
  796. void *weight_ptr: Weight memory start address
  797. size_t weightsize: Weight memory length
  798. * @param [out] uint32_t &model_id: identification after model loading
  799. * @return SUCCESS handle successfully / others handle failed
  800. */
  801. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  802. void *weight_ptr, size_t weight_size) {
  803. if (!isInit_) {
  804. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  805. return ACL_ERROR_GE_EXEC_NOT_INIT;
  806. }
  807. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  808. }
  809. /**
  810. * @ingroup ge
  811. * @brief Load task list from ModelData with queue.
  812. * @param [out] model_id: model id allocate from manager.
  813. * @param [in] ge_model_data: Model data load from offline model.
  814. * @param [in] input_queue_ids: input queue ids create from user.
  815. * @param [in] output_queue_ids: input queue ids create from user.
  816. * @return: 0 for success / others for fail
  817. */
  818. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  819. const std::vector<uint32_t> &input_queue_ids,
  820. const std::vector<uint32_t> &output_queue_ids) {
  821. GELOGI("Load model with queue begin.");
  822. if (!isInit_) {
  823. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  824. return ACL_ERROR_GE_EXEC_NOT_INIT;
  825. }
  826. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  827. }
  828. /**
  829. * @ingroup ge
  830. * @brief Synchronous execution of offline model(Do not create thread)
  831. * @param [in] uint32_t model_id: Model ID to execute
  832. void* stream: stream to execute
  833. const domi::InputData *input_data: Model input data
  834. bool async_mode: is asynchronize mode.
  835. * @param [out] domi::OutputData *output_data: Model output data
  836. * @return SUCCESS handle successfully / others handle failed
  837. */
  838. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  839. ge::RunModelData &run_output_data, bool async_mode) {
  840. if (!isInit_) {
  841. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  842. return ACL_ERROR_GE_EXEC_NOT_INIT;
  843. }
  844. InputData input_data;
  845. OutputData output_data;
  846. GetDomiInputData(run_input_data, input_data);
  847. GetDomiOutputData(run_output_data, output_data);
  848. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  849. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  850. std::vector<std::vector<int64_t>> batch_info;
  851. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  852. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  853. if (ret != SUCCESS) {
  854. GELOGE(ret, "Get dynamic input info failed.");
  855. return ret;
  856. }
  857. if (!batch_info.empty()) {
  858. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  859. }
  860. }
  861. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, output_data);
  862. }
  863. /**
  864. * @ingroup ge
  865. * @brief Get weight memory size from model file
  866. * @param [in] const std::string &path: Offline model file path
  867. * @param [out] size_t &mem_size Execution memory size
  868. size_t &weight_size Weight memory space size
  869. * @return SUCCESS handle successfully / others handle failed
  870. */
  871. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  872. GELOGI("Get memory and weight size from file begin.");
  873. if (!isInit_) {
  874. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  875. return ACL_ERROR_GE_EXEC_NOT_INIT;
  876. }
  877. ModelData model;
  878. std::string key;
  879. Status ret = ge::GraphLoader::LoadDataFromFile(path, key, 0, model);
  880. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  881. GELOGE(ret, "Load data from file failed. ret = %d", ret);
  882. return ret;
  883. }
  884. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  885. delete[] static_cast<char *>(model.model_data);
  886. model.model_data = nullptr;
  887. return ret;
  888. }
  889. /**
  890. * @ingroup ge
  891. * @brief Get weight memory size from model file
  892. * @param [in] const void *model_data Offline model buffer
  893. size_t model_size Offline model buffer length
  894. * @param [out] size_t &mem_size Execution memory size
  895. size_t &weight_size Weight memory space size
  896. * @return SUCCESS handle successfully / others handle failed
  897. */
  898. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  899. size_t &weight_size) {
  900. GELOGI("Get memory and weight size from data begin.");
  901. if (!isInit_) {
  902. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  903. return ACL_ERROR_GE_EXEC_NOT_INIT;
  904. }
  905. if (model_data == nullptr) {
  906. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "invalid model data!");
  907. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  908. }
  909. ModelData model;
  910. model.model_data = const_cast<void *>(model_data);
  911. model.model_len = static_cast<uint32_t>(model_size);
  912. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  913. }
  914. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  915. SingleOp **single_op) {
  916. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op);
  917. }
  918. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  919. DynamicSingleOp **single_op) {
  920. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op);
  921. }
  922. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  923. std::vector<DataBuffer> &outputs) {
  924. if (executor == nullptr) {
  925. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "param is NULL");
  926. return ACL_ERROR_GE_EXEC_NOT_INIT;
  927. }
  928. return executor->ExecuteAsync(inputs, outputs);
  929. }
  930. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  931. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  932. vector<DataBuffer> &outputs) {
  933. GE_CHECK_NOTNULL(executor);
  934. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  935. }
  936. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  937. ModelManager::GetInstance()->ClearAicpuSo();
  938. return SingleOpManager::GetInstance().ReleaseResource(stream);
  939. }
  940. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  941. auto model_manager = ModelManager::GetInstance();
  942. GE_CHECK_NOTNULL(model_manager);
  943. auto davinci_model = model_manager->GetModel(model_id);
  944. if (davinci_model == nullptr) {
  945. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID, "Model id: %d is invaild or model is not loaded.", model_id);
  946. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  947. }
  948. device_id = davinci_model->GetDeviceId();
  949. return SUCCESS;
  950. }
  951. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  952. std::vector<std::vector<int64_t>> batch_info;
  953. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  954. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  955. if (ret != SUCCESS) {
  956. GELOGE(ret, "Calc batch info size failed. ret = %d", ret);
  957. return ret;
  958. }
  959. if (batch_info.empty()) {
  960. shape_count = kStaticBatchInfoSize;
  961. } else {
  962. shape_count = batch_info.size();
  963. }
  964. return SUCCESS;
  965. }
  966. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  967. GELOGI("Begin to GetOrigInputInfo.");
  968. if (!isInit_) {
  969. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  970. return ACL_ERROR_GE_EXEC_NOT_INIT;
  971. }
  972. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  973. if (ret != SUCCESS) {
  974. GELOGE(ret, "GetOrigInputInfo failed.");
  975. return ret;
  976. }
  977. GELOGI("GetOrigInputInfo succ.");
  978. return SUCCESS;
  979. }
  980. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  981. std::vector<InputOutputDims> &input_dims,
  982. std::vector<InputOutputDims> &output_dims) {
  983. GELOGI("Begin to GetAllAippInputOutputDims.");
  984. if (!isInit_) {
  985. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  986. return ACL_ERROR_GE_EXEC_NOT_INIT;
  987. }
  988. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  989. if (ret != SUCCESS) {
  990. GELOGE(ret, "GetAllAippInputOutputDims failed.");
  991. return ret;
  992. }
  993. GELOGI("GetAllAippInputOutputDims succ.");
  994. return SUCCESS;
  995. }
  996. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  997. GELOGI("Begin to GetOpDescInfo.");
  998. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  999. if (ret != SUCCESS) {
  1000. GELOGE(ret, "GetOpDescInfo failed.");
  1001. return ret;
  1002. }
  1003. GELOGI("GetOpDescInfo succ.");
  1004. return SUCCESS;
  1005. }
  1006. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  1007. GELOGI("Start to set dump config");
  1008. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  1009. if (ret != SUCCESS) {
  1010. GELOGE(ret, "Set dump conf failed");
  1011. return ret;
  1012. }
  1013. GELOGI("Set dump config successfully");
  1014. return SUCCESS;
  1015. }
  1016. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,用户对此并无感知。