You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

ge_executor.cc 51 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205120612071208
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "framework/executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <ctime>
  19. #include <iostream>
  20. #include "framework/common/debug/log.h"
  21. #include "common/ge/ge_util.h"
  22. #include "framework/common/helper/model_helper.h"
  23. #include "common/profiling/profiling_manager.h"
  24. #include "common/profiling/profiling_properties.h"
  25. #include "common/dump/dump_manager.h"
  26. #include "graph/execute/graph_execute.h"
  27. #include "graph/load/graph_loader.h"
  28. #include "graph/load/model_manager/model_manager.h"
  29. #include "graph/manager/graph_mem_manager.h"
  30. #include "graph/manager/graph_var_manager.h"
  31. #include "single_op/single_op_manager.h"
  32. #include "graph/load/model_manager/davinci_model.h"
  33. #include "opskernel_manager/ops_kernel_builder_manager.h"
  34. #include "graph/opsproto_manager.h"
  35. #include "ge_local_engine/engine/host_cpu_engine.h"
  36. #include "runtime/base.h"
  37. #include "common/profiling/command_handle.h"
  38. using std::string;
  39. using std::vector;
  40. namespace {
  // Number of values in one gear of a dynamic-batch model (the batch size only).
  constexpr size_t kDynamicBatchSizeVecSize = 1;
  // NOTE(review): not referenced in the visible part of this file; presumably used further down.
  constexpr size_t kStaticBatchInfoSize = 1;
  // Number of values in one gear of a dynamic-image-size model (height, width).
  constexpr size_t kDynamicImageSizeVecSize = 2;
  // Number of integers written to the dynamic input buffer for an image size.
  constexpr size_t kDynamicImageSizeInputSize = 2;
  // Prefix of the batch label; the index of the matched gear is appended to it.
  const char *const kBatchLabel = "Batch_";
  46. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  47. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  48. const std::vector<uint32_t> &formats) {
  49. uint32_t idx = 0;
  50. for (auto desc_item : domi_descs) {
  51. ge::TensorDesc ge_desc;
  52. ge_desc.SetName(desc_item.name.c_str());
  53. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  54. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  55. std::vector<int64_t> shape_dims;
  56. for (auto dim : desc_item.shape_info.dims) {
  57. shape_dims.push_back(dim);
  58. }
  59. ge::Shape ge_shape(shape_dims);
  60. ge_desc.SetShape(ge_shape);
  61. ge_desc.SetSize(desc_item.size);
  62. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  63. ge_descs.emplace_back(ge_desc);
  64. ++idx;
  65. }
  66. }
  67. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  68. inputs.index = input_data.index;
  69. inputs.model_id = input_data.modelId;
  70. inputs.timestamp = input_data.timestamp;
  71. inputs.timeout = input_data.timeout;
  72. inputs.request_id = input_data.request_id;
  73. for (const auto &data_item : input_data.blobs) {
  74. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  75. inputs.blobs.emplace_back(dataBuf);
  76. }
  77. }
  78. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  79. outputs.index = output_data.index;
  80. outputs.model_id = output_data.modelId;
  81. for (const auto &data_item : output_data.blobs) {
  82. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  83. outputs.blobs.emplace_back(dataBuf);
  84. }
  85. }
  86. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  87. ge::InputData &inputs) {
  88. inputs.is_dynamic_batch = true;
  89. std::string batch_label;
  90. size_t match_idx = 0;
  91. for (size_t i = 0; i < batch_info.size(); ++i) {
  92. // dynamic_dims
  93. if (input_data.dynamic_dims.size() != 0) {
  94. bool is_match = true;
  95. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  96. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  97. is_match = false;
  98. break;
  99. }
  100. }
  101. if (is_match) {
  102. match_idx = i;
  103. break;
  104. }
  105. // dynamic_batch_size
  106. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  107. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  108. match_idx = i;
  109. break;
  110. // dynamic_image_size
  111. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  112. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  113. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  114. match_idx = i;
  115. break;
  116. }
  117. }
  118. batch_label = kBatchLabel + std::to_string(match_idx);
  119. inputs.batch_label = batch_label;
  120. GELOGI("current batch label:%s", batch_label.c_str());
  121. }
  122. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  123. if (batch_info.empty()) {
  124. REPORT_INNER_ERROR("E19999", "param Dynamic batch info is empty, check invalid.");
  125. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch info is empty.");
  126. return false;
  127. }
  128. for (auto batch : batch_info) {
  129. if (batch.size() != kDynamicBatchSizeVecSize) {
  130. REPORT_INNER_ERROR("E19999", "Dynamic batch param num is %zu, current batch size is %zu.",
  131. kDynamicBatchSizeVecSize, batch.size());
  132. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch param num is %zu, current batch size is %zu.",
  133. kDynamicBatchSizeVecSize, batch.size());
  134. return false;
  135. }
  136. if (batch[0] == static_cast<int64_t>(batch_size)) {
  137. return true;
  138. }
  139. }
  140. REPORT_INNER_ERROR("E19999", "Dynamic batch %lu can not match the gear of model.", batch_size);
  141. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch %lu can not match the gear of model.", batch_size);
  142. return false;
  143. }
  144. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  145. const vector<std::vector<int64_t>> &batch_info) {
  146. if (batch_info.empty()) {
  147. REPORT_INNER_ERROR("E19999", "ParamDynamic batch info is empty. check invalid");
  148. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch info is empty.");
  149. return false;
  150. }
  151. for (auto resolution : batch_info) {
  152. if (resolution.size() != kDynamicImageSizeVecSize) {
  153. REPORT_INNER_ERROR("E19999", "Dynamic resolution param num is %zu, current resolution size is %zu.",
  154. kDynamicImageSizeVecSize, resolution.size());
  155. GELOGE(ge::FAILED, "[Check][Param] Dynamic resolution param num is %zu, current resolution size is %zu.",
  156. kDynamicImageSizeVecSize, resolution.size());
  157. return false;
  158. }
  159. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  160. return true;
  161. }
  162. }
  163. REPORT_INNER_ERROR("E19999", "Dynamic resolution (%lu,%lu) can not match the gear of model.",
  164. image_height, image_width);
  165. GELOGE(ge::FAILED, "[Check][Param]Dynamic resolution (%lu,%lu) can not match the gear of model.",
  166. image_height, image_width);
  167. return false;
  168. }
  169. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims,
  170. const vector<vector<int64_t>> &batch_info) {
  171. if (batch_info.empty()) {
  172. REPORT_INNER_ERROR("E19999", "param batch_info is empty, check invalid");
  173. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "[Check][Param] Dynamic batch info is empty.");
  174. return false;
  175. }
  176. bool find_match = false;
  177. for (auto resolution : batch_info) {
  178. if (cur_dynamic_dims.size() != resolution.size()) {
  179. REPORT_INNER_ERROR("E19999", "Cur dynamic dims param num is %zu, current resolution size is %zu.",
  180. cur_dynamic_dims.size(), resolution.size());
  181. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  182. "[Check][Param] Cur dynamic dims param num is %zu, current resolution size is %zu.",
  183. cur_dynamic_dims.size(), resolution.size());
  184. return false;
  185. }
  186. bool flag = true;
  187. for (std::size_t i = 0; i < resolution.size(); ++i) {
  188. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  189. flag = false;
  190. break;
  191. }
  192. }
  193. if (flag) {
  194. find_match = true;
  195. break;
  196. }
  197. }
  198. if (!find_match) {
  199. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "[Check][Param] choose dynamic dims can not match the gear of model.");
  200. }
  201. return find_match;
  202. }
  203. } // namespace
  204. namespace ge {
  205. bool GeExecutor::isInit_ = false;
  206. static void InitOpsProtoManager() {
  207. string opsproto_path;
  208. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  209. if (path_env != nullptr) {
  210. string path = path_env;
  211. string file_path = RealPath(path.c_str());
  212. if (file_path.empty()) {
  213. GELOGE(FAILED, "[Check][EnvPath]ASCEND_OPP_PATH path [%s] is invalid.", path.c_str());
  214. REPORT_INPUT_ERROR("E68016", {"ASCEND_OPP_PATH", path});
  215. return;
  216. }
  217. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  218. GELOGI("Get opsproto so path from env : %s", path.c_str());
  219. } else {
  220. string path_base = PluginManager::GetPath();
  221. GELOGI("path_base is %s", path_base.c_str());
  222. path_base = path_base.substr(0, path_base.rfind('/'));
  223. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  224. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  225. }
  226. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  227. OpsProtoManager *manager = OpsProtoManager::Instance();
  228. map<string, string> option_tmp;
  229. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  230. (void)manager->Initialize(option_tmp);
  231. }
  232. GeExecutor::GeExecutor() {}
  233. Status GeExecutor::Initialize() {
  234. GELOGI("Init GeExecutor begin.");
  235. if (isInit_) {
  236. GELOGW("Already initialized, no need to be initialized again.");
  237. return ge::SUCCESS;
  238. }
  239. OpTilingManager::GetInstance().LoadSo();
  240. Status init_hostcpu_engine_status = HostCpuEngine::GetInstance().Initialize();
  241. if (init_hostcpu_engine_status != SUCCESS) {
  242. GELOGE(init_hostcpu_engine_status, "[initialize][HostCpuEngine] failed");
  243. return init_hostcpu_engine_status;
  244. }
  245. InitOpsProtoManager();
  246. std::vector<rtMemType_t> mem_type(1, RT_MEMORY_HBM);
  247. mem_type.push_back(RT_MEMORY_P2P_DDR);
  248. auto ret = MemManager::Instance().Initialize(mem_type);
  249. if (ret != SUCCESS) {
  250. GELOGE(ret, "[Initialize][MemManager] failed.");
  251. return ret;
  252. }
  253. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  254. "[Initialize][OpsKernelBuilderManager] failed.");
  255. // Start profiling
  256. Options profiling_options;
  257. profiling_options.device_id = 0;
  258. // job id need to be set, the value is meaningless;
  259. profiling_options.job_id = "1";
  260. isInit_ = true;
  261. GELOGI("Init GeExecutor over.");
  262. return ge::SUCCESS;
  263. }
  264. Status GeExecutor::Finalize() {
  265. GELOGI("Uninit GeExecutor begin.");
  266. if (isInit_ == false) {
  267. GELOGW("GeExecutor has not been initialized.");
  268. return ge::SUCCESS;
  269. }
  270. (void) OpsKernelBuilderManager::Instance().Finalize();
  271. // Stop profiling
  272. if (ProfilingProperties::Instance().ProfilingOn()) {
  273. ProfilingManager::Instance().PluginUnInit();
  274. }
  275. GELOGI("Uninit GeExecutor over.");
  276. return ge::SUCCESS;
  277. }
  278. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  279. uint64_t batch_size) {
  280. if (dynamic_input_addr == nullptr) {
  281. REPORT_INNER_ERROR("E19999", "param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  282. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  283. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  284. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  285. }
  286. uint64_t size = sizeof(uint32_t);
  287. if (length < size) {
  288. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is less than [%lu], check invalid, model id:%u",
  289. length, size, model_id);
  290. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  291. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u", length, size, model_id);
  292. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  293. }
  294. if (length >= sizeof(uint64_t)) {
  295. size = sizeof(uint64_t);
  296. }
  297. // Verify whether the input dynamic batch matches the model gear
  298. std::vector<std::vector<int64_t>> batch_info;
  299. std::vector<uint64_t> batch_num{batch_size};
  300. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  301. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  302. if (ret != SUCCESS) {
  303. REPORT_CALL_ERROR("E19999", "get dynamic batch info failed, model id:%u", model_id);
  304. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  305. return ret;
  306. }
  307. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  308. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  309. "[Check][Param] The current dynamic input does not match the gear of the model(id:%u).", model_id);
  310. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  311. }
  312. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  313. if (ret != SUCCESS) {
  314. REPORT_CALL_ERROR("E19999", "set dynamic size failed, model id:%u, dynamic_type:1", model_id);
  315. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u, dynamic_type:1", model_id);
  316. return ret;
  317. }
  318. // memcpy dynamic_batch_size from host to device
  319. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  320. if (rt_ret != RT_ERROR_NONE) {
  321. REPORT_CALL_ERROR("E19999", "Call rtMemcpy, size:%lu ret:0x%X", length, rt_ret);
  322. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic batch input data failed! size:%lu ret:0x%X", length, rt_ret);
  323. return RT_ERROR_TO_GE_STATUS(rt_ret);
  324. }
  325. return SUCCESS;
  326. }
  327. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  328. uint64_t image_height, uint64_t image_width) {
  329. if (dynamic_input_addr == nullptr) {
  330. REPORT_INNER_ERROR("E19999", "param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  331. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  332. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  333. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  334. }
  335. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  336. if (length < dynamic_input_size) {
  337. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is less than [%lu], check invalid, model id:%u",
  338. length, dynamic_input_size, model_id);
  339. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  340. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u",
  341. length, dynamic_input_size, model_id);
  342. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  343. }
  344. uint64_t size = sizeof(uint32_t);
  345. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  346. size = sizeof(uint64_t);
  347. }
  348. // Verify whether the input dynamic resolution matches the model gear
  349. std::vector<std::vector<int64_t>> batch_info;
  350. std::vector<uint64_t> batch_num{image_height, image_width};
  351. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  352. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  353. if (ret != SUCCESS) {
  354. REPORT_CALL_ERROR("E19999", "Get dynamic input info failed, model id:%u.", model_id);
  355. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  356. return ret;
  357. }
  358. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  359. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  360. "[Check][Param] The current dynamic input does not match the gear of the model, "
  361. "image_height:%lu, image_width:%lu.", image_height, image_width);
  362. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  363. }
  364. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  365. if (ret != SUCCESS) {
  366. REPORT_CALL_ERROR("E19999", "Set dynamic size failed, model id:%u,", model_id);
  367. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u", model_id);
  368. return ret;
  369. }
  370. // Memcpy dynamic resolution height from host to device
  371. rtError_t rt_ret =
  372. rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  373. if (rt_ret != RT_ERROR_NONE) {
  374. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed! size:%lu, ret:0x%X, model id:%u", size, rt_ret, model_id);
  375. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X, model id:%u",
  376. size, rt_ret, model_id);
  377. return RT_ERROR_TO_GE_STATUS(rt_ret);
  378. }
  379. uint64_t remain_size = length - size;
  380. // Memcpy dynamic resolution width from host to device
  381. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size),
  382. remain_size, &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  383. if (rt_ret != RT_ERROR_NONE) {
  384. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed! size:%lu, ret:0x%X, model id:%u",
  385. remain_size, rt_ret, model_id);
  386. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X, model id:%u",
  387. remain_size, rt_ret, model_id);
  388. return RT_ERROR_TO_GE_STATUS(rt_ret);
  389. }
  390. return SUCCESS;
  391. }
  392. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  393. const vector<uint64_t> &dynamic_dims) {
  394. if (dynamic_input_addr == nullptr) {
  395. REPORT_INNER_ERROR("E19999", "Param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  396. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  397. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  398. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  399. }
  400. vector<uint64_t> cur_dynamic_dims;
  401. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  402. if (ret != SUCCESS) {
  403. GELOGE(ret, "[Get][CurDynamicDims] failed, model id:%u", model_id);
  404. return ret;
  405. }
  406. std::vector<std::vector<int64_t>> batch_info;
  407. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  408. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  409. if (ret != SUCCESS) {
  410. REPORT_CALL_ERROR("E19999", "Get dynamic input info failed, model id:%u.", model_id);
  411. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  412. return ret;
  413. }
  414. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  415. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  416. "[Check][Param] The current dynamic input does not match the gear of the model, id:%u.", model_id);
  417. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  418. }
  419. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  420. if (ret != SUCCESS) {
  421. REPORT_CALL_ERROR("E19999", "Set dynamic size failed, model id:%u", model_id);
  422. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u", model_id);
  423. return ret;
  424. }
  425. size_t dynamic_dim_num = cur_dynamic_dims.size();
  426. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  427. if (length < dynamic_input_size) {
  428. REPORT_INNER_ERROR("E19999", "input dynamic size [%lu] is less than [%lu], model id:%u",
  429. length, dynamic_input_size, model_id);
  430. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  431. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u",
  432. length, dynamic_input_size, model_id);
  433. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  434. }
  435. uint64_t size = sizeof(uint32_t);
  436. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  437. size = sizeof(uint64_t);
  438. }
  439. rtError_t rt_ret;
  440. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  441. // Memcpy dynamic dim[i] from host to device
  442. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  443. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  444. if (rt_ret != RT_ERROR_NONE) {
  445. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, size:%lu, ret:0x%X", (length - size * i), rt_ret);
  446. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X",
  447. length - size * i, rt_ret);
  448. return RT_ERROR_TO_GE_STATUS(rt_ret);
  449. }
  450. }
  451. return SUCCESS;
  452. }
  453. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  454. vector<uint64_t> &cur_dynamic_dims) {
  455. cur_dynamic_dims.clear();
  456. vector<ge::TensorDesc> input_desc;
  457. vector<ge::TensorDesc> output_desc;
  458. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  459. if (ret != ge::SUCCESS) {
  460. GELOGE(ret, "[Get][ModelDescInfo] failed, model id:%u.", model_id);
  461. return ret;
  462. }
  463. vector<string> user_designate_shape_order;
  464. vector<int64_t> all_data_dims;
  465. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  466. if (ret != ge::SUCCESS) {
  467. GELOGE(ret, "[Call][GetUserDesignateShapeOrder] failed, model id:%u.", model_id);
  468. return ret;
  469. }
  470. for (auto &data_name : user_designate_shape_order) {
  471. for (auto &desc : input_desc) {
  472. if (desc.GetName() == data_name) {
  473. for (auto dim : desc.GetShape().GetDims()) {
  474. all_data_dims.push_back(dim);
  475. }
  476. break;
  477. }
  478. }
  479. }
  480. if (dynamic_dims.size() != all_data_dims.size()){
  481. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  482. dynamic_dims.size(), all_data_dims.size());
  483. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  484. "[Check][Param] Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  485. dynamic_dims.size(), all_data_dims.size());
  486. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  487. }
  488. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  489. if (all_data_dims[i] < 0) {
  490. cur_dynamic_dims.push_back(dynamic_dims[i]);
  491. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  492. REPORT_INNER_ERROR("E19999", "Static dims should be same, index:%zu value:%lu should be %ld",
  493. i, dynamic_dims[i], all_data_dims[i]);
  494. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  495. "[Check][Param] Static dims should be same, index:%zu value:%lu should be %ld",
  496. i, dynamic_dims[i], all_data_dims[i]);
  497. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  498. }
  499. }
  500. return SUCCESS;
  501. }
  502. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  503. GELOGI("Begin to get current shape");
  504. if (!isInit_) {
  505. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized, model id:%u", model_id);
  506. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized, model id:%u", model_id);
  507. return ACL_ERROR_GE_EXEC_NOT_INIT;
  508. }
  509. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  510. if (ret != SUCCESS) {
  511. REPORT_CALL_ERROR("E19999", "Get Cur Shape failed, model id:%u", model_id);
  512. GELOGE(ret, "[Get][CurShape] failed, model id:%u", model_id);
  513. return ret;
  514. }
  515. return SUCCESS;
  516. }
  517. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  518. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  519. const kAippDynamicPara &aippParms) {
  520. GELOGI("Enter to SetDynamicAippData.");
  521. if (dynamic_input_addr == nullptr) {
  522. REPORT_INNER_ERROR("E19999", "Param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  523. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  524. "[Check][Param] Dynamic aipp input addr is nullptr, model id:%u", model_id);
  525. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  526. }
  527. if (aippBatchPara.empty()) {
  528. REPORT_INNER_ERROR("E19999", "Param aippBatchPara is empty, check invalid, model id:%u", model_id);
  529. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "[Check][Param] aippBatchPara is empty, model id:%u", model_id);
  530. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  531. }
  532. uint64_t batch_num = aippBatchPara.size();
  533. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  534. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  535. GELOGI(
  536. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  537. "batch num is %lu, struct_len is %lu",
  538. model_id, length, batch_num, struct_len);
  539. if (struct_len > length) {
  540. REPORT_INNER_ERROR("E19999", "input dynamic aipp param len:%lu is larger than aipp_data size:%lu",
  541. struct_len, length);
  542. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  543. "[Check][Param] input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]",
  544. struct_len, length);
  545. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  546. }
  547. // Memcpy real kAippDynamicBatchPara from host to device
  548. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  549. if (rt_ret != RT_ERROR_NONE) {
  550. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, size:%lu, ret:0x%X", length, rt_ret);
  551. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy aippParms failed! size:%lu, ret:0x%X", length, rt_ret);
  552. return RT_ERROR_TO_GE_STATUS(rt_ret);
  553. }
  554. uint64_t remain_len = length - real_aippParms_size;
  555. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  556. for (uint64_t i = 0; i < batch_num; ++i) {
  557. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  558. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  559. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  560. if (rt_ret != RT_ERROR_NONE) {
  561. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, ret:0x%X", rt_ret);
  562. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy kAippDynamicBatchPara input data failed! ret:0x%X", rt_ret);
  563. return RT_ERROR_TO_GE_STATUS(rt_ret);
  564. }
  565. }
  566. return SUCCESS;
  567. }
  568. Status GeExecutor::UnloadModel(uint32_t model_id) {
  569. GELOGD("unload model %u begin.", model_id);
  570. if (!isInit_) {
  571. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized");
  572. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  573. return ACL_ERROR_GE_EXEC_NOT_INIT;
  574. }
  575. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  576. if (ret != SUCCESS) {
  577. REPORT_CALL_ERROR("E19999", "Destroy Aicpu Session For Infer failed, model id:%u", model_id);
  578. GELOGE(ret, "[Destroy][AicpuSession] For Infer failed. model id:%u", model_id);
  579. return ret;
  580. }
  581. std::shared_ptr<hybrid::HybridDavinciModel> hybrid_davinci_model =
  582. ModelManager::GetInstance()->GetHybridModel(model_id);
  583. if (hybrid_davinci_model != nullptr) {
  584. uint64_t session_id = hybrid_davinci_model->GetSessionId();
  585. VarManagerPool::Instance().RemoveVarManager(session_id);
  586. } else {
  587. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  588. if (davinci_model != nullptr) {
  589. uint64_t session_id = davinci_model->GetSessionId();
  590. VarManagerPool::Instance().RemoveVarManager(session_id);
  591. }
  592. }
  593. ret = GraphLoader::UnloadModel(model_id);
  594. if (ret != SUCCESS) {
  595. REPORT_CALL_ERROR("E19999", "unload model failed, model id:%u", model_id);
  596. GELOGE(ret, "[Unload][Model] failed. model id:%u", model_id);
  597. return ret;
  598. }
  599. return SUCCESS;
  600. }
  601. // Get input and output descriptor
  602. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  603. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  604. if (!isInit_) {
  605. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized, model id:%u", model_id);
  606. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized, model id:%u", model_id);
  607. return ACL_ERROR_GE_EXEC_NOT_INIT;
  608. }
  609. std::vector<InputOutputDescInfo> input_desc_infos;
  610. std::vector<InputOutputDescInfo> output_desc_infos;
  611. std::vector<uint32_t> input_formats;
  612. std::vector<uint32_t> output_formats;
  613. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  614. output_formats, new_model_desc);
  615. if (ret != domi::SUCCESS) {
  616. REPORT_CALL_ERROR("E19999", "get input output desc info failed, ret = %u, model id:%u", ret, model_id);
  617. GELOGE(ret, "[Get][InputOutputDescInfo] failed. ret = %u, model id:%u", ret, model_id);
  618. return ACL_ERROR_GE_GET_TENSOR_INFO;
  619. }
  620. if (input_formats.size() != input_desc_infos.size()) {
  621. REPORT_INNER_ERROR("E19999", "input_formats size %zu is not equal to input_desc_infos size %zu, model id:%u.",
  622. input_formats.size(), input_desc_infos.size(), model_id);
  623. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  624. "[Check][Param] input_formats size %zu is not equal to input_desc_infos size %zu, model id:%u.",
  625. input_formats.size(), input_desc_infos.size(), model_id);
  626. return ACL_ERROR_GE_PARAM_INVALID;
  627. }
  628. if (output_formats.size() != output_desc_infos.size()) {
  629. REPORT_INNER_ERROR("E19999", "output_formats size %zu is not equal to output_desc_infos size %zu, model id:%u.",
  630. output_formats.size(), output_desc_infos.size(), model_id);
  631. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  632. "[Check][Param] output_formats size %zu is not equal to output_desc_infos size %zu, model id:%u.",
  633. output_formats.size(), output_desc_infos.size(), model_id);
  634. return ACL_ERROR_GE_PARAM_INVALID;
  635. }
  636. // Transfer data to TensorDesc
  637. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  638. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  639. return ge::SUCCESS;
  640. }
  641. ///
  642. /// @ingroup ge
  643. /// @brief Get dynamic batch_info
  644. /// @param [in] model_id
  645. /// @param [out] batch_info
  646. /// @param [out] dynamic_type
  647. /// @return execute result
  648. ///
  649. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  650. int32_t &dynamic_type) {
  651. if (!isInit_) {
  652. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  653. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  654. return ACL_ERROR_GE_EXEC_NOT_INIT;
  655. }
  656. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  657. if (ret != SUCCESS) {
  658. REPORT_CALL_ERROR("E19999", "Get Dynamic BatchInfo failed, model id:%u.", model_id);
  659. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  660. return ret;
  661. }
  662. return SUCCESS;
  663. }
  664. ///
  665. /// @ingroup ge
  666. /// @brief Get combined dynamic dims info
  667. /// @param [in] model_id
  668. /// @param [out] batch_info
  669. /// @return execute result
  670. ///
  671. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  672. GELOGI("Begin to get combined dynamic dims info.");
  673. if (!isInit_) {
  674. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  675. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  676. return ACL_ERROR_GE_EXEC_NOT_INIT;
  677. }
  678. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  679. if (ret != SUCCESS) {
  680. REPORT_CALL_ERROR("E19999", "Get Combined DynamicDims failed, model id:%u.", model_id);
  681. GELOGE(ret, "[Get][CombinedDynamicDims] failed, model id:%u.", model_id);
  682. return ret;
  683. }
  684. GELOGI("Get combined dynamic dims succ.");
  685. return SUCCESS;
  686. }
  687. ///
  688. /// @ingroup ge
  689. /// @brief Get user designeate shape order
  690. /// @param [in] model_id
  691. /// @param [out] user_designate_shape_order
  692. /// @return execute result
  693. ///
  694. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  695. if (!isInit_) {
  696. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  697. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  698. return ACL_ERROR_GE_EXEC_NOT_INIT;
  699. }
  700. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  701. if (ret != SUCCESS) {
  702. REPORT_CALL_ERROR("E19999", "GetUserDesignateShapeOrder failed, model id:%u.", model_id);
  703. GELOGE(ret, "[Call][GetUserDesignateShapeOrder] failed, model id:%u.", model_id);
  704. return ret;
  705. }
  706. return SUCCESS;
  707. }
  708. ///
  709. /// @ingroup ge
  710. /// @brief Get AIPP input format
  711. /// @param [in] model_id
  712. /// @param [in] index
  713. /// @param [out] input_format
  714. /// @return execute result
  715. ///
  716. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  717. GELOGI("Begin to GetAIPPInfo.");
  718. if (!isInit_) {
  719. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  720. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor not inited yet!");
  721. return ACL_ERROR_GE_EXEC_NOT_INIT;
  722. }
  723. Status ret = GraphExecutor::GetAippInfo(model_id, index, aipp_info);
  724. if (ret != SUCCESS) {
  725. GELOGW("GetAIPPInfo is not success.");
  726. return ret;
  727. }
  728. GELOGI("GetAIPPInfo succ.");
  729. return SUCCESS;
  730. }
  731. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  732. GELOGI("Begin to get aipp type.");
  733. if (!isInit_) {
  734. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  735. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not inited yet!");
  736. return ACL_ERROR_GE_EXEC_NOT_INIT;
  737. }
  738. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  739. if (ret != SUCCESS) {
  740. GELOGW("Get aipp type is not success.");
  741. return ret;
  742. }
  743. GELOGI("Get aipp type success.");
  744. return SUCCESS;
  745. }
  746. Status GeExecutor::GetOpAttr(uint32_t model_id, const std::string &op_name, const std::string &attr_name,
  747. std::string &attr_value) {
  748. GELOGI("Begin to get op attr.");
  749. if (!isInit_) {
  750. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Init][GeExecutor]Ge executor not inited yet!");
  751. REPORT_INNER_ERROR("E19999", "Ge executor not inited yet!");
  752. return ACL_ERROR_GE_EXEC_NOT_INIT;
  753. }
  754. Status ret = GraphExecutor::GetOpAttr(model_id, op_name, attr_name, attr_value);
  755. if (ret != SUCCESS) {
  756. GELOGE(ret, "[Get][OpAttr]Get op:%s attr:%s failed, model id:%u.",
  757. op_name.c_str(), attr_name.c_str(), model_id);
  758. REPORT_CALL_ERROR("E19999", "Get op:%s attr:%s failed, model id:%u",
  759. op_name.c_str(), attr_name.c_str(), model_id);
  760. return ret;
  761. }
  762. return SUCCESS;
  763. }
  764. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  765. if (!isInit_) {
  766. REPORT_INNER_ERROR("E19999", "GeExecutor has not inited yet!");
  767. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not inited yet!");
  768. return ACL_ERROR_GE_EXEC_NOT_INIT;
  769. }
  770. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  771. if (ret != SUCCESS) {
  772. REPORT_CALL_ERROR("E19999", "Get Model Attr failed, model id:%u.", model_id);
  773. GELOGE(ret, "[Get][ModelAttr] failed, model id:%u.", model_id);
  774. return ret;
  775. }
  776. return SUCCESS;
  777. }
  778. Status GeExecutor::CommandHandle(const Command &command) {
  779. Status ret = GraphLoader::CommandHandle(command);
  780. if (ret != SUCCESS) {
  781. REPORT_CALL_ERROR("E19999", "call CommandHandle failed, ret:%u", ret);
  782. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "[Call][CommandHandle] failed, ret:%u", ret);
  783. return ACL_ERROR_GE_COMMAND_HANDLE;
  784. }
  785. return SUCCESS;
  786. }
  787. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  788. GELOGI("Get max used memory begin.");
  789. if (!isInit_) {
  790. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  791. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  792. return ACL_ERROR_GE_EXEC_NOT_INIT;
  793. }
  794. uint64_t max_mem_size = 0;
  795. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  796. max_size = static_cast<uint32_t>(max_mem_size);
  797. return ret;
  798. }
  799. /**
  800. * @ingroup ge
  801. * @brief Load data from model file to memory
  802. * @param [in] const std::string &path: Offline model file path
  803. * @param [out] domi::ModelData &model_data: Offline model memory data
  804. * @return SUCCESS handle successfully / others handle failed
  805. */
  806. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  807. GELOGI("Load data from file begin.");
  808. if (!isInit_) {
  809. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  810. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  811. return ACL_ERROR_GE_EXEC_NOT_INIT;
  812. }
  813. string filePath = RealPath(path.c_str());
  814. if (filePath.empty()) {
  815. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  816. "[Call][RealPath] File path is invalid. please check your text file '%s'.", path.c_str());
  817. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  818. }
  819. GELOGI("load modelData from file: %s.", path.c_str());
  820. int32_t priority = 0;
  821. Status ret = GraphLoader::LoadDataFromFile(path, priority, model_data);
  822. if (ret != SUCCESS) {
  823. if (model_data.model_data != nullptr) {
  824. delete[] static_cast<char *>(model_data.model_data);
  825. model_data.model_data = nullptr;
  826. }
  827. }
  828. return ret;
  829. }
  830. /**
  831. * @ingroup ge
  832. * @brief Load model from offline model memory data
  833. * @param [in] domi::ModelData &model_data: Offline model data
  834. void *dev_ptr: Input/Output memory start address
  835. size_t memsize: Input/Output memory length
  836. void *weight_ptr: Weight memory start address
  837. size_t weightsize: Weight memory length
  838. * @param [out] uint32_t &model_id: identification after model loading
  839. * @return SUCCESS handle successfully / others handle failed
  840. */
  841. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  842. void *weight_ptr, size_t weight_size) {
  843. if (!isInit_) {
  844. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  845. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not inited yet!");
  846. return ACL_ERROR_GE_EXEC_NOT_INIT;
  847. }
  848. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  849. }
  850. /**
  851. * @ingroup ge
  852. * @brief Load task list from ModelData with queue.
  853. * @param [out] model_id: model id allocate from manager.
  854. * @param [in] ge_model_data: Model data load from offline model.
  855. * @param [in] input_queue_ids: input queue ids create from user.
  856. * @param [in] output_queue_ids: input queue ids create from user.
  857. * @return: 0 for success / others for fail
  858. */
  859. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  860. const std::vector<uint32_t> &input_queue_ids,
  861. const std::vector<uint32_t> &output_queue_ids) {
  862. GELOGI("Load model with queue begin.");
  863. if (!isInit_) {
  864. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  865. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  866. return ACL_ERROR_GE_EXEC_NOT_INIT;
  867. }
  868. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  869. }
  870. /**
  871. * @ingroup ge
  872. * @brief Synchronous execution of offline model(Do not create thread)
  873. * @param [in] uint32_t model_id: Model ID to execute
  874. void* stream: stream to execute
  875. const domi::InputData *input_data: Model input data
  876. bool async_mode: is asynchronize mode.
  877. * @param [out] domi::OutputData *output_data: Model output data
  878. * @return SUCCESS handle successfully / others handle failed
  879. */
  880. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  881. ge::RunModelData &run_output_data, bool async_mode) {
  882. std::vector<GeTensorDesc> input_desc = {};
  883. std::vector<GeTensorDesc> output_desc = {};
  884. return ExecModel(model_id, stream, run_input_data, input_desc, run_output_data, output_desc, async_mode);
  885. }
  886. /**
  887. * @ingroup ge
  888. * @brief Synchronous execution of offline model(Do not create thread)
  889. * @param [in] uint32_t model_id: Model ID to execute
  890. void* stream: stream to execute
  891. const domi::InputData *input_data: Model input data
  892. const std::vector<GeTensorDesc> &input_desc: Description of model input data
  893. bool async_mode: is asynchronize mode
  894. * @param [out] domi::OutputData *output_data: Model output data
  895. * @param [out] std::vector<GeTensorDesc> &output_desc: Description of model output data
  896. * @return SUCCESS handle successfully / others handle failed
  897. */
  898. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  899. const std::vector<GeTensorDesc> &input_desc, ge::RunModelData &run_output_data,
  900. std::vector<GeTensorDesc> &output_desc, bool async_mode) {
  901. if (!isInit_) {
  902. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  903. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  904. return ACL_ERROR_GE_EXEC_NOT_INIT;
  905. }
  906. InputData input_data;
  907. OutputData output_data;
  908. GetDomiInputData(run_input_data, input_data);
  909. GetDomiOutputData(run_output_data, output_data);
  910. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  911. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  912. std::vector<std::vector<int64_t>> batch_info;
  913. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  914. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  915. if (ret != SUCCESS) {
  916. REPORT_CALL_ERROR("E19999", "get dynamic batch info failed, model id:%u.", model_id);
  917. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  918. return ret;
  919. }
  920. if (!batch_info.empty()) {
  921. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  922. }
  923. }
  924. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, input_desc, output_data, output_desc);
  925. }
  926. /**
  927. * @ingroup ge
  928. * @brief Get weight memory size from model file
  929. * @param [in] const std::string &path: Offline model file path
  930. * @param [out] size_t &mem_size Execution memory size
  931. size_t &weight_size Weight memory space size
  932. * @return SUCCESS handle successfully / others handle failed
  933. */
  934. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  935. GELOGI("Get memory and weight size from file begin.");
  936. if (!isInit_) {
  937. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  938. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  939. return ACL_ERROR_GE_EXEC_NOT_INIT;
  940. }
  941. ModelData model;
  942. Status ret = ge::GraphLoader::LoadDataFromFile(path, 0, model);
  943. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  944. REPORT_CALL_ERROR("E19999", "load data from file failed, ret = %d", ret);
  945. GELOGE(ret, "[Load][Data] from file failed. ret = %d", ret);
  946. return ret;
  947. }
  948. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  949. delete[] static_cast<char *>(model.model_data);
  950. model.model_data = nullptr;
  951. return ret;
  952. }
  953. /**
  954. * @ingroup ge
  955. * @brief Get weight memory size from model file
  956. * @param [in] const void *model_data Offline model buffer
  957. size_t model_size Offline model buffer length
  958. * @param [out] size_t &mem_size Execution memory size
  959. size_t &weight_size Weight memory space size
  960. * @return SUCCESS handle successfully / others handle failed
  961. */
  962. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  963. size_t &weight_size) {
  964. GELOGI("Get memory and weight size from data begin.");
  965. if (!isInit_) {
  966. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  967. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  968. return ACL_ERROR_GE_EXEC_NOT_INIT;
  969. }
  970. if (model_data == nullptr) {
  971. REPORT_INNER_ERROR("E19999", "param model_data is nullptr, check invalid!");
  972. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "[Check][Param] invalid model data!");
  973. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  974. }
  975. ModelData model;
  976. model.model_data = const_cast<void *>(model_data);
  977. model.model_len = static_cast<uint32_t>(model_size);
  978. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  979. }
  980. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  981. SingleOp **single_op) {
  982. return LoadSingleOpV2(model_name, modelData, stream, single_op, 0);
  983. }
  984. Status GeExecutor::LoadSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  985. SingleOp **single_op, const uint64_t model_id) {
  986. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op, model_id);
  987. }
  988. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  989. DynamicSingleOp **single_op) {
  990. return LoadDynamicSingleOpV2(model_name, modelData, stream, single_op, 0);
  991. }
  992. Status GeExecutor::LoadDynamicSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  993. DynamicSingleOp **single_op, const uint64_t model_id) {
  994. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op, model_id);
  995. }
  996. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  997. std::vector<DataBuffer> &outputs) {
  998. if (executor == nullptr) {
  999. REPORT_INNER_ERROR("E19999", "Param executor is nullptr, check invalid");
  1000. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] param executor is nullptr");
  1001. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1002. }
  1003. return executor->ExecuteAsync(inputs, outputs);
  1004. }
  1005. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  1006. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  1007. vector<DataBuffer> &outputs) {
  1008. GE_CHECK_NOTNULL(executor);
  1009. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  1010. }
  1011. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  1012. ModelManager::GetInstance()->ClearAicpuSo();
  1013. return SingleOpManager::GetInstance().ReleaseResource(stream);
  1014. }
  1015. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  1016. auto model_manager = ModelManager::GetInstance();
  1017. GE_CHECK_NOTNULL(model_manager);
  1018. auto davinci_model = model_manager->GetModel(model_id);
  1019. if (davinci_model == nullptr) {
  1020. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID,
  1021. "[Get][Model] failed, Model id:%u is invaild or model is not loaded.", model_id);
  1022. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  1023. }
  1024. device_id = davinci_model->GetDeviceId();
  1025. return SUCCESS;
  1026. }
  1027. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  1028. std::vector<std::vector<int64_t>> batch_info;
  1029. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  1030. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  1031. if (ret != SUCCESS) {
  1032. GELOGE(ret, "[Get][DynamicBatchInfo] failed. ret = %d, model id:%u", ret, model_id);
  1033. return ret;
  1034. }
  1035. if (batch_info.empty()) {
  1036. shape_count = kStaticBatchInfoSize;
  1037. } else {
  1038. shape_count = batch_info.size();
  1039. }
  1040. return SUCCESS;
  1041. }
  1042. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  1043. GELOGI("Begin to GetOrigInputInfo.");
  1044. if (!isInit_) {
  1045. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  1046. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  1047. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1048. }
  1049. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  1050. if (ret != SUCCESS) {
  1051. REPORT_CALL_ERROR("E19999", "Get Orig Input Info failed, model id:%u.", model_id);
  1052. GELOGE(ret, "[Get][OrigInputInfo] failed, model id:%u.", model_id);
  1053. return ret;
  1054. }
  1055. GELOGI("GetOrigInputInfo succ.");
  1056. return SUCCESS;
  1057. }
  1058. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  1059. std::vector<InputOutputDims> &input_dims,
  1060. std::vector<InputOutputDims> &output_dims) {
  1061. GELOGI("Begin to GetAllAippInputOutputDims.");
  1062. if (!isInit_) {
  1063. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  1064. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  1065. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1066. }
  1067. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  1068. if (ret != SUCCESS) {
  1069. REPORT_CALL_ERROR("E19999", "Get All Aipp Input Output Dims failed, model id:%u.", model_id);
  1070. GELOGE(ret, "[Get][AllAippInputOutputDims] failed, model id:%u.", model_id);
  1071. return ret;
  1072. }
  1073. GELOGI("GetAllAippInputOutputDims succ.");
  1074. return SUCCESS;
  1075. }
  1076. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  1077. GELOGI("Begin to GetOpDescInfo.");
  1078. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  1079. if (ret != SUCCESS) {
  1080. REPORT_CALL_ERROR("E19999", "get opdesc info failed, device_id:%u, stream_id:%u, task_id:%u.",
  1081. device_id, stream_id, task_id);
  1082. GELOGE(ret, "[Get][OpDescInfo] failed, device_id:%u, stream_id:%u, task_id:%u.",
  1083. device_id, stream_id, task_id);
  1084. return ret;
  1085. }
  1086. GELOGI("GetOpDescInfo succ.");
  1087. return SUCCESS;
  1088. }
  1089. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  1090. GELOGI("Start to set dump config");
  1091. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  1092. if (ret != SUCCESS) {
  1093. GELOGE(ret, "[Set][DumpConf] failed, ret:%d", ret);
  1094. return ret;
  1095. }
  1096. GELOGI("Set dump config successfully");
  1097. return SUCCESS;
  1098. }
  1099. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示: