You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

kernel_task_info_unittest.cc 40 kB

4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107110811091110111111121113111411151116111711181119112011211122112311241125112611271128112911301131113211331134113511361137113811391140114111421143114411451146114711481149115011511152115311541155115611571158115911601161116211631164116511661167116811691170117111721173117411751176117711781179118011811182118311841185118611871188118911901191119211931194119511961197119811991200120112021203120412051206120712081209121012111212121312141215121612171218121912201221122212231224122512261227
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <gtest/gtest.h>
  17. #define private public
  18. #define protected public
  19. #include "graph/load/model_manager/davinci_model.h"
  20. #include "graph/load/model_manager/task_info/kernel_task_info.h"
  21. #include "graph/load/model_manager/task_info/hccl_task_info.h"
  22. namespace ge {
  23. extern OpDescPtr CreateOpDesc(string name, string type);
  24. class UtestKernelTaskInfo : public testing::Test {
  25. protected:
  26. void SetUp() {}
  27. void TearDown() {}
  28. };
  29. // test KernelTaskInfo Init.
  30. TEST_F(UtestKernelTaskInfo, success_kernel_taskInfo_not_te) {
  31. DavinciModel model(0, nullptr);
  32. domi::ModelTaskDef model_task_def;
  33. domi::TaskDef *task = model_task_def.add_task();
  34. task->set_type(RT_MODEL_TASK_KERNEL);
  35. TaskInfoPtr task_info = TaskInfoFactory::Instance().Create(static_cast<rtModelTaskType_t>(task->type()));
  36. task->stream_id_ = 0;
  37. rtStream_t stream = nullptr;
  38. rtStreamCreate(&stream, 0);
  39. model.stream_list_ = { stream };
  40. domi::KernelDef *kernel_def = task->mutable_kernel();
  41. domi::KernelContext *ctx = kernel_def->mutable_context();
  42. model.op_list_[0] = CreateOpDesc("relu", RELU);
  43. ctx->set_op_index(0);
  44. EXPECT_EQ(task_info->Init(*task, &model), FAILED);
  45. kernel_def->set_block_dim(10);
  46. kernel_def->set_args("args111111", 10);
  47. kernel_def->set_args_size(10);
  48. ctx->set_kernel_type(0);
  49. EXPECT_EQ(task_info->Init(*task, &model), INTERNAL_ERROR);
  50. task_info->Release();
  51. }
  52. TEST_F(UtestKernelTaskInfo, success_init_kernel_task_info_fail) {
  53. DavinciModel model(0, nullptr);
  54. KernelTaskInfo kernel_task_info;
  55. domi::TaskDef task_def;
  56. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  57. domi::KernelContext *ctx = kernel_def->mutable_context();
  58. model.op_list_[0] = CreateOpDesc("relu", RELU);
  59. ctx->set_op_index(0);
  60. rtStream_t stream = nullptr;
  61. rtStreamCreate(&stream, 0);
  62. model.stream_list_ = { stream };
  63. // Failed by rtGetFunctionByName.
  64. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  65. }
  66. // test InitTVMTask failed
  67. TEST_F(UtestKernelTaskInfo, init_tvm_task_fail) {
  68. DavinciModel model(0, nullptr);
  69. domi::TaskDef task_def;
  70. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  71. KernelTaskInfo kernel_task_info;
  72. kernel_task_info.davinci_model_ = &model;
  73. EXPECT_EQ(kernel_task_info.InitTVMTask(0, *kernel_def), PARAM_INVALID);
  74. task_def.clear_kernel();
  75. }
  76. // test InitTVMTask with kernel_type is TE
  77. TEST_F(UtestKernelTaskInfo, init_tvm_task_info_with_te_kernel_type) {
  78. DavinciModel model(0, nullptr);
  79. domi::TaskDef task_def;
  80. // DavinciModel is nullptr
  81. KernelTaskInfo kernel_task_info;
  82. EXPECT_EQ(kernel_task_info.Init(task_def, nullptr), PARAM_INVALID);
  83. rtStream_t stream = nullptr;
  84. rtStreamCreate(&stream, 0);
  85. model.stream_list_ = { stream };
  86. model.op_list_[0] = CreateOpDesc("", "");
  87. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  88. rtSmDesc_t l2CtrlInfo;
  89. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  90. kernel_def->set_args("args111111", 10);
  91. kernel_def->set_args_size(10);
  92. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  93. kernel_def->set_flowtable("fl", 2);
  94. kernel_def->set_block_dim(10);
  95. domi::KernelContext *ctx = kernel_def->mutable_context();
  96. ctx->set_kernel_type(2);
  97. ctx->set_op_index(4);
  98. ctx->set_args_offset("\0\0"); // args_offset = 0
  99. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  100. ctx->clear_args_offset();
  101. ctx->set_args_offset("args111111", 10);
  102. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  103. ctx->clear_op_index();
  104. ctx->set_op_index(0);
  105. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  106. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  107. kernel_def->clear_context();
  108. task_def.clear_kernel();
  109. }
  110. // test InitAICPUCustomTask with kernel_type is CUSTOMIZED
  111. TEST_F(UtestKernelTaskInfo, init_kernel_task_info_with_customized_kernel_type) {
  112. DavinciModel model(0, nullptr);
  113. rtStream_t stream = nullptr;
  114. rtStreamCreate(&stream, 0);
  115. model.stream_list_ = { stream };
  116. model.op_list_[0] = CreateOpDesc("", "");
  117. domi::TaskDef task_def;
  118. KernelTaskInfo kernel_task_info;
  119. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  120. rtSmDesc_t l2CtrlInfo;
  121. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  122. kernel_def->set_args("args111111", 10);
  123. kernel_def->set_args_size(10);
  124. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  125. kernel_def->set_flowtable("fl", 2);
  126. kernel_def->set_block_dim(10);
  127. domi::KernelContext *ctx = kernel_def->mutable_context();
  128. ctx->set_kernel_type(3);
  129. ctx->set_op_index(4);
  130. ctx->set_args_offset("\0\0"); // args_offset = 0
  131. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  132. ctx->clear_args_offset();
  133. ctx->set_args_offset("args111111", 10);
  134. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  135. ctx->clear_args_offset();
  136. ctx->set_op_index(0);
  137. const char task[] = "opattr";
  138. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  139. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  140. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  141. kernel_def->clear_context();
  142. task_def.clear_kernel();
  143. }
  144. // test InitAICPUCustomTask failed
  145. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed) {
  146. DavinciModel model(0, nullptr);
  147. rtStream_t stream = nullptr;
  148. rtStreamCreate(&stream, 0);
  149. model.stream_list_ = { stream };
  150. model.op_list_[0] = CreateOpDesc("", "");
  151. domi::TaskDef task_def;
  152. KernelTaskInfo kernel_task_info;
  153. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  154. domi::KernelContext *context = kernel_def->mutable_context();
  155. context->set_args_offset("\0\0");
  156. kernel_task_info.davinci_model_ = &model;
  157. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), PARAM_INVALID);
  158. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  159. context->clear_args_offset();
  160. context->set_args_offset("args111111", 10);
  161. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  162. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  163. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  164. kernel_def->clear_context();
  165. task_def.clear_kernel();
  166. }
  167. // test InitAICPUCustomTask failed
  168. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed2) {
  169. DavinciModel model(0, nullptr);
  170. rtStream_t stream = nullptr;
  171. rtStreamCreate(&stream, 0);
  172. model.stream_list_ = { stream };
  173. model.op_list_[0] = CreateOpDesc("", "");
  174. domi::TaskDef task_def;
  175. KernelTaskInfo kernel_task_info;
  176. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  177. domi::KernelContext *context = kernel_def->mutable_context();
  178. kernel_task_info.davinci_model_ = &model;
  179. context->set_args_offset("\0\0");
  180. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  181. // AttrUtils::GetBytes -> true
  182. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), PARAM_INVALID);
  183. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  184. kernel_def->clear_context();
  185. task_def.clear_kernel();
  186. }
  187. // test InitAICPUCustomTask failed
  188. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed3) {
  189. DavinciModel model(0, nullptr);
  190. rtStream_t stream = nullptr;
  191. rtStreamCreate(&stream, 0);
  192. model.stream_list_ = { stream };
  193. model.op_list_[0] = CreateOpDesc("", "");
  194. domi::TaskDef task_def;
  195. KernelTaskInfo kernel_task_info;
  196. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  197. domi::KernelContext *context = kernel_def->mutable_context();
  198. kernel_task_info.davinci_model_ = &model;
  199. context->set_args_offset("\0\0");
  200. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  201. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), PARAM_INVALID);
  202. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  203. kernel_def->clear_context();
  204. task_def.clear_kernel();
  205. }
  206. // test InitAICPUCustomTask failed
  207. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed4) {
  208. DavinciModel model(0, nullptr);
  209. rtStream_t stream = nullptr;
  210. rtStreamCreate(&stream, 0);
  211. model.stream_list_ = { stream };
  212. model.op_list_[0] = CreateOpDesc("", "");
  213. const char task[] = "opattr";
  214. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  215. domi::TaskDef task_def;
  216. KernelTaskInfo kernel_task_info;
  217. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  218. domi::KernelContext *context = kernel_def->mutable_context();
  219. kernel_task_info.davinci_model_ = &model;
  220. context->set_args_offset("args111111", 10);
  221. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  222. // rtMalloc RT_ERROR_NONE
  223. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  224. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  225. kernel_def->clear_context();
  226. task_def.clear_kernel();
  227. }
  228. // test InitAICPUCustomTask failed
  229. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed5) {
  230. DavinciModel model(0, nullptr);
  231. rtStream_t stream = nullptr;
  232. rtStreamCreate(&stream, 0);
  233. model.stream_list_ = { stream };
  234. model.op_list_[0] = CreateOpDesc("", "");
  235. const char task[] = "opattr";
  236. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  237. domi::TaskDef task_def;
  238. KernelTaskInfo kernel_task_info;
  239. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  240. domi::KernelContext *context = kernel_def->mutable_context();
  241. kernel_task_info.davinci_model_ = &model;
  242. context->set_args_offset("args111111", 10);
  243. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  244. // rtMalloc RT_ERROR_NONE
  245. // rtMemcpy RT_ERROR_INVALID_VALIUE
  246. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  247. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  248. kernel_def->clear_context();
  249. task_def.clear_kernel();
  250. }
  251. // test InitAICPUCustomTask failed
  252. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed6) {
  253. DavinciModel model(0, nullptr);
  254. rtStream_t stream = nullptr;
  255. rtStreamCreate(&stream, 0);
  256. model.stream_list_ = { stream };
  257. model.op_list_[0] = CreateOpDesc("", "");
  258. const char task[] = "opattr";
  259. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  260. domi::TaskDef task_def;
  261. KernelTaskInfo kernel_task_info;
  262. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  263. domi::KernelContext *context = kernel_def->mutable_context();
  264. kernel_task_info.davinci_model_ = &model;
  265. context->set_args_offset("args111111", 10);
  266. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  267. // rtMalloc RT_ERROR_NONE
  268. // rtMemcpy RT_ERROR_NONE
  269. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  270. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  271. kernel_def->clear_context();
  272. task_def.clear_kernel();
  273. }
  274. TEST_F(UtestKernelTaskInfo, init_kernel_taskInfo_with_aicpu_kernel_type) {
  275. DavinciModel model(0, nullptr);
  276. rtStream_t stream = nullptr;
  277. rtStreamCreate(&stream, 0);
  278. model.stream_list_ = { stream };
  279. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  280. domi::TaskDef task_def;
  281. KernelTaskInfo kernel_task_info;
  282. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  283. task_def.set_type(RT_MODEL_TASK_KERNEL);
  284. string args;
  285. args.append(100, '1');
  286. kernel_def->set_so_name("libDvpp.so");
  287. kernel_def->set_kernel_name("DvppResize");
  288. kernel_def->set_args(args.data(), 100);
  289. kernel_def->set_args_size(100);
  290. domi::KernelContext *ctx = kernel_def->mutable_context();
  291. ctx->set_kernel_type(6);
  292. ctx->set_op_index(0);
  293. // ModelUtils::GetInputDataAddrs -> ok
  294. // ModelUtils::GetOutputDataAddrs -> ok
  295. // rtMalloc -> RT_ERROR_NONE
  296. // rtMemcpy -> RT_ERROR_NONE
  297. EXPECT_EQ(kernel_task_info.Init(task_def, &model), SUCCESS);
  298. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  299. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  300. kernel_def->clear_context();
  301. task_def.clear_kernel();
  302. }
  303. TEST_F(UtestKernelTaskInfo, init_kernel_taskInfo_with_aicpu_kernel_type_fail) {
  304. DavinciModel model(0, nullptr);
  305. rtStream_t stream = nullptr;
  306. rtStreamCreate(&stream, 0);
  307. model.stream_list_ = { stream };
  308. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  309. AttrUtils::SetBool(model.op_list_[0], "_AllShape", true);
  310. domi::TaskDef task_def;
  311. KernelTaskInfo kernel_task_info;
  312. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  313. task_def.set_type(RT_MODEL_TASK_KERNEL);
  314. string args;
  315. args.append(100, '1');
  316. kernel_def->set_so_name("libDvpp.so");
  317. kernel_def->set_kernel_name("DvppResize");
  318. kernel_def->set_args(args.data(), 100);
  319. kernel_def->set_args_size(100);
  320. domi::KernelContext *ctx = kernel_def->mutable_context();
  321. ctx->set_kernel_type(6);
  322. ctx->set_op_index(0);
  323. // ModelUtils::GetInputDataAddrs -> ok
  324. // ModelUtils::GetOutputDataAddrs -> ok
  325. // rtMalloc -> RT_ERROR_NONE
  326. // rtMemcpy -> RT_ERROR_INVALID_VALUE
  327. EXPECT_EQ(kernel_task_info.Init(task_def, &model), SUCCESS);
  328. const string ext_info = {1, 1, 1, 1, 0, 0, 0, 0};
  329. EXPECT_EQ(kernel_task_info.InitAicpuTaskExtInfo(ext_info), SUCCESS);
  330. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  331. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  332. kernel_def->clear_context();
  333. task_def.clear_kernel();
  334. }
  335. TEST_F(UtestKernelTaskInfo, init_kernel_taskInfo_with_aicpu_kernel_type_fail2) {
  336. DavinciModel model(0, nullptr);
  337. rtStream_t stream = nullptr;
  338. rtStreamCreate(&stream, 0);
  339. model.stream_list_ = { stream };
  340. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  341. domi::TaskDef task_def;
  342. KernelTaskInfo kernel_task_info;
  343. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  344. task_def.set_type(RT_MODEL_TASK_KERNEL);
  345. string args;
  346. args.append(100, '1');
  347. kernel_def->set_so_name("libDvpp.so");
  348. kernel_def->set_kernel_name("DvppResize");
  349. kernel_def->set_args(args.data(), 100);
  350. kernel_def->set_args_size(100);
  351. domi::KernelContext *ctx = kernel_def->mutable_context();
  352. ctx->set_kernel_type(6);
  353. ctx->set_op_index(0);
  354. // ModelUtils::GetInputDataAddrs -> ok
  355. // ModelUtils::GetOutputDataAddrs -> ok
  356. // rtMalloc -> RT_ERROR_INVALID_VALUE
  357. // rtMemcpy -> RT_ERROR_NONE
  358. EXPECT_EQ(kernel_task_info.Init(task_def, &model), SUCCESS);
  359. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  360. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  361. kernel_def->clear_context();
  362. task_def.clear_kernel();
  363. }
  364. // test StoreInputOutputTensor failed
  365. TEST_F(UtestKernelTaskInfo, store_input_output_tensor_fail) {
  366. std::vector<void *> input_data_addrs;
  367. std::vector<void *> output_data_addrs;
  368. std::vector<::tagCcAICPUTensor> input_descs;
  369. std::vector<::tagCcAICPUTensor> output_descs;
  370. KernelTaskInfo kernel_task_info;
  371. // rtMalloc -> RT_ERROR_INVALID_VALUE
  372. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  373. }
  374. TEST_F(UtestKernelTaskInfo, store_input_output_tensor_fail2) {
  375. std::vector<void *> input_data_addrs;
  376. std::vector<void *> output_data_addrs;
  377. std::vector<::tagCcAICPUTensor> input_descs;
  378. std::vector<::tagCcAICPUTensor> output_descs;
  379. KernelTaskInfo kernel_task_info;
  380. // rtMalloc -> RT_ERROR_INVALID_VALUE
  381. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  382. }
  383. // test InitCceTask success
  384. TEST_F(UtestKernelTaskInfo, kernel_task_info_init_cce_task) {
  385. DavinciModel model(0, nullptr);
  386. rtStream_t stream = nullptr;
  387. rtStreamCreate(&stream, 0);
  388. model.stream_list_ = { stream };
  389. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  390. domi::TaskDef task_def;
  391. KernelTaskInfo kernel_task_info;
  392. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  393. kernel_task_info.davinci_model_ = &model;
  394. kernel_task_info.op_desc_ = model.op_list_[0];
  395. kernel_def->set_flowtable("InitCceTask");
  396. domi::KernelContext *context = kernel_def->mutable_context();
  397. context->set_is_flowtable(true);
  398. rtSmDesc_t l2CtrlInfo;
  399. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  400. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  401. model.runtime_param_.logic_mem_base = 0;
  402. model.runtime_param_.mem_size = 0;
  403. model.runtime_param_.logic_weight_base = 0;
  404. model.runtime_param_.weight_size = 0;
  405. model.runtime_param_.logic_var_base = 0;
  406. model.runtime_param_.var_size = 0;
  407. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  408. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  409. // rtMalloc -> RT_ERROR_NONE
  410. // rtMemcpy -> RT_ERROR_NONE
  411. // rtMemAllocManaged -> RT_ERROR_NONE
  412. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  413. kernel_def->clear_context();
  414. task_def.clear_kernel();
  415. }
  416. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed1) {
  417. DavinciModel model(0, nullptr);
  418. domi::TaskDef task_def;
  419. KernelTaskInfo kernel_task_info;
  420. kernel_task_info.davinci_model_ = &model;
  421. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  422. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  423. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  424. task_def.clear_kernel();
  425. }
  426. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed2) {
  427. DavinciModel model(0, nullptr);
  428. rtStream_t stream = nullptr;
  429. rtStreamCreate(&stream, 0);
  430. model.stream_list_ = { stream };
  431. model.op_list_[0] = CreateOpDesc("", "");
  432. domi::TaskDef task_def;
  433. KernelTaskInfo kernel_task_info;
  434. kernel_task_info.davinci_model_ = &model;
  435. kernel_task_info.op_desc_ = model.op_list_[0];
  436. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  437. // KernelTaskInfo::SetContext -> SUCCESS
  438. domi::KernelContext *context = kernel_def->mutable_context();
  439. context->set_is_flowtable(true);
  440. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  441. kernel_def->clear_context();
  442. task_def.clear_kernel();
  443. }
  444. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed3) {
  445. DavinciModel model(0, nullptr);
  446. rtStream_t stream = nullptr;
  447. rtStreamCreate(&stream, 0);
  448. model.stream_list_ = { stream };
  449. model.op_list_[0] = CreateOpDesc("", "");
  450. domi::TaskDef task_def;
  451. KernelTaskInfo kernel_task_info;
  452. kernel_task_info.davinci_model_ = &model;
  453. kernel_task_info.op_desc_ = model.op_list_[0];
  454. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  455. // KernelTaskInfo::SetContext -> SUCCESS
  456. kernel_def->set_flowtable("InitCceTask");
  457. domi::KernelContext *context = kernel_def->mutable_context();
  458. context->set_is_flowtable(true);
  459. // KernelTaskInfo::UpdateCceArgs -> CCE_FAILED
  460. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  461. kernel_def->clear_context();
  462. task_def.clear_kernel();
  463. }
  464. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed4) {
  465. DavinciModel model(0, nullptr);
  466. rtStream_t stream = nullptr;
  467. rtStreamCreate(&stream, 0);
  468. model.stream_list_ = { stream };
  469. model.op_list_[0] = CreateOpDesc("", "");
  470. domi::TaskDef task_def;
  471. KernelTaskInfo kernel_task_info;
  472. kernel_task_info.davinci_model_ = &model;
  473. kernel_task_info.op_desc_ = model.op_list_[0];
  474. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  475. // KernelTaskInfo::SetContext -> SUCCESS
  476. kernel_def->set_flowtable("InitCceTask");
  477. domi::KernelContext *context = kernel_def->mutable_context();
  478. context->set_is_flowtable(true);
  479. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  480. // KernelTaskInfo::SetFlowtable -> RT_FAILED
  481. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  482. kernel_def->clear_context();
  483. task_def.clear_kernel();
  484. }
  485. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed5) {
  486. DavinciModel model(0, nullptr);
  487. rtStream_t stream = nullptr;
  488. rtStreamCreate(&stream, 0);
  489. model.stream_list_ = { stream };
  490. model.op_list_[0] = CreateOpDesc("", "");
  491. domi::TaskDef task_def;
  492. KernelTaskInfo kernel_task_info;
  493. kernel_task_info.davinci_model_ = &model;
  494. kernel_task_info.op_desc_ = model.op_list_[0];
  495. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  496. // KernelTaskInfo::SetContext -> SUCCESS
  497. kernel_def->set_flowtable("InitCceTask");
  498. domi::KernelContext *context = kernel_def->mutable_context();
  499. context->set_is_flowtable(true);
  500. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  501. // KernelTaskInfo::SetFlowtable -> SUCCESS
  502. // rtMalloc -> RT_ERROR_INVALID_VALUE
  503. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  504. kernel_def->clear_context();
  505. task_def.clear_kernel();
  506. }
  507. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed6) {
  508. DavinciModel model(0, nullptr);
  509. rtStream_t stream = nullptr;
  510. rtStreamCreate(&stream, 0);
  511. model.stream_list_ = { stream };
  512. model.op_list_[0] = CreateOpDesc("", "");
  513. domi::TaskDef task_def;
  514. KernelTaskInfo kernel_task_info;
  515. kernel_task_info.davinci_model_ = &model;
  516. kernel_task_info.op_desc_ = model.op_list_[0];
  517. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  518. // KernelTaskInfo::SetContext -> SUCCESS
  519. kernel_def->set_flowtable("InitCceTask");
  520. domi::KernelContext *context = kernel_def->mutable_context();
  521. context->set_is_flowtable(true);
  522. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  523. // KernelTaskInfo::SetFlowtable -> SUCCESS
  524. // rtMalloc -> RT_ERROR_NONE
  525. // rtMemcpy -> RT_ERROR_INVALID_VALUE
  526. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  527. kernel_def->clear_context();
  528. task_def.clear_kernel();
  529. }
  530. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed7) {
  531. DavinciModel model(0, nullptr);
  532. rtStream_t stream = nullptr;
  533. rtStreamCreate(&stream, 0);
  534. model.stream_list_ = { stream };
  535. model.op_list_[0] = CreateOpDesc("", "");
  536. domi::TaskDef task_def;
  537. KernelTaskInfo kernel_task_info;
  538. kernel_task_info.davinci_model_ = &model;
  539. kernel_task_info.op_desc_ = model.op_list_[0];
  540. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  541. // KernelTaskInfo::SetContext -> SUCCESS
  542. kernel_def->set_flowtable("InitCceTask");
  543. domi::KernelContext *context = kernel_def->mutable_context();
  544. context->set_is_flowtable(true);
  545. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  546. // KernelTaskInfo::SetFlowtable -> SUCCESS
  547. rtSmDesc_t l2CtrlInfo;
  548. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  549. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  550. // rtMalloc -> RT_ERROR_NONE
  551. // rtMemcpy -> RT_ERROR_NONE
  552. // rtMemAllocManaged -> RT_ERROR_INVALID_VALUE
  553. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  554. kernel_def->clear_context();
  555. task_def.clear_kernel();
  556. }
  557. // test SetContext success
  558. TEST_F(UtestKernelTaskInfo, success_kernel_taskInfo_init_set_context) {
  559. DavinciModel model(0, nullptr);
  560. domi::TaskDef task_def;
  561. KernelTaskInfo kernel_task_info;
  562. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  563. domi::KernelContext *context = kernel_def->mutable_context();
  564. context->set_op_id(1);
  565. context->set_kernel_func_id(1);
  566. context->set_is_flowtable(true);
  567. context->set_args_count(1);
  568. context->set_args_offset("args111111", 10);
  569. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  570. EXPECT_EQ(kernel_task_info.SetContext(*kernel_def), SUCCESS);
  571. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  572. kernel_def->clear_context();
  573. task_def.clear_kernel();
  574. }
  575. // test SetContext failed
  576. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_set_context_failed1) {
  577. DavinciModel model(0, nullptr);
  578. domi::TaskDef task_def;
  579. KernelTaskInfo kernel_task_info;
  580. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  581. domi::KernelContext *context = kernel_def->mutable_context();
  582. context->set_op_id(1);
  583. context->set_kernel_func_id(1);
  584. context->set_is_flowtable(true);
  585. context->set_args_count(0);
  586. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  587. EXPECT_EQ(kernel_task_info.SetContext(*kernel_def), INTERNAL_ERROR);
  588. kernel_def->clear_context();
  589. task_def.clear_kernel();
  590. }
  591. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_set_context_failed2) {
  592. DavinciModel model(0, nullptr);
  593. domi::TaskDef task_def;
  594. KernelTaskInfo kernel_task_info;
  595. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  596. domi::KernelContext *context = kernel_def->mutable_context();
  597. context->set_op_id(1);
  598. context->set_kernel_func_id(1);
  599. context->set_is_flowtable(true);
  600. context->set_args_count(5);
  601. context->set_args_offset("\0\0"); // args_offset = 0
  602. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  603. EXPECT_EQ(kernel_task_info.SetContext(*kernel_def), PARAM_INVALID);
  604. kernel_def->clear_context();
  605. task_def.clear_kernel();
  606. }
  607. // test UpdateCceArgs success
  608. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_cce_args) {
  609. DavinciModel model(0, nullptr);
  610. rtStream_t stream = nullptr;
  611. rtStreamCreate(&stream, 0);
  612. model.stream_list_ = { stream };
  613. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  614. domi::TaskDef task_def;
  615. KernelTaskInfo kernel_task_info;
  616. kernel_task_info.davinci_model_ = &model;
  617. kernel_task_info.op_desc_ = model.op_list_[0];
  618. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  619. domi::KernelContext *context = kernel_def->mutable_context();
  620. string flowtable("InitCceTask");
  621. string sm_desc("args");
  622. uint8_t test = 2;
  623. model.mem_base_ = &test;
  624. model.runtime_param_.logic_mem_base = 0;
  625. model.weights_mem_base_ = &test;
  626. model.runtime_param_.logic_weight_base = 0;
  627. uint8_t test1 = 16;
  628. model.var_mem_base_ = &test1;
  629. model.runtime_param_.logic_var_base = 0;
  630. context->set_is_flowtable(true);
  631. // KernelTaskInfo::CceUpdateKernelArgs ->SUCCESS
  632. EXPECT_EQ(kernel_task_info.UpdateCceArgs(sm_desc, flowtable, *kernel_def), FAILED);
  633. context->clear_is_flowtable();
  634. context->set_is_flowtable(false);
  635. // KernelTaskInfo::CceUpdateKernelArgs ->SUCCESS
  636. EXPECT_EQ(kernel_task_info.UpdateCceArgs(sm_desc, flowtable, *kernel_def), FAILED);
  637. kernel_def->clear_context();
  638. task_def.clear_kernel();
  639. model.mem_base_ = nullptr;
  640. model.weights_mem_base_ = nullptr;
  641. model.var_mem_base_ = nullptr;
  642. }
  643. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_cce_args_failed1) {
  644. DavinciModel model(0, nullptr);
  645. rtStream_t stream = nullptr;
  646. rtStreamCreate(&stream, 0);
  647. model.stream_list_ = { stream };
  648. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  649. domi::TaskDef task_def;
  650. KernelTaskInfo kernel_task_info;
  651. kernel_task_info.davinci_model_ = &model;
  652. kernel_task_info.op_desc_ = model.op_list_[0];
  653. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  654. domi::KernelContext *context = kernel_def->mutable_context();
  655. string flowtable("InitCceTask");
  656. string sm_desc("args");
  657. uint8_t test = 2;
  658. model.mem_base_ = &test;
  659. model.runtime_param_.logic_mem_base = 0;
  660. uint8_t test1 = 10;
  661. model.weights_mem_base_ = &test1;
  662. model.runtime_param_.logic_weight_base = 0;
  663. model.var_mem_base_ = &test1;
  664. model.runtime_param_.logic_var_base = 0;
  665. context->set_is_flowtable(true);
  666. // KernelTaskInfo::CceUpdateKernelArgs -> FAILED
  667. EXPECT_EQ(kernel_task_info.UpdateCceArgs(sm_desc, flowtable, *kernel_def), FAILED);
  668. kernel_def->clear_context();
  669. task_def.clear_kernel();
  670. model.mem_base_ = nullptr;
  671. model.weights_mem_base_ = nullptr;
  672. model.var_mem_base_ = nullptr;
  673. }
  674. // test SetFlowtable
  675. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable) {
  676. DavinciModel model(0, nullptr);
  677. rtStream_t stream = nullptr;
  678. rtStreamCreate(&stream, 0);
  679. model.stream_list_ = { stream };
  680. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  681. domi::TaskDef task_def;
  682. KernelTaskInfo kernel_task_info;
  683. kernel_task_info.davinci_model_ = &model;
  684. kernel_task_info.op_desc_ = model.op_list_[0];
  685. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  686. domi::KernelContext *context = kernel_def->mutable_context();
  687. string flowtable("InitCceTask");
  688. context->set_is_flowtable(false);
  689. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), SUCCESS);
  690. context->clear_is_flowtable();
  691. context->set_is_flowtable(true);
  692. // rtMalloc ->RT_ERROR_NONE
  693. // rtMemcpy ->RT_ERROR_NONE
  694. kernel_def->set_args("args111111", 10);
  695. context->set_args_offset("\0\0");
  696. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), SUCCESS);
  697. kernel_def->clear_context();
  698. task_def.clear_kernel();
  699. }
  700. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable_failed1) {
  701. DavinciModel model(0, nullptr);
  702. rtStream_t stream = nullptr;
  703. rtStreamCreate(&stream, 0);
  704. model.stream_list_ = { stream };
  705. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  706. domi::TaskDef task_def;
  707. KernelTaskInfo kernel_task_info;
  708. kernel_task_info.davinci_model_ = &model;
  709. kernel_task_info.op_desc_ = model.op_list_[0];
  710. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  711. domi::KernelContext *context = kernel_def->mutable_context();
  712. string flowtable("SetFlowtable");
  713. context->set_is_flowtable(true);
  714. // rtMalloc -> RT_ERROR_INVALID_VALUE
  715. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), FAILED);
  716. kernel_def->clear_context();
  717. task_def.clear_kernel();
  718. }
  719. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable_failed2) {
  720. DavinciModel model(0, nullptr);
  721. rtStream_t stream = nullptr;
  722. rtStreamCreate(&stream, 0);
  723. model.stream_list_ = { stream };
  724. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  725. domi::TaskDef task_def;
  726. KernelTaskInfo kernel_task_info;
  727. kernel_task_info.davinci_model_ = &model;
  728. kernel_task_info.op_desc_ = model.op_list_[0];
  729. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  730. domi::KernelContext *context = kernel_def->mutable_context();
  731. string flowtable("SetFlowtable");
  732. context->set_is_flowtable(true);
  733. // rtMalloc ->RT_ERROR_NONE
  734. // rtMemcpy ->RT_ERROR_INVALID_VALUE
  735. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), FAILED);
  736. kernel_def->clear_context();
  737. task_def.clear_kernel();
  738. }
  739. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable_failed3) {
  740. DavinciModel model(0, nullptr);
  741. rtStream_t stream = nullptr;
  742. rtStreamCreate(&stream, 0);
  743. model.stream_list_ = { stream };
  744. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  745. domi::TaskDef task_def;
  746. KernelTaskInfo kernel_task_info;
  747. kernel_task_info.davinci_model_ = &model;
  748. kernel_task_info.op_desc_ = model.op_list_[0];
  749. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  750. domi::KernelContext *context = kernel_def->mutable_context();
  751. string flowtable("SetFlowtable");
  752. context->set_is_flowtable(true);
  753. // rtMalloc ->RT_ERROR_NONE
  754. // rtMemcpy ->RT_ERROR_NONE
  755. kernel_def->set_args("args", 4);
  756. context->set_args_offset("args111111", 10);
  757. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), FAILED);
  758. kernel_def->clear_context();
  759. task_def.clear_kernel();
  760. }
  761. TEST_F(UtestKernelTaskInfo, distribute_failed) {
  762. KernelTaskInfo kernel_task_info;
  763. DavinciModel model(0, nullptr);
  764. domi::TaskDef task_def;
  765. // Failed for SetStream
  766. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  767. // rtKernelLaunchWithFlag -> RT_ERROR_INVALID_VALUE
  768. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  769. }
  770. TEST_F(UtestKernelTaskInfo, distribute_success) {
  771. KernelTaskInfo kernel_task_info;
  772. DavinciModel model(0, nullptr);
  773. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  774. domi::TaskDef task_def;
  775. // rtModelGetTaskId -> RT_ERROR_INVALID_VALUE
  776. rtModel_t rt_model_handle = (rtModel_t *)0x12345678;
  777. model.rt_model_handle_ = rt_model_handle;
  778. // Failed for SetStream
  779. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  780. // rtKernelLaunchWithFlag -> RT_ERROR_INVALID_VALUE
  781. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  782. model.rt_model_handle_ = nullptr;
  783. }
  784. // test success DistributeDumpTask
  785. TEST_F(UtestKernelTaskInfo, success_distribute_dump_task) {
  786. DavinciModel model(0, nullptr);
  787. domi::TaskDef task_def;
  788. KernelTaskInfo kernel_task_info;
  789. kernel_task_info.davinci_model_ = &model;
  790. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  791. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  792. kernel_def->set_stub_func("kerneltaskinfo");
  793. kernel_def->set_block_dim(10);
  794. kernel_def->set_args("args111111", 10);
  795. kernel_def->set_args_size(10);
  796. rtSmDesc_t l2CtrlInfo;
  797. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  798. kernel_def->set_sm_desc((void *)&l2CtrlInfo, sizeof(rtSmDesc_t));
  799. // for SetStream
  800. rtStream_t stream = nullptr;
  801. rtStreamCreate(&stream, 0);
  802. std::vector<rtStream_t> stream_list = { stream };
  803. EXPECT_EQ(kernel_task_info.SetStream(0, stream_list), SUCCESS);
  804. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  805. rtStreamDestroy(stream);
  806. task_def.clear_kernel();
  807. }
  808. // test success GetTaskID
  809. TEST_F(UtestKernelTaskInfo, success_get_task_id) {
  810. domi::ModelTaskDef model_task_def;
  811. domi::TaskDef *task = model_task_def.add_task();
  812. task->set_type(RT_MODEL_TASK_KERNEL);
  813. TaskInfoPtr task_info = TaskInfoFactory::Instance().Create(static_cast<rtModelTaskType_t>(task->type()));
  814. EXPECT_EQ(task_info->GetTaskID(), 0);
  815. KernelTaskInfo kernel_task_info;
  816. EXPECT_EQ(kernel_task_info.GetTaskID(), 0);
  817. HcclTaskInfo hccl_task_info;
  818. EXPECT_EQ(hccl_task_info.GetTaskID(), 0);
  819. }
  820. // test StoreInputOutputTensor success
  821. TEST_F(UtestKernelTaskInfo, success_store_input_output_tensor) {
  822. DavinciModel model(0, nullptr);
  823. domi::TaskDef task_def;
  824. KernelTaskInfo kernel_task_info;
  825. kernel_task_info.davinci_model_ = &model;
  826. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  827. std::vector<void *> input_data_addrs;
  828. std::vector<void *> output_data_addrs;
  829. std::vector<::tagCcAICPUTensor> input_descs;
  830. std::vector<::tagCcAICPUTensor> output_descs;
  831. int test = 1;
  832. int *addr = &test;
  833. void *input = addr;
  834. void *output = addr;
  835. input_data_addrs.push_back(input);
  836. output_data_addrs.push_back(output);
  837. tagCcAICPUTensor input_desc;
  838. tagCcAICPUTensor output_desc;
  839. input_descs.push_back(input_desc);
  840. output_descs.push_back(output_desc);
  841. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  842. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  843. }
  844. // test KernelTaskInfo release fail
  845. TEST_F(UtestKernelTaskInfo, fail_release) {
  846. DavinciModel model(0, nullptr);
  847. domi::TaskDef task_def;
  848. KernelTaskInfo kernel_task_info;
  849. kernel_task_info.davinci_model_ = &model;
  850. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  851. std::vector<void *> input_data_addrs;
  852. std::vector<void *> output_data_addrs;
  853. std::vector<::tagCcAICPUTensor> input_descs;
  854. std::vector<::tagCcAICPUTensor> output_descs;
  855. int test = 1;
  856. int *addr = &test;
  857. void *input = addr;
  858. void *output = addr;
  859. input_data_addrs.push_back(input);
  860. output_data_addrs.push_back(output);
  861. tagCcAICPUTensor input_desc;
  862. tagCcAICPUTensor output_desc;
  863. input_descs.push_back(input_desc);
  864. output_descs.push_back(output_desc);
  865. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  866. // rtMemFreeManaged -> RT_ERROR_INVALID_VALUE
  867. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  868. }
  869. // test KernelTaskInfo release fail
  870. TEST_F(UtestKernelTaskInfo, update_l2data_success) {
  871. DavinciModel model(0, nullptr);
  872. KernelTaskInfo kernel_task_info;
  873. kernel_task_info.davinci_model_ = &model;
  874. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  875. domi::KernelDef kernel_def;
  876. EXPECT_EQ(kernel_task_info.UpdateL2Data(kernel_def), SUCCESS);
  877. }
  878. // test fusion_end_task Init
  879. TEST_F(UtestKernelTaskInfo, kernel_task_info_init_success) {
  880. rtStream_t stream = nullptr;
  881. rtStreamCreate(&stream, 0);
  882. DavinciModel model(0, nullptr);
  883. auto model_def = MakeShared<domi::ModelTaskDef>();
  884. model.model_id_ = 1;
  885. model.name_ = "test";
  886. model.version_ = 0x01;
  887. model.stream_list_ = { stream };
  888. model.ge_model_ = MakeShared<GeModel>();
  889. model.ge_model_->SetModelTaskDef(model_def);
  890. auto op_desc = CreateOpDesc("data", DATA);
  891. op_desc->SetInputOffset({1});
  892. op_desc->SetOutputOffset({100});
  893. GeTensorDesc descin(GeShape({1, 1, 1, 1}), FORMAT_NCHW, DT_FLOAT);
  894. TensorUtils::SetSize(descin, 4);
  895. op_desc->AddInputDesc(descin);
  896. GeTensorDesc descout(GeShape({1, 1, 1, 1}), FORMAT_NCHW, DT_FLOAT16);
  897. TensorUtils::SetSize(descout, 32);
  898. op_desc->AddOutputDesc(descout);
  899. op_desc->SetId(0);
  900. model.op_list_[0] = op_desc;
  901. domi::TaskDef task_def;
  902. task_def.set_stream_id(0);
  903. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  904. domi::KernelContext *ctx = kernel_def->mutable_context();
  905. ctx->set_op_index(0);
  906. vector<string> original_op_names = { "conv", "add" };
  907. AttrUtils::GetListStr(op_desc, ATTR_NAME_DATA_DUMP_ORIGIN_OP_NAMES, original_op_names);
  908. KernelTaskInfo kernel_task_info;
  909. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  910. }
  911. TEST_F(UtestKernelTaskInfo, kernel_task_info_calculate_args_te) {
  912. DavinciModel model(0, nullptr);
  913. domi::TaskDef task_def;
  914. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  915. domi::KernelContext *ctx = kernel_def->mutable_context();
  916. ctx->set_kernel_type(2);
  917. KernelTaskInfo kernel_task_info;
  918. EXPECT_EQ(kernel_task_info.CalculateArgs(task_def, &model), SUCCESS);
  919. }
  920. TEST_F(UtestKernelTaskInfo, kernel_task_info_calculate_args_aicpu) {
  921. DavinciModel model(0, nullptr);
  922. domi::TaskDef task_def;
  923. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  924. domi::KernelContext *ctx = kernel_def->mutable_context();
  925. ctx->set_kernel_type(6);
  926. KernelTaskInfo kernel_task_info;
  927. EXPECT_EQ(kernel_task_info.CalculateArgs(task_def, &model), SUCCESS);
  928. }
  929. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_args_te) {
  930. DavinciModel model(0, nullptr);
  931. KernelTaskInfo kernel_task_info;
  932. kernel_task_info.kernel_type_ = ccKernelType::TE;
  933. kernel_task_info.davinci_model_ = &model;
  934. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  935. EXPECT_EQ(kernel_task_info.UpdateArgs(), SUCCESS);
  936. }
  937. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_args_aicpu) {
  938. DavinciModel model(0, nullptr);
  939. KernelTaskInfo kernel_task_info;
  940. kernel_task_info.kernel_type_ = ccKernelType::TE;
  941. kernel_task_info.davinci_model_ = &model;
  942. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  943. kernel_task_info.args_size_ = 120;
  944. kernel_task_info.args_addr = std::unique_ptr<uint8_t[]>(new (std::nothrow) uint8_t[kernel_task_info.args_size_]);
  945. kernel_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  946. rtMalloc(&kernel_task_info.args_, kernel_task_info.args_size_, RT_MEMORY_HBM);
  947. EXPECT_EQ(kernel_task_info.UpdateArgs(), SUCCESS);
  948. }
  949. TEST_F(UtestKernelTaskInfo, kernel_task_info_super_kernel_info) {
  950. DavinciModel model(0, nullptr);
  951. KernelTaskInfo kernel_task_info;
  952. kernel_task_info.davinci_model_ = &model;
  953. kernel_task_info.op_desc_ = CreateOpDesc("FrameworkOp", "FrameworkOp");
  954. EXPECT_EQ(kernel_task_info.SaveSuperKernelInfo(), SUCCESS);
  955. kernel_task_info.UpdateSKTTaskId();
  956. EXPECT_EQ(kernel_task_info.SKTFinalize(), SUCCESS);
  957. }
  958. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。