You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

rt_model.h 8.8 kB

5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef __CCE_RUNTIME_MODEL_H__
  17. #define __CCE_RUNTIME_MODEL_H__
  18. #include "base.h"
  19. #ifdef __cplusplus
  20. extern "C" {
  21. #endif // __cplusplus
  22. typedef enum tagModelTaskType {
  23. RT_MODEL_TASK_KERNEL = 0,
  24. RT_MODEL_TASK_EVENT_RECORD,
  25. RT_MODEL_TASK_EVENT_WAIT,
  26. RT_MODEL_TASK_FUSION_START,
  27. RT_MODEL_TASK_FUSION_END,
  28. RT_MODEL_TASK_KERNEL_EX,
  29. RT_MODEL_TASK_HCCL,
  30. RT_MODEL_TASK_STREAM_SWITCH,
  31. RT_MODEL_TASK_STREAM_ACTIVE,
  32. RT_MODEL_TASK_LABEL_SET,
  33. RT_MODEL_TASK_LABEL_SWITCH,
  34. RT_MODEL_TASK_LABEL_GOTO,
  35. RT_MODEL_TASK_PROFILER_TRACE,
  36. RT_MODEL_TASK_MEMCPY_ASYNC,
  37. RT_MODEL_TASK_NOTIFY_RECORD,
  38. RT_MODEL_TASK_NOTIFY_WAIT,
  39. RT_MODEL_TASK_REDUCE_ASYNC,
  40. RT_MODEL_TASK_RDMA_SEND,
  41. RT_MODEL_TASK_EVENT_RESET = 18,
  42. RT_MODEL_TASK_MODEL_END_GRAPH,
  43. RT_MODEL_TASK_STREAM_SWITCH_N
  44. } rtModelTaskType_t;
  45. typedef enum tagModelStreamType {
  46. RT_MODEL_HEAD_STREAM = 0,
  47. RT_MODEL_WAIT_ACTIVE_STREAM = 1
  48. } rtModelStreamType_t;
  49. #define EXECUTOR_NONE ((uint32_t)0x0)
  50. #define EXECUTOR_TS ((uint32_t)0x01)
  51. #define EXECUTOR_AICPU ((uint32_t)0x02)
  52. /**
  53. * @ingroup
  54. * @brief the type defination of aicpu model task command
  55. */
  56. typedef enum tagTsAicpuModelCmd {
  57. TS_AICPU_MODEL_LOAD = 1,
  58. TS_AICPU_MODEL_EXECUTE,
  59. TS_AICPU_MODEL_DESTROY,
  60. TS_AICPU_MODEL_ABORT,
  61. TS_AICPU_MODEL_RESERVED,
  62. } tsAicpuModelCmd;
  63. typedef struct tagAicpuTaskInfo {
  64. uint32_t taskID;
  65. uint32_t streamID;
  66. uint32_t kernelType;
  67. uint64_t kernelName;
  68. uint64_t kernelSo;
  69. uint64_t paraBase;
  70. uint32_t taskFlag;
  71. } rtAicpuTaskInfo_t;
  72. typedef struct tagModelStreamInfo {
  73. uint32_t streamID;
  74. uint32_t streamFlag;
  75. } rtModelStreamInfo_t;
  76. typedef struct tagAicpuModelInfo {
  77. uint32_t moduleID;
  78. uint32_t tsId;
  79. uint16_t streamInfoNum;
  80. uint16_t aicpuTaskNum;
  81. uint64_t streamInfoPtr;
  82. uint64_t aicpuTaskPtr;
  83. } rtAicpuModelInfo_t;
  84. /* lint -e148 */
  85. typedef struct tagKernelTaskInfo {
  86. uint16_t blockDim;
  87. uint16_t argsCount;
  88. uint16_t argsSize;
  89. uint16_t reserved;
  90. char *stubFunc;
  91. uint8_t *smDesc;
  92. uint8_t *args;
  93. uint16_t *argsOffset;
  94. } rtKernelTaskInfo_t; /* lint +e148 */
  95. typedef struct tagKernelTaskInfoEx {
  96. uint32_t flags;
  97. uint32_t argsSize;
  98. void *args;
  99. uint32_t reserved[6];
  100. } rtKernelTaskInfoEx_t;
  101. typedef struct tagEventTaskInfo {
  102. uint32_t eventID;
  103. uint32_t reserved[9];
  104. } rtEventTaskInfo_t;
  105. typedef struct tagStreamSwitchTaskInfo {
  106. int64_t value;
  107. uint64_t pValuePtr;
  108. uint32_t trueStreamID;
  109. uint32_t dataType;
  110. uint32_t reserved[4];
  111. } rtStreamSwitchTaskInfo_t;
  112. typedef struct tagStreamSwitchNTaskInfo {
  113. uint64_t pValuePtr;
  114. uint64_t pTrueStreamPtr;
  115. uint32_t size;
  116. uint32_t elementSize;
  117. uint32_t dataType;
  118. uint32_t reserved[3];
  119. } rtStreamSwitchNTaskInfo_t;
  120. typedef struct tagStreamActiveTaskInfo {
  121. uint32_t activeStreamID;
  122. uint32_t reserved[9];
  123. } rtStreamActiveTaskInfo_t;
  124. typedef struct tagSetTaskInfo {
  125. uint16_t labelId;
  126. uint32_t reserved[9];
  127. } rtLabelSetTaskInfo_t;
  128. typedef struct tagSwitchTaskInfo {
  129. uint32_t value;
  130. uint32_t reserved[9];
  131. } rtLabelSwitchTaskInfo_t;
  132. typedef struct tagLabelGotoTaskInfo {
  133. uint16_t labelId;
  134. uint32_t reserved[9];
  135. } rtLabelGotoTaskInfo_t;
  136. typedef struct tagProfilerTraceTaskInfo {
  137. uint64_t profilerTraceId;
  138. uint32_t notify : 8;
  139. uint32_t reserved_ : 24;
  140. uint32_t flags;
  141. uint32_t reserved[6];
  142. } rtProfilerTrace_t;
  143. typedef struct tagrtMemcpyAsyncTaskInfo {
  144. void *dst;
  145. uint64_t destMax;
  146. void *src;
  147. uint64_t count;
  148. uint32_t kind;
  149. uint32_t reserved;
  150. } rtMemcpyAsyncTaskInfo_t;
  151. typedef struct tagrtNotifyTaskInfo {
  152. uint32_t notifyID;
  153. uint32_t reserved[9];
  154. } rtNotifyTaskInfo_t;
  155. typedef struct tagrtReduceAsyncTaskInfo {
  156. void *dst;
  157. uint64_t destMax;
  158. void *src;
  159. uint64_t count;
  160. uint32_t kind;
  161. uint32_t type;
  162. } rtReduceAsyncTaskInfo_t;
  163. typedef struct tagrtRdmaSendTaskInfo {
  164. uint32_t index;
  165. uint32_t wqe_index;
  166. uint32_t reserved[8];
  167. } rtRdmaSendTaskInfo_t;
  168. typedef struct tagrtModelEndGraphTaskInfo {
  169. uint32_t modelId;
  170. uint32_t executorFlag;
  171. uint32_t reserved[8];
  172. } rtModelEndGraphTaskInfo_t;
  173. typedef struct tagTaskInfo {
  174. uint32_t type;
  175. uint32_t streamID;
  176. union {
  177. rtKernelTaskInfoEx_t kernelTaskEx;
  178. rtKernelTaskInfo_t kernelTask;
  179. rtEventTaskInfo_t eventTask;
  180. rtStreamSwitchTaskInfo_t streamSwitchTask;
  181. rtStreamActiveTaskInfo_t streamActiveTask;
  182. rtLabelSetTaskInfo_t labelSetTask;
  183. rtLabelSwitchTaskInfo_t labelSwitchTask;
  184. rtLabelGotoTaskInfo_t labelGotoTask;
  185. rtProfilerTrace_t profilertraceTask;
  186. rtMemcpyAsyncTaskInfo_t memcpyAsyncTask;
  187. rtNotifyTaskInfo_t notifyTask;
  188. rtReduceAsyncTaskInfo_t reduceAsyncTask;
  189. rtRdmaSendTaskInfo_t rdmaSendTask;
  190. rtModelEndGraphTaskInfo_t modelEndGraphTask;
  191. rtStreamSwitchNTaskInfo_t streamSwitchNTask;
  192. uint32_t reserved[10];
  193. } u;
  194. } rtTaskInfo_t;
  195. typedef void *rtModel_t;
  196. typedef rtError_t (*rtTaskGenCallback)(rtModel_t model, rtTaskInfo_t *taskInfo);
  197. /**
  198. * @ingroup rt_model
  199. * @brief set callback for generate model
  200. * @param [in] callBack callback function
  201. * @return RT_ERROR_NONE for ok
  202. * @return RT_ERROR_INVALID_RESOURCE_HANDLE for error input handle
  203. */
  204. RTS_API rtError_t rtSetTaskGenCallback(rtTaskGenCallback callback);
  205. /**
  206. * @ingroup rt_model
  207. * @brief create model instance
  208. * @param [out] model created model
  209. * @param [in] flag reserved
  210. * @return RT_ERROR_NONE for ok
  211. * @return RT_ERROR_INVALID_RESOURCE_HANDLE for error input handle
  212. */
  213. RTS_API rtError_t rtModelCreate(rtModel_t *model, uint32_t flag);
  214. /**
  215. * @ingroup rt_model
  216. * @brief destroy model instance
  217. * @param [in] model model to destroy
  218. * @return RT_ERROR_NONE for ok
  219. * @return RT_ERROR_INVALID_RESOURCE_HANDLE for error input handle
  220. */
  221. RTS_API rtError_t rtModelDestroy(rtModel_t model);
  222. /**
  223. * @ingroup rt_model
  224. * @brief bind model and stream instance
  225. * @param [in] model binded model
  226. * @param [in] stream binded stream
  227. * @param [in] flag reserved
  228. * @return RT_ERROR_NONE for ok
  229. * @return RT_ERROR_INVALID_RESOURCE_HANDLE for error input handle
  230. */
  231. RTS_API rtError_t rtModelBindStream(rtModel_t model, rtStream_t stream, uint32_t flag);
  232. /**
  233. * @ingroup rt_model
  234. * @brief unbind model and stream instance
  235. * @param [in] model unbinded model
  236. * @param [in] stream unbinded stream
  237. * @return RT_ERROR_NONE for ok
  238. * @return RT_ERROR_INVALID_RESOURCE_HANDLE for error input handle
  239. */
  240. RTS_API rtError_t rtModelUnbindStream(rtModel_t model, rtStream_t stream);
  241. /**
  242. * @ingroup rt_model
  243. * @brief tell runtime Model has been Loaded
  244. * @param [in] model model to execute
  245. * @return RT_ERROR_NONE for ok
  246. */
  247. RTS_API rtError_t rtModelLoadComplete(rtModel_t model);
  248. /**
  249. * @ingroup rt_model
  250. * @brief execute model instance
  251. * @param [in] model model to execute
  252. * @return RT_ERROR_NONE for ok
  253. * @return RT_ERROR_INVALID_RESOURCE_HANDLE for error input handle
  254. */
  255. RTS_API rtError_t rtModelExecute(rtModel_t model, rtStream_t stream, uint32_t flag);
  256. /**
  257. * @ingroup rt_model
  258. * @brief get model the last persist task id
  259. * @param [in] model model to execute
  260. * @param [out] taskid task id of the model
  261. * @return RT_ERROR_NONE for ok
  262. * @return RT_ERROR_INVALID_VALUE for error input handle
  263. */
  264. RTS_API rtError_t rtModelGetTaskId(rtModel_t model, uint32_t *taskid);
  265. /**
  266. * @ingroup rt_model
  267. * @brief add a end graph task to stream
  268. * @param [in] model model to execute
  269. * @param [in] end graph stream
  270. * @return RT_ERROR_NONE for ok
  271. * @return RT_ERROR_INVALID_VALUE for error input handle
  272. */
  273. RTS_API rtError_t rtEndGraph(rtModel_t model, rtStream_t stream);
  274. /**
  275. * @ingroup rt_model
  276. * @brief add a end graph task to stream
  277. * @param [in] model model to execute
  278. * @param [in] flags EXECUTOR_TS | EXECUTOR_AICPU
  279. * @return RT_ERROR_NONE for ok
  280. * @return RT_ERROR_INVALID_VALUE for error input handle
  281. */
  282. RTS_API rtError_t rtModelExecutorSet(rtModel_t model, uint8_t flags);
  283. /**
  284. * @ingroup rt_model
  285. * @brief abort model
  286. * @param [in] model model to abort
  287. * @return RT_ERROR_NONE for ok
  288. * @return RT_ERROR_INVALID_VALUE for error input handle
  289. */
  290. RTS_API rtError_t rtModelAbort(rtModel_t model);
  291. #ifdef __cplusplus
  292. }
  293. #endif
  294. #endif // __CCE_RUNTIME_MODEL_H__

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,而用户对此并无感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。