You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

rt_model.h 14 kB

5 years ago
5 years ago
3 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
3 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513
  1. /*
  2. * Copyright (c) Huawei Technologies Co., Ltd. 2020-2021. All rights reserved.
  3. * Description: rt_model.h
  4. * Create: 2020-01-01
  5. */
  6. #ifndef CCE_RUNTIME_RT_MODEL_H
  7. #define CCE_RUNTIME_RT_MODEL_H
  8. #include "base.h"
  9. #if defined(__cplusplus)
  10. extern "C" {
  11. #endif
  /**
   * @ingroup rt_model
   * @brief task type identifiers for model tasks
   *
   * Enumerators take consecutive values starting at RT_MODEL_TASK_KERNEL = 0,
   * so the last one, RT_MODEL_TASK_NPU_CLEAR_FLOAT_STATUS, is 34.
   */
  typedef enum tagModelTaskType {
      RT_MODEL_TASK_KERNEL = 0,
      RT_MODEL_TASK_EVENT_RECORD,
      RT_MODEL_TASK_EVENT_WAIT,
      RT_MODEL_TASK_FUSION_START,
      RT_MODEL_TASK_FUSION_END,
      RT_MODEL_TASK_KERNEL_EX,
      RT_MODEL_TASK_HCCL,
      RT_MODEL_TASK_STREAM_SWITCH,
      RT_MODEL_TASK_STREAM_ACTIVE,
      RT_MODEL_TASK_LABEL_SET,
      RT_MODEL_TASK_LABEL_SWITCH,
      RT_MODEL_TASK_LABEL_GOTO,
      RT_MODEL_TASK_PROFILER_TRACE,
      RT_MODEL_TASK_MEMCPY_ASYNC,
      RT_MODEL_TASK_NOTIFY_RECORD,
      RT_MODEL_TASK_NOTIFY_WAIT,
      RT_MODEL_TASK_REDUCE_ASYNC,
      RT_MODEL_TASK_RDMA_SEND,
      RT_MODEL_TASK_EVENT_RESET,
      RT_MODEL_TASK_MODEL_END_GRAPH,
      RT_MODEL_TASK_STREAM_SWITCH_N,
      RT_MODEL_TASK_RDMA_DB_SEND,
      RT_MODEL_TASK_MEMCPY_ADDR_ASYNC,
      RT_MODEL_TASK_STREAM_LABEL_SWITCH_BY_INDEX,
      RT_MODEL_TASK_STREAM_LABEL_GOTO,
      RT_MODEL_TASK_MODEL_EXIT,
      RT_MODEL_TASK_ALL_KERNEL,
      RT_MODEL_TASK_PROFILER_TRACE_EX,
      RT_MODEL_TASK_FFTS_TASK,
      RT_MODEL_TASK_FFTS_PLUS_TASK,
      RT_MODEL_TASK_DSA_TASK,
      RT_MODEL_TASK_CMO,
      RT_MODEL_TASK_BARRIER,
      RT_MODEL_TASK_NPU_GET_FLOAT_STATUS,
      RT_MODEL_TASK_NPU_CLEAR_FLOAT_STATUS,
  } rtModelTaskType_t;
  /**
   * @ingroup rt_model
   * @brief stream type within a model: head stream (0) or wait-active stream (1)
   */
  typedef enum tagModelStreamType {
      RT_MODEL_HEAD_STREAM = 0,
      RT_MODEL_WAIT_ACTIVE_STREAM = 1
  } rtModelStreamType_t;
  /**
   * @ingroup rt_model
   * @brief queue direction flag: input queue (0) or output queue (1)
   */
  typedef enum tagModelQueueFlag {
      RT_MODEL_INPUT_QUEUE = 0,
      RT_MODEL_OUTPUT_QUEUE = 1
  } rtModelQueueFlag_t;
  /**
   * @ingroup rt_model
   * @brief executor flags; EXECUTOR_TS and EXECUTOR_AICPU are distinct bits
   *        and may be OR-ed together
   */
  #define EXECUTOR_NONE (0x0U)
  #define EXECUTOR_TS (0x01U)
  #define EXECUTOR_AICPU (0x02U)

  /**
   * @ingroup rt_model
   * @brief debug flag for kernel exception dump
   */
  #define RT_DEBUG_FLAG_AICORE_OVERFLOW (0x1U << 0U)
  #define RT_DEBUG_FLAG_ATOMIC_ADD_OVERFLOW (0x1U << 1U)
  /**
   * @ingroup rt_model
   * @brief the type definition of aicpu model task command
   *
   * Values start at TS_AICPU_MODEL_LOAD = 1 and increase by one, so
   * TS_AICPU_MODEL_RESERVED is 5.
   */
  typedef enum tagTsAicpuModelCmd {
      TS_AICPU_MODEL_LOAD = 1,
      TS_AICPU_MODEL_EXECUTE,
      TS_AICPU_MODEL_DESTROY,
      TS_AICPU_MODEL_ABORT,
      TS_AICPU_MODEL_RESERVED,
  } tsAicpuModelCmd;
  /**
   * @ingroup rt_model
   * @brief descriptor of one aicpu task
   *
   * NOTE(review): kernelName, kernelSo and paraBase are 64-bit integers and
   * presumably carry addresses - confirm against the producer of this struct.
   */
  typedef struct tagAicpuTaskInfo {
      uint32_t taskID;
      uint32_t streamID;
      uint32_t kernelType;
      uint64_t kernelName;
      uint64_t kernelSo;
      uint64_t paraBase;
      uint32_t taskFlag;
  } rtAicpuTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief stream id / stream flag pair
   *
   * NOTE(review): streamFlag presumably holds an rtModelStreamType_t value -
   * confirm.
   */
  typedef struct tagModelStreamInfo {
      uint32_t streamID;
      uint32_t streamFlag;
  } rtModelStreamInfo_t;
  /**
   * @ingroup rt_model
   * @brief queue id / flag pair
   *
   * NOTE(review): flag presumably holds an rtModelQueueFlag_t value - confirm.
   */
  typedef struct tagModelQueueInfo {
      uint32_t queueID;
      uint32_t flag;
  } rtModelQueueInfo_t;
  /**
   * @ingroup rt_model
   * @brief aicpu model descriptor: ids, element counts and 64-bit pointer values
   *
   * NOTE(review): streamInfoPtr / aicpuTaskPtr / queueInfoPtr presumably refer
   * to arrays of rtModelStreamInfo_t / rtAicpuTaskInfo_t / rtModelQueueInfo_t
   * sized by streamInfoNum / aicpuTaskNum / queueSize - confirm.
   *
   * On ABIs that align uint64_t to 8 bytes the compiler inserts padding after
   * aicpuTaskNum and after queueSize; the field order must not be changed.
   */
  typedef struct tagAicpuModelInfo {
      uint32_t moduleID;
      uint32_t tsId;
      uint16_t streamInfoNum;
      uint16_t aicpuTaskNum;
      uint64_t streamInfoPtr;
      uint64_t aicpuTaskPtr;
      uint16_t queueSize;
      uint64_t queueInfoPtr;
  } rtAicpuModelInfo_t;
  104. typedef struct tagKernelTaskInfo {
  105. uint16_t blockDim;
  106. uint16_t argsCount;
  107. uint16_t argsSize;
  108. uint16_t reserved;
  109. const char_t *stubFunc;
  110. uint8_t *smDesc;
  111. const uint8_t *args;
  112. uint16_t *argsOffset;
  113. } rtKernelTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief all-kernel task payload (member allKernelTask of the rtTaskInfo_t union)
   *
   * Same leading fields as rtKernelTaskInfo_t, but identifies the kernel by
   * tilingKey and handle instead of a stub function pointer.
   * NOTE(review): with 8-byte pointers this struct is 48 bytes, larger than
   * the 40-byte reserved[10] member of the rtTaskInfo_t union - confirm this
   * is intended.
   */
  typedef struct tagAllKernelTaskInfo {
      uint16_t blockDim;
      uint16_t argsCount;
      uint16_t argsSize;
      uint16_t reserved;
      uint64_t tilingKey;
      void *handle;
      uint8_t *smDesc;
      const uint8_t *args;
      uint16_t *argsOffset;
  } rtAllKernelTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief extended kernel task payload (member kernelTaskEx of the rtTaskInfo_t union)
   *
   * args points to an argument buffer; argsSize is presumably its size in
   * bytes (NOTE(review): confirm).
   */
  typedef struct tagKernelTaskInfoEx {
      uint32_t flags;
      uint32_t argsSize;
      const void *args;
      uint32_t reserved[6];
  } rtKernelTaskInfoEx_t;
  /**
   * @ingroup rt_model
   * @brief event task payload (member eventTask of the rtTaskInfo_t union)
   *
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagEventTaskInfo {
      uint32_t eventID;
      uint32_t reserved[9];
  } rtEventTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief stream switch task payload (member streamSwitchTask of the rtTaskInfo_t union)
   *
   * The fields add up to 40 bytes with no implicit padding.
   */
  typedef struct tagStreamSwitchTaskInfo {
      int64_t value;
      uint64_t pValuePtr;
      uint32_t trueStreamID;
      uint32_t dataType;
      uint32_t reserved[4];
  } rtStreamSwitchTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief stream switch-N task payload (member streamSwitchNTask of the rtTaskInfo_t union)
   *
   * The fields add up to 40 bytes with no implicit padding.
   */
  typedef struct tagStreamSwitchNTaskInfo {
      uint64_t pValuePtr;
      uint64_t pTrueStreamPtr;
      uint32_t size;
      uint32_t elementSize;
      uint32_t dataType;
      uint32_t reserved[3];
  } rtStreamSwitchNTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief stream active task payload (member streamActiveTask of the rtTaskInfo_t union)
   *
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagStreamActiveTaskInfo {
      uint32_t activeStreamID;
      uint32_t reserved[9];
  } rtStreamActiveTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief label set task payload (member labelSetTask of the rtTaskInfo_t union)
   *
   * labelId is 16 bits wide; the 4-byte alignment of reserved leaves two
   * bytes of implicit padding after it.
   */
  typedef struct tagSetTaskInfo {
      uint16_t labelId;
      uint32_t reserved[9];
  } rtLabelSetTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief label switch task payload (member labelSwitchTask of the rtTaskInfo_t union)
   *
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagSwitchTaskInfo {
      uint32_t value;
      uint32_t reserved[9];
  } rtLabelSwitchTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief label goto task payload (member labelGotoTask of the rtTaskInfo_t union)
   *
   * Same field layout as rtLabelSetTaskInfo_t: a 16-bit labelId followed by
   * nine reserved 32-bit words.
   */
  typedef struct tagLabelGotoTaskInfo {
      uint16_t labelId;
      uint32_t reserved[9];
  } rtLabelGotoTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief profiler trace task payload (member profilertraceTask of the rtTaskInfo_t union)
   *
   * notify (8 bits) and reserved_ (24 bits) are bit-fields declared in
   * uint32_t, 32 bits in total.
   */
  typedef struct tagProfilerTraceTaskInfo {
      uint64_t profilerTraceId;
      uint32_t notify : 8;
      uint32_t reserved_ : 24;
      uint32_t flags;
      uint32_t reserved[6];
  } rtProfilerTrace_t;
  /**
   * @ingroup rt_model
   * @brief extended profiler trace task payload (member profilertraceExTask of the rtTaskInfo_t union)
   *
   * The fields add up to 40 bytes with no implicit padding.
   */
  typedef struct tagProfilerTraceExTaskInfo {
      uint64_t profilerTraceId;
      uint64_t modelId;
      uint16_t tagId;
      uint8_t reserved[22];
  } rtProfilerTraceEx_t;
  /**
   * @ingroup rt_model
   * @brief async memcpy task payload (member memcpyAsyncTask of the rtTaskInfo_t union)
   *
   * NOTE(review): dst is declared const void * although it names the
   * destination; left unchanged to keep the interface as is.
   * NOTE(review): destMax / count are presumably the destination capacity and
   * the number of bytes to copy - confirm.
   */
  typedef struct tagrtMemcpyAsyncTaskInfo {
      const void *dst;
      uint64_t destMax;
      const void *src;
      uint64_t count;
      uint32_t kind;
      uint32_t reserved;
  } rtMemcpyAsyncTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief notify task payload (member notifyTask of the rtTaskInfo_t union)
   *
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagrtNotifyTaskInfo {
      uint32_t notifyID;
      uint32_t reserved[9];
  } rtNotifyTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief async reduce task payload (member reduceAsyncTask of the rtTaskInfo_t union)
   *
   * Same fields as rtMemcpyAsyncTaskInfo_t except that the trailing 32-bit
   * word is named type instead of reserved.
   */
  typedef struct tagrtReduceAsyncTaskInfo {
      const void *dst;
      uint64_t destMax;
      const void *src;
      uint64_t count;
      uint32_t kind;
      uint32_t type;
  } rtReduceAsyncTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief RDMA send task payload (member rdmaSendTask of the rtTaskInfo_t union)
   *
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagrtRdmaSendTaskInfo {
      uint32_t index;
      uint32_t wqe_index;
      uint32_t reserved[8];
  } rtRdmaSendTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief RDMA doorbell send task payload (member rdmaDbSendTask of the rtTaskInfo_t union)
   */
  typedef struct tagrtRdmaDbSendTaskInfo {
      uint64_t dbInfo;
      uint32_t dbIndex;
      uint32_t reserved[7]; /* 7 words: pads the struct to 40 bytes */
  } rtRdmaDbSendTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief model end-graph task payload (member modelEndGraphTask of the rtTaskInfo_t union)
   *
   * NOTE(review): executorFlag presumably takes EXECUTOR_* values - confirm.
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagrtModelEndGraphTaskInfo {
      uint32_t modelId;
      uint32_t executorFlag;
      uint32_t reserved[8];
  } rtModelEndGraphTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief model exit task payload (member modelExitTask of the rtTaskInfo_t union)
   *
   * reserved pads the struct to 40 bytes.
   */
  typedef struct tagrtModelExitInfo {
      uint32_t modelId;
      uint32_t streamId;
      uint32_t reserved[8];
  } rtModelExitTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief label switch-by-index task payload (member streamLabelSwitchIndexTask of the rtTaskInfo_t union)
   *
   * The fields add up to 40 bytes with no implicit padding.
   */
  typedef struct tagrtStreamLabelSwitchByIndexTask_t {
      uint64_t indexPtr;
      uint64_t labelInfoPtr;
      uint32_t max;
      uint8_t reserved[20];
  } rtStreamLabelSwitchByIndexTask_t;
  /**
   * @ingroup rt_model
   * @brief stream label goto task payload (member streamLabelGotoTask of the rtTaskInfo_t union)
   *
   * The fields add up to 40 bytes with no implicit padding.
   */
  typedef struct tagrtStreamLabelGotoTask_t {
      uint16_t labelId;
      uint16_t modelId;
      uint8_t reserved[36];
  } rtStreamLabelGotoTask_t;
  230. typedef struct tagTaskInfo {
  231. uint32_t type;
  232. uint32_t streamID;
  233. union {
  234. rtKernelTaskInfoEx_t kernelTaskEx;
  235. rtKernelTaskInfo_t kernelTask;
  236. rtAllKernelTaskInfo_t allKernelTask;
  237. rtEventTaskInfo_t eventTask;
  238. rtStreamSwitchTaskInfo_t streamSwitchTask;
  239. rtStreamActiveTaskInfo_t streamActiveTask;
  240. rtLabelSetTaskInfo_t labelSetTask;
  241. rtLabelSwitchTaskInfo_t labelSwitchTask;
  242. rtLabelGotoTaskInfo_t labelGotoTask;
  243. rtProfilerTrace_t profilertraceTask;
  244. rtProfilerTraceEx_t profilertraceExTask;
  245. rtMemcpyAsyncTaskInfo_t memcpyAsyncTask;
  246. rtNotifyTaskInfo_t notifyTask;
  247. rtReduceAsyncTaskInfo_t reduceAsyncTask;
  248. rtRdmaSendTaskInfo_t rdmaSendTask;
  249. rtRdmaDbSendTaskInfo_t rdmaDbSendTask;
  250. rtModelEndGraphTaskInfo_t modelEndGraphTask;
  251. rtModelExitTaskInfo_t modelExitTask;
  252. rtStreamSwitchNTaskInfo_t streamSwitchNTask;
  253. rtStreamLabelSwitchByIndexTask_t streamLabelSwitchIndexTask;
  254. rtStreamLabelGotoTask_t streamLabelGotoTask;
  255. uint32_t reserved[10];
  256. } u;
  257. } rtTaskInfo_t;
  /**
   * @ingroup rt_model
   * @brief node information (member nodeInfo of the rtLabelDevInfo union)
   */
  typedef struct tagNodeInfo_t {
      uint32_t nodeIdx;
      uint32_t reserved[1];
  } rtNodeInfo;
  /**
   * @ingroup rt_model
   * @brief HWTS information (member hwtsInfo of the rtLabelDevInfo union)
   *
   * Five 16-bit words, 10 bytes in total.
   */
  typedef struct tagHwtsInfo_t {
      uint16_t taskId;
      uint16_t sqExeHead;
      uint16_t streamExeHead;
      uint16_t reserved[2];
  } rtHwtsInfo;
  268. typedef struct tagLabelDevInfo_t {
  269. uint16_t modelId;
  270. uint16_t streamId;
  271. uint16_t labelId;
  272. union {
  273. rtNodeInfo nodeInfo;
  274. rtHwtsInfo hwtsInfo;
  275. uint16_t reserved[5];
  276. }u;
  277. }rtLabelDevInfo;
  278. typedef rtError_t (*rtTaskGenCallback)(rtModel_t mdl, rtTaskInfo_t *taskInfo);
  279. /**
  280. * @ingroup rt_model
  281. * @brief set callback for generate model
  282. * @param [in] callBack callback function
  283. * @return RT_ERROR_NONE for ok
  284. * @return RT_ERROR_INVALID_VALUE for error input
  285. */
  286. RTS_API rtError_t rtSetTaskGenCallback(rtTaskGenCallback callback);
  287. /**
  288. * @ingroup rt_model
  289. * @brief create model instance
  290. * @param [out] mdl created model
  291. * @param [in] flag reserved
  292. * @return RT_ERROR_NONE for ok
  293. * @return RT_ERROR_INVALID_VALUE for error input
  294. */
  295. RTS_API rtError_t rtModelCreate(rtModel_t *mdl, uint32_t flag);
  296. /**
  297. * @ingroup rt_model
  298. * @brief set ge model id to aicpu
  299. * @param [in] model aicpu model
  300. * @param [in] extid ge model id
  301. * @return RT_ERROR_NONE for ok
  302. * @return RT_ERROR_INVALID_VALUE for error input
  303. */
  304. rtError_t rtModelSetExtId(rtModel_t mdl, uint32_t extId);
  305. /**
  306. * @ingroup rt_model
  307. * @brief destroy model instance
  308. * @param [in] mdl model to destroy
  309. * @return RT_ERROR_NONE for ok
  310. * @return RT_ERROR_INVALID_VALUE for error input
  311. */
  312. RTS_API rtError_t rtModelDestroy(rtModel_t mdl);
  313. /**
  314. * @ingroup rt_model
  315. * @brief bind model and stream instance
  316. * @param [in] mdl binded model
  317. * @param [in] stm binded stream
  318. * @param [in] flag reserved
  319. * @return RT_ERROR_NONE for ok
  320. * @return RT_ERROR_INVALID_VALUE for error input
  321. */
  322. RTS_API rtError_t rtModelBindStream(rtModel_t mdl, rtStream_t stm, uint32_t flag);
  323. /**
  324. * @ingroup rt_model
  325. * @brief unbind model and stream instance
  326. * @param [in] mdl unbinded model
  327. * @param [in] stm unbinded stream
  328. * @return RT_ERROR_NONE for ok
  329. * @return RT_ERROR_INVALID_VALUE for error input
  330. */
  331. RTS_API rtError_t rtModelUnbindStream(rtModel_t mdl, rtStream_t stm);
  332. /**
  333. * @ingroup rt_model
  334. * @brief tell runtime Model has been Loaded
  335. * @param [in] mdl model to execute
  336. * @return RT_ERROR_NONE for ok
  337. */
  338. RTS_API rtError_t rtModelLoadComplete(rtModel_t mdl);
  339. /**
  340. * @ingroup rt_model
  341. * @brief execute model instance
  342. * @param [in] mdl model to execute
  343. * @return RT_ERROR_NONE for ok
  344. * @return RT_ERROR_INVALID_VALUE for error input
  345. */
  346. RTS_API rtError_t rtModelExecute(rtModel_t mdl, rtStream_t stm, uint32_t flag);
  347. /**
  348. * @ingroup rt_model
  349. * @brief get model the last persist task id
  350. * @param [in] mdl model to execute
  351. * @param [out] taskId last task id of the model
  352. * @param [out] streamId last steam id of the model
  353. * @return RT_ERROR_NONE for ok
  354. * @return RT_ERROR_INVALID_VALUE for error input
  355. */
  356. RTS_API rtError_t rtModelGetTaskId(rtModel_t mdl, uint32_t *taskId, uint32_t *streamId);
  357. /**
  358. * @ingroup rt_model
  359. * @brief add a end graph task to stream
  360. * @param [in] mdl model to execute
  361. * @param [in] end graph stream
  362. * @return RT_ERROR_NONE for ok
  363. * @return RT_ERROR_INVALID_VALUE for error input
  364. */
  365. RTS_API rtError_t rtEndGraph(rtModel_t mdl, rtStream_t stm);
  366. /**
  367. * @ingroup rt_model
  368. * @brief add a end graph task with flag to stream
  369. * @param [in] mdl model to execute
  370. * @param [in] end graph stream
  371. * @param [in] flags AICPU datadump
  372. * @return RT_ERROR_NONE for ok
  373. * @return RT_ERROR_INVALID_VALUE for error input
  374. */
  375. RTS_API rtError_t rtEndGraphEx(rtModel_t mdl, rtStream_t stm, uint32_t flags);
  376. /**
  377. * @ingroup rt_model
  378. * @brief add a end graph task to stream
  379. * @param [in] mdl model to execute
  380. * @param [in] flags EXECUTOR_TS | EXECUTOR_AICPU
  381. * @return RT_ERROR_NONE for ok
  382. * @return RT_ERROR_INVALID_VALUE for error input
  383. */
  384. RTS_API rtError_t rtModelExecutorSet(rtModel_t mdl, uint8_t flags);
  385. /**
  386. * @ingroup rt_model
  387. * @brief abort model
  388. * @param [in] mdl model to abort
  389. * @return RT_ERROR_NONE for ok
  390. * @return RT_ERROR_INVALID_VALUE for error input
  391. */
  392. RTS_API rtError_t rtModelAbort(rtModel_t mdl);
  393. /**
  394. * @ingroup rt_model
  395. * @brief end graph task to model default stream
  396. * @param [in] mdl model to execute
  397. * @param [in] end graph stream
  398. * @return RT_ERROR_NONE for ok
  399. * @return RT_ERROR_INVALID_VALUE for error input
  400. */
  401. RTS_API rtError_t rtModelExit(rtModel_t mdl, rtStream_t stm);
  402. /**
  403. * @ingroup rt_model
  404. * @brief bind queue
  405. * @param [in] mdl model to bind
  406. * @param [in] queueId queueId to bind
  407. * @param [in] flag
  408. * @return RT_ERROR_NONE for ok
  409. * @return RT_ERROR_INVALID_VALUE for error input
  410. */
  411. RTS_API rtError_t rtModelBindQueue(rtModel_t mdl, uint32_t queueId, rtModelQueueFlag_t flag);
  412. /**
  413. * @ingroup rt_model
  414. * @brief get model id
  415. * @param [in] mdl
  416. * @param [out] modelId model id
  417. * @return RT_ERROR_NONE for ok
  418. * @return RT_ERROR_INVALID_VALUE for error input
  419. */
  420. RTS_API rtError_t rtModelGetId(rtModel_t mdl, uint32_t *modelId);
  421. /*
  422. * @ingroup rt_model
  423. * @brief enable debug for dump overflow exception
  424. * @param [in] addr: ddr address of kernel exception dumpped
  425. * @param [in] mdl: model handle
  426. * @param [in] flag: debug flag
  427. * @return RT_ERROR_NONE for ok
  428. * @return RT_ERROR_INVALID_VALUE for error input
  429. */
  430. RTS_API rtError_t rtDebugRegister(rtModel_t mdl, uint32_t flag, const void *addr,
  431. uint32_t *streamId, uint32_t *taskId);
  432. /*
  433. * @ingroup rt_model
  434. * @brief disable debug for dump overflow exception
  435. * @param [in] mdl: model handle
  436. * @return RT_ERROR_NONE for ok
  437. * @return RT_ERROR_INVALID_VALUE for error input
  438. */
  439. RTS_API rtError_t rtDebugUnRegister(rtModel_t mdl);
  440. /**
  441. * @ingroup rt_model
  442. * @brief set model group id
  443. * @param [in] mdl model
  444. * @param [in] schGrpId groupId (0,4) 0:default invalid value 1-4 valid value Maximum support 4 groups
  445. * @return RT_ERROR_NONE for ok
  446. * @return RT_ERROR_INVALID_VALUE for error input
  447. */
  448. RTS_API rtError_t rtModelSetSchGroupId(rtModel_t mdl, const int16_t schGrpId);
  449. #if defined(__cplusplus)
  450. }
  451. #endif
  452. #endif // CCE_RUNTIME_RT_MODEL_H

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示