You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

stream.h 7.8 kB

5 years ago
5 years ago
3 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
3 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240
  1. /*
  2. * Copyright (c) Huawei Technologies Co., Ltd. 2020-2021. All rights reserved.
  3. * Description: stream.h
  4. * Create: 2020-01-01
  5. */
  6. #ifndef CCE_RUNTIME_STREAM_H
  7. #define CCE_RUNTIME_STREAM_H
  8. #include "base.h"
  9. #include "event.h"
  10. #if defined(__cplusplus)
  11. extern "C" {
  12. #endif
  13. /**
  14. * @ingroup stream_flags
  15. * @brief stream op bit flags; every non-default flag is a distinct bit, so flags can be OR-ed together
  16. */
  17. #define RT_STREAM_DEFAULT (0x00U)
  18. #define RT_STREAM_PERSISTENT (0x01U)
  19. #define RT_STREAM_FORCE_COPY (0x02U)
  20. #define RT_STREAM_HUGE (0x04U)
  21. #define RT_STREAM_AICPU (0x08U)
  22. #define RT_STREAM_FORBIDDEN_DEFAULT (0x10U)
  23. #define RT_STREAM_HEAD (0x20U)
  24. #define RT_STREAM_PRIMARY_DEFAULT (0x40U)
  25. #define RT_STREAM_PRIMARY_FIRST_DEFAULT (0x80U)
  26. #define RT_STREAM_OVERFLOW (0x100U)
  27. /**
  28. * @ingroup stream_type
  29. * @brief stream type values (NOTE(review): presumably the streamType argument of rtGetMaxStreamAndTask - confirm)
  30. */
  31. #define RT_NORMAL_STREAM (0x00U)
  32. #define RT_HUGE_STREAM (0x01U)
  33. /**
  34. * default priority level to use when creating a stream
  35. */
  36. #define RT_STREAM_PRIORITY_DEFAULT (0U)
  37. /**
  38. * @ingroup dvrt_stream
  39. * @brief create a stream instance with the given priority
  40. * @param [in|out] stm pointer to the created stream handle
  41. * @param [in] priority stream priority (see RT_STREAM_PRIORITY_DEFAULT for the default level)
  42. * @return RT_ERROR_NONE for ok
  43. * @return RT_ERROR_INVALID_VALUE for error input
  44. */
  45. RTS_API rtError_t rtStreamCreate(rtStream_t *stm, int32_t priority);
  46. /**
  47. * @ingroup dvrt_stream
  48. * @brief create a stream instance with the given priority and op flags
  49. * @param [in|out] stm pointer to the created stream handle
  50. * @param [in] priority stream priority (see RT_STREAM_PRIORITY_DEFAULT for the default level)
  51. * @param [in] flags stream op flags (NOTE(review): presumably a combination of the RT_STREAM_* bit flags - confirm)
  52. * @return RT_ERROR_NONE for ok
  53. * @return RT_ERROR_INVALID_VALUE for error input
  54. */
  55. RTS_API rtError_t rtStreamCreateWithFlags(rtStream_t *stm, int32_t priority, uint32_t flags);
  56. /**
  57. * @ingroup dvrt_stream
  58. * @brief destroy a stream instance
  59. * @param [in] stm handle of the stream to destroy
  60. * @return RT_ERROR_NONE for ok
  61. * @return RT_ERROR_INVALID_VALUE for error input
  62. */
  63. RTS_API rtError_t rtStreamDestroy(rtStream_t stm);
  64. /**
  65. * @ingroup dvrt_stream
  66. * @brief make a stream wait for a recorded event
  67. * @param [in] stm the waiting stream
  68. * @param [in] evt the event to wait for
  69. * @return RT_ERROR_NONE for ok
  70. * @return RT_ERROR_INVALID_VALUE for error input
  71. */
  72. RTS_API rtError_t rtStreamWaitEvent(rtStream_t stm, rtEvent_t evt);
  73. /**
  74. * @ingroup dvrt_stream
  75. * @brief make a stream wait for a recorded event, used for 1951 pg1
  76. * @param [in] stm the waiting stream
  77. * @param [in] evt the event to wait for
  78. * @param [in] timeout timeout value for 1951 pg1 (NOTE(review): units are not stated in this header - confirm)
  79. * @return RT_ERROR_NONE for ok
  80. * @return RT_ERROR_INVALID_VALUE for error input
  81. */
  82. RTS_API rtError_t rtStreamWaitEventWithTimeout(rtStream_t stm, rtEvent_t evt, uint32_t timeout);
  83. /**
  84. * @ingroup dvrt_stream
  85. * @brief wait for a stream to complete
  86. * @param [in] stm handle of the stream to wait for
  87. * @return RT_ERROR_NONE for ok
  88. * @return RT_ERROR_INVALID_VALUE for error input
  89. */
  90. RTS_API rtError_t rtStreamSynchronize(rtStream_t stm);
  91. /**
  92. * @ingroup dvrt_stream
  93. * @brief query an asynchronous stream for its completion status
  94. * @param [in] stm handle of the stream to query
  95. * @return RT_ERROR_NONE if the stream is complete
  96. * @return RT_ERROR_STREAM_NOT_COMPLETE if the stream is not complete
  97. */
  98. RTS_API rtError_t rtStreamQuery(rtStream_t stm);
  99. /**
  100. * @ingroup dvrt_stream
  101. * @brief get stream id from a stream handle
  102. * @param [in] stm stream handle
  103. * @param [out] streamId pointer that receives the stream id
  104. * @return RT_ERROR_NONE for ok
  105. * @return RT_ERROR_INVALID_VALUE for error input
  106. */
  107. RTS_API rtError_t rtGetStreamId(rtStream_t stm, int32_t *streamId);
  108. /**
  109. * @ingroup dvrt_stream
  110. * @brief inquire max stream count and max task count per stream
  111. * @param [in] streamType stream type
  112. * @param [out] maxStrCount pointer that receives the max stream count
  113. * @param [out] maxTaskCount pointer that receives the max task count per stream
  114. * @return RT_ERROR_NONE for ok
  115. * @return RT_ERROR_INVALID_VALUE for error input
  116. */
  117. RTS_API rtError_t rtGetMaxStreamAndTask(uint32_t streamType, uint32_t *maxStrCount, uint32_t *maxTaskCount);
  118. /**
  119. * @ingroup dvrt_stream
  120. * @brief assign an identification name to a stream
  121. * @param [in] stm handle of the stream to be named
  122. * @param [in] name identification name
  123. * @return RT_ERROR_NONE for ok
  124. * @return RT_ERROR_INVALID_VALUE for error input
  125. */
  126. RTS_API rtError_t rtNameStream(rtStream_t stm, const char_t *name);
  127. /**
  128. * @ingroup dvrt_stream
  129. * @brief switch to the corresponding stream according to the contents of ptr
  130. * @param [in] ptr address of the value that decides between the true and false branches
  131. * @param [in] condition switch condition
  132. * @param [in] val switch value
  133. * @param [in] trueStream stream that needs to be activated when the value is non-zero
  134. * @param [in] stm input stream to init task
  135. * @return RT_ERROR_NONE for ok
  136. * @return RT_ERROR_INVALID_VALUE for error input
  137. */
  138. RTS_API rtError_t rtStreamSwitch(void *ptr, rtCondition_t condition, int64_t val, rtStream_t trueStream,
  139. rtStream_t stm);
  140. /**
  141. * @brief execute extensible stream switch task
  142. * @param [in] ptr pointer of value
  143. * @param [in] condition judge condition
  144. * @param [in] valuePtr pointer of target value
  145. * @param [in] trueStream stream to be activated when value is not zero
  146. * @param [in] stm input stream handle (NOTE(review): originally described as "stream id", but the type is rtStream_t - confirm)
  147. * @param [in] dataType data type of target value
  148. * @return RT_ERROR_NONE for ok
  149. */
  150. RTS_API rtError_t rtStreamSwitchEx(void *ptr, rtCondition_t condition, void *valuePtr, rtStream_t trueStream,
  151. rtStream_t stm, rtSwitchDataType_t dataType);
  152. /**
  153. * @ingroup dvrt_stream
  154. * @brief activate a stream
  155. * @param [in] activeStream stream to be activated
  156. * @param [in] stm input stream to init task
  157. * @return RT_ERROR_NONE for ok
  158. * @return RT_ERROR_INVALID_VALUE for error input
  159. */
  160. RTS_API rtError_t rtStreamActive(rtStream_t activeStream, rtStream_t stm);
  161. /**
  162. * @brief execute extensible stream case switch task
  163. * @param [in] ptr pointer of value
  164. * @param [in] size pointer num of value (NOTE(review): presumably the number of values - confirm)
  165. * @param [in] valuePtr pointer of target value, length = size * elementSize
  166. * @param [in] trueStreamPtr streams to be activated
  167. * @param [in] elementSize size of the to-be-activated true streams (NOTE(review): unclear whether a count or a byte size - confirm)
  168. * @param [in] stm input stream to init task
  169. * @param [in] dataType data type of target value
  170. * @return RT_ERROR_NONE for ok
  171. */
  172. RTS_API rtError_t rtStreamSwitchN(void *ptr, uint32_t size, void *valuePtr, rtStream_t *trueStreamPtr,
  173. uint32_t elementSize, rtStream_t stm, rtSwitchDataType_t dataType);
  174. /**
  175. * @ingroup dvrt_stream
  176. * @brief enable debug for dump overflow exception with stream
  177. * @param [in] stm: stream handle
  178. * @param [in] flag: debug flag
  179. * @param [in] addr: ddr address of kernel exception dumped (NOTE(review): streamId and taskId are undocumented, presumably outputs - confirm)
  180. * @return RT_ERROR_NONE for ok
  181. * @return RT_ERROR_INVALID_VALUE for error input
  182. */
  183. RTS_API rtError_t rtDebugRegisterForStream(rtStream_t stm, uint32_t flag, const void *addr,
  184. uint32_t *streamId, uint32_t *taskId);
  185. /**
  186. * @ingroup rt_model
  187. * @brief disable debug for dump overflow exception with stream
  188. * @param [in] stm: stream handle
  189. * @return RT_ERROR_NONE for ok
  190. * @return RT_ERROR_INVALID_VALUE for error input
  191. */
  192. RTS_API rtError_t rtDebugUnRegisterForStream(rtStream_t stm);
  193. /**
  194. * @ingroup dvrt_stream
  195. * @brief enable or disable stream overflow
  196. * @param [in] stm: stream handle
  197. * @param [in] flags: 0:disable others:enable
  198. * @return RT_ERROR_NONE for ok
  199. * @return RT_ERROR_INVALID_VALUE for error input
  200. */
  201. RTS_API rtError_t rtSetStreamOverflowSwitch(rtStream_t stm, uint32_t flags);
  202. /**
  203. * @ingroup dvrt_stream
  204. * @brief get whether overflow of the stream is enabled or disabled
  205. * @param [in] stm: stream handle
  206. * @param [out] flags: 0:disable others:enable
  207. * @return RT_ERROR_NONE for ok
  208. * @return RT_ERROR_INVALID_VALUE for error input
  209. */
  210. RTS_API rtError_t rtGetStreamOverflowSwitch(rtStream_t stm, uint32_t *flags);
  211. #if defined(__cplusplus)
  212. }
  213. #endif
  214. #endif // CCE_RUNTIME_STREAM_H

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示