You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

stream.h 7.3 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
3 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
3 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. * Licensed under the Apache License, Version 2.0 (the "License");
  4. * you may not use this file except in compliance with the License.
  5. * You may obtain a copy of the License at
  6. * http://www.apache.org/licenses/LICENSE-2.0
  7. * Unless required by applicable law or agreed to in writing, software
  8. * distributed under the License is distributed on an "AS IS" BASIS,
  9. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  10. * See the License for the specific language governing permissions and
  11. * limitations under the License.
  12. */
  13. #ifndef CCE_RUNTIME_STREAM_H
  14. #define CCE_RUNTIME_STREAM_H
  15. #include "base.h"
  16. #include "event.h"
  17. #if defined(__cplusplus)
  18. extern "C" {
  19. #endif
  20. /**
  21. * @ingroup stream_flags
  22. * @brief stream op bit flags; RT_STREAM_DEFAULT is zero and every other flag occupies its own bit
  23. */
  24. #define RT_STREAM_DEFAULT (0x00U)
  25. #define RT_STREAM_PERSISTENT (0x01U)
  26. #define RT_STREAM_FORCE_COPY (0x02U)
  27. #define RT_STREAM_HUGE (0x04U)
  28. #define RT_STREAM_AICPU (0x08U)
  29. #define RT_STREAM_FORBIDDEN_DEFAULT (0x10U)
  30. #define RT_STREAM_HEAD (0x20U)
  31. #define RT_STREAM_PRIMARY_DEFAULT (0x40U)
  32. #define RT_STREAM_PRIMARY_FIRST_DEFAULT (0x80U)
  33. /**
  34. * @ingroup stream_type
  35. * @brief stream type values (presumably what the streamType parameter of rtGetMaxStreamAndTask expects - TODO confirm)
  36. */
  37. #define RT_NORMAL_STREAM (0x00U)
  38. #define RT_HUGE_STREAM (0x01U)
  39. /**
  40. * default priority level to use when creating a stream
  41. */
  42. #define RT_STREAM_PRIORITY_DEFAULT (0U)
  43. /**
  44. * @ingroup dvrt_stream
  45. * @brief create a stream instance with the given priority
  46. * @param [in|out] stream pointer through which the created stream is returned
  47. * @param [in] priority stream priority (RT_STREAM_PRIORITY_DEFAULT is the default level)
  48. * @return RT_ERROR_NONE for ok
  49. * @return RT_ERROR_INVALID_VALUE for error input
  50. */
  51. RTS_API rtError_t rtStreamCreate(rtStream_t *stream, int32_t priority);
  52. /**
  53. * @ingroup dvrt_stream
  54. * @brief create a stream instance with the given priority and stream op flags
  55. * @param [in|out] stream pointer through which the created stream is returned
  56. * @param [in] priority stream priority (RT_STREAM_PRIORITY_DEFAULT is the default level)
  57. * @param [in] flags stream op flags (presumably a combination of the RT_STREAM_* bit flags - TODO confirm)
  58. * @return RT_ERROR_NONE for ok
  59. * @return RT_ERROR_INVALID_VALUE for error input
  60. */
  61. RTS_API rtError_t rtStreamCreateWithFlags(rtStream_t *stream, int32_t priority, uint32_t flags);
  62. /**
  63. * @ingroup dvrt_stream
  64. * @brief destroy a stream instance
  65. * @param [in] stream the stream to destroy
  66. * @return RT_ERROR_NONE for ok
  67. * @return RT_ERROR_INVALID_VALUE for error input
  68. */
  69. RTS_API rtError_t rtStreamDestroy(rtStream_t stream);
  70. /**
  71. * @ingroup dvrt_stream
  72. * @brief make a stream wait for a recorded event
  73. * @param [in] stream the stream that waits
  74. * @param [in] event the event to wait for
  75. * @return RT_ERROR_NONE for ok
  76. * @return RT_ERROR_INVALID_VALUE for error input
  77. */
  78. RTS_API rtError_t rtStreamWaitEvent(rtStream_t stream, rtEvent_t event);
  79. /**
  80. * @ingroup dvrt_stream
  81. * @brief wait for a stream to complete
  82. * @param [in] stream the stream to wait for
  83. * @return RT_ERROR_NONE for ok
  84. * @return RT_ERROR_INVALID_VALUE for error input
  85. */
  86. RTS_API rtError_t rtStreamSynchronize(rtStream_t stream);
  87. /**
  88. * @ingroup dvrt_stream
  89. * @brief query an asynchronous stream for its completion status
  90. * @param [in] stream the stream to query
  91. * @return RT_ERROR_NONE if the stream is complete
  92. * @return RT_ERROR_STREAM_NOT_COMPLETE if the stream is not complete
  93. */
  94. RTS_API rtError_t rtStreamQuery(rtStream_t stream);
  95. /**
  96. * @ingroup dvrt_stream
  97. * @brief get stream id from a stream handle
  98. * @param [in] stream stream handle
  99. * @param [out] streamId pointer that receives the stream id
  100. * @return RT_ERROR_NONE for complete
  101. * @return RT_ERROR_INVALID_VALUE for error input
  102. */
  103. RTS_API rtError_t rtGetStreamId(rtStream_t stream, int32_t *streamId);
  104. /**
  105. * @ingroup dvrt_stream
  106. * @brief inquire max stream count and max task count per stream
  107. * @param [in] streamType stream type
  108. * @param [out] maxStrCount pointer that receives the max stream count
  109. * @param [out] maxTaskCount pointer that receives the max task count per stream
  110. * @return RT_ERROR_NONE for complete
  111. * @return RT_ERROR_INVALID_VALUE for error input
  112. */
  113. RTS_API rtError_t rtGetMaxStreamAndTask(uint32_t streamType, uint32_t *maxStrCount, uint32_t *maxTaskCount);
  114. /**
  115. * @ingroup dvrt_stream
  116. * @brief give a stream an identification name
  117. * @param [in] stream the stream to be named
  118. * @param [in] name identification name
  119. * @return RT_ERROR_NONE for complete
  120. * @return RT_ERROR_INVALID_VALUE for error input
  121. */
  122. RTS_API rtError_t rtNameStream(rtStream_t stream, const char *name);
  123. /**
  124. * @ingroup dvrt_stream
  125. * @brief switch to the corresponding stream according to the contents of ptr
  126. * @param [in] ptr address of the value that decides between the true and false branches
  127. * @param [in] condition switch condition
  128. * @param [in] value switch value
  129. * @param [in] trueStream stream that needs to be activated when the value is non-zero
  130. * @param [in] stream input stream to init task
  131. * @return RT_ERROR_NONE for complete
  132. * @return RT_ERROR_INVALID_VALUE for error input
  133. */
  134. RTS_API rtError_t rtStreamSwitch(void *ptr, rtCondition_t condition, int64_t value, rtStream_t trueStream,
  135. rtStream_t stream);
  136. /**
  137. * @brief execute extensible stream switch task
  138. * @param [in] ptr pointer of value
  139. * @param [in] condition judge condition
  140. * @param [in] valuePtr pointer of target value
  141. * @param [in] trueStream stream to be activated when value is not zero
  142. * @param [in] stream stream handle (presumably the input stream to init task, as in rtStreamSwitch - TODO confirm)
  143. * @param [in] dataType data type of target value
  144. * @return RT_ERROR_NONE for complete
  145. */
  146. RTS_API rtError_t rtStreamSwitchEx(void *ptr, rtCondition_t condition, void *valuePtr, rtStream_t trueStream,
  147. rtStream_t stream, rtSwitchDataType_t dataType);
  148. /**
  149. * @ingroup dvrt_stream
  150. * @brief activate a stream
  151. * @param [in] activeStream stream to be activated
  152. * @param [in] stream input stream to init task
  153. * @return RT_ERROR_NONE for complete
  154. * @return RT_ERROR_INVALID_VALUE for error input
  155. */
  156. RTS_API rtError_t rtStreamActive(rtStream_t activeStream, rtStream_t stream);
  157. /**
  158. * @brief execute extensible stream case switch task
  159. * @param [in] ptr pointer of value
  160. * @param [in] size pointer num of value
  161. * @param [in] valuePtr pointer of target value, length = size * elementSize
  162. * @param [in] trueStreamPtr pointer to the streams to be activated
  163. * @param [in] elementSize size of the true streams to be activated
  164. * @param [in] stream input stream to init task
  165. * @param [in] dataType data type of target value
  166. * @return RT_ERROR_NONE for complete
  167. */
  168. RTS_API rtError_t rtStreamSwitchN(void *ptr, uint32_t size, void *valuePtr, rtStream_t *trueStreamPtr,
  169. uint32_t elementSize, rtStream_t stream, rtSwitchDataType_t dataType);
  170. /**
  171. * @ingroup dvrt_stream
  172. * @brief enable debug for dump overflow exception with stream
  173. * @param [in] stream: stream handle
  174. * @param [in] flag: debug flag
  175. * @param [in] addr: DDR address where the kernel exception is dumped
  * @param streamId: not described in the original comment; presumably an output that receives a stream id - TODO confirm
  * @param taskId: not described in the original comment; presumably an output that receives a task id - TODO confirm
  176. * @return RT_ERROR_NONE for ok
  177. * @return RT_ERROR_INVALID_VALUE for error input
  178. */
  179. RTS_API rtError_t rtDebugRegisterForStream(rtStream_t stream, uint32_t flag, const void *addr,
  180. uint32_t *streamId, uint32_t *taskId);
  181. /**
  182. * @ingroup dvrt_stream
  183. * @brief disable debug for dump overflow exception with stream
  184. * @param [in] stream: stream handle
  185. * @return RT_ERROR_NONE for ok
  186. * @return RT_ERROR_INVALID_VALUE for error input
  187. */
  188. RTS_API rtError_t rtDebugUnRegisterForStream(rtStream_t stream);
  189. #if defined(__cplusplus)
  190. }
  191. #endif
  192. #endif // CCE_RUNTIME_STREAM_H

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。