You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

run_context.cc 7.7 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "graph/build/run_context.h"
  17. #include "common/util.h"
  18. #include "framework/common/debug/ge_log.h"
  19. #include "graph/debug/ge_attr_define.h"
  20. namespace ge {
  21. RunContextUtil::~RunContextUtil() { DestroyRtModelResources(); }
  22. Status RunContextUtil::InitMemInfo(uint8_t *data_mem_base, uint64_t data_mem_size,
  23. std::map<int64_t, uint8_t *> mem_type_to_data_mem_base,
  24. std::map<int64_t, uint64_t> mem_type_to_data_mem_size, uint8_t *weight_mem_base,
  25. uint64_t weight_mem_size) {
  26. if ((data_mem_size > 0) && (data_mem_base == nullptr)) {
  27. GELOGE(PARAM_INVALID, "InitMemInfo param data_mem_base is null but data_mem_size = %lu.", data_mem_size);
  28. return PARAM_INVALID;
  29. }
  30. if ((weight_mem_size > 0) && (weight_mem_base == nullptr)) {
  31. GELOGE(PARAM_INVALID, "InitMemInfo param weight_mem_base is null but weight_mem_size = %lu.", weight_mem_size);
  32. return PARAM_INVALID;
  33. }
  34. if (mem_type_to_data_mem_base.empty() || mem_type_to_data_mem_size.empty() ||
  35. mem_type_to_data_mem_base.size() != mem_type_to_data_mem_size.size()) {
  36. GELOGE(PARAM_INVALID,
  37. "InitMemInfo param mem_type_to_data_mem_base size[%zu] is not equal to the size of "
  38. "mem_type_to_data_mem_size[%zu].",
  39. mem_type_to_data_mem_base.size(), mem_type_to_data_mem_size.size());
  40. return PARAM_INVALID;
  41. }
  42. data_mem_base_ = data_mem_base;
  43. data_mem_size_ = data_mem_size;
  44. weight_mem_base_ = weight_mem_base;
  45. weight_mem_size_ = weight_mem_size;
  46. mem_type_to_data_mem_base_ = mem_type_to_data_mem_base;
  47. mem_type_to_data_mem_size_ = mem_type_to_data_mem_size;
  48. return SUCCESS;
  49. }
  50. Status RunContextUtil::CreateRtModelResources(uint32_t stream_num, uint32_t event_num, uint32_t label_num) {
  51. // Create rt model
  52. rtError_t rt_ret = rtModelCreate(&rt_model_, 0);
  53. if (rt_ret != RT_ERROR_NONE) {
  54. GELOGE(RT_FAILED, "rtModelCreate failed. rt_ret = %d", static_cast<int>(rt_ret));
  55. return RT_FAILED;
  56. }
  57. // Create rt Stream and bind with model
  58. for (uint32_t i = 0; i < stream_num; ++i) {
  59. rtStream_t stream = nullptr;
  60. rt_ret = rtStreamCreate(&stream, 0);
  61. if (rt_ret != RT_ERROR_NONE) {
  62. GELOGE(RT_FAILED, "rtStreamCreate failed. rt_ret = %d, index = %u", static_cast<int>(rt_ret), i);
  63. return RT_FAILED;
  64. }
  65. stream_list_.emplace_back(stream);
  66. rt_ret = rtModelBindStream(rt_model_, stream, 0);
  67. if (rt_ret != RT_ERROR_NONE) {
  68. GELOGE(RT_FAILED, "Bind stream and model failed. rt_ret = %d, index = %u", static_cast<int>(rt_ret), i);
  69. return RT_FAILED;
  70. }
  71. }
  72. // Create rt event
  73. for (uint32_t i = 0; i < event_num; ++i) {
  74. rtEvent_t event = nullptr;
  75. rt_ret = rtEventCreate(&event);
  76. if (rt_ret != RT_ERROR_NONE) {
  77. GELOGE(RT_FAILED, "rtEventCreate failed. rt_ret = %d, index = %u", static_cast<int>(rt_ret), i);
  78. return RT_FAILED;
  79. }
  80. event_list_.emplace_back(event);
  81. }
  82. // Create rt label
  83. for (uint32_t i = 0; i < label_num; ++i) {
  84. rtLabel_t label = nullptr;
  85. rt_ret = rtLabelCreate(&label);
  86. if (rt_ret != RT_ERROR_NONE) {
  87. GELOGE(RT_FAILED, "rtLabelCreate failed. rt_ret = %d, index = %u", static_cast<int>(rt_ret), i);
  88. return RT_FAILED;
  89. }
  90. label_list_.emplace_back(label);
  91. }
  92. return SUCCESS;
  93. }
  94. void RunContextUtil::DestroyRtModelResources() noexcept {
  95. rtError_t rt_ret;
  96. for (size_t i = 0; i < stream_list_.size(); i++) {
  97. // Unbind stream to model first
  98. (void)rtModelUnbindStream(rt_model_, stream_list_[i]);
  99. rt_ret = rtStreamDestroy(stream_list_[i]);
  100. if (rt_ret != RT_ERROR_NONE) {
  101. GELOGW("Destroy stream failed. rt_ret = %d, index = %zu.", static_cast<int>(rt_ret), i);
  102. }
  103. }
  104. stream_list_.clear();
  105. for (size_t i = 0; i < event_list_.size(); i++) {
  106. rt_ret = rtEventDestroy(event_list_[i]);
  107. if (rt_ret != RT_ERROR_NONE) {
  108. GELOGW("Destroy event failed. rt_ret = %d, index = %zu.", static_cast<int>(rt_ret), i);
  109. }
  110. }
  111. event_list_.clear();
  112. for (size_t i = 0; i < label_list_.size(); ++i) {
  113. rt_ret = rtLabelDestroy(label_list_[i]);
  114. if (rt_ret != RT_ERROR_NONE) {
  115. GELOGW("Destroy label failed. rt_ret = %d, index = %zu.", static_cast<int>(rt_ret), i);
  116. }
  117. }
  118. label_list_.clear();
  119. if (rt_model_ != nullptr) {
  120. rt_ret = rtModelDestroy(rt_model_);
  121. if (rt_ret != RT_ERROR_NONE) {
  122. GELOGW("Destroy rt model failed. rt_ret = %d.", static_cast<int>(rt_ret));
  123. }
  124. rt_model_ = nullptr;
  125. }
  126. }
  127. Status RunContextUtil::CreateRunContext(Model &model, const ComputeGraphPtr &graph, Buffer &buffer,
  128. const uint64_t session_id) {
  129. GELOGD("Begin to Create RunContext, session_id = %lu", session_id);
  130. // check params
  131. if (graph == nullptr) {
  132. GELOGE(PARAM_INVALID, "CreateRunContext param graph is null. session_id=%lu", session_id);
  133. return PARAM_INVALID;
  134. }
  135. uint32_t stream_num = 0;
  136. if (!AttrUtils::GetInt(&model, ATTR_MODEL_STREAM_NUM, stream_num)) {
  137. GELOGE(INTERNAL_ERROR, "Get stream_num attr from model_def failed. session_id=%lu", session_id);
  138. return INTERNAL_ERROR;
  139. }
  140. GELOGD("Stream_num = %u", stream_num);
  141. uint32_t event_num = 0;
  142. if (!AttrUtils::GetInt(&model, ATTR_MODEL_EVENT_NUM, event_num)) {
  143. GELOGE(INTERNAL_ERROR, "Get event_num attr from model failed. session_id=%lu", session_id);
  144. return INTERNAL_ERROR;
  145. }
  146. GELOGD("Event_num = %u", event_num);
  147. uint32_t label_num = 0;
  148. if (!AttrUtils::GetInt(&model, ATTR_MODEL_LABEL_NUM, label_num)) {
  149. GELOGE(INTERNAL_ERROR, "Get label_num attr from model failed. session_id=%lu", session_id);
  150. return INTERNAL_ERROR;
  151. }
  152. GELOGD("Label_num = %u", label_num);
  153. Status ret = CreateRtModelResources(stream_num, event_num, label_num);
  154. if (ret != SUCCESS) {
  155. GELOGE(ret, "CreateRtModelResources failed. session_id=%lu", session_id);
  156. DestroyRtModelResources();
  157. return ret;
  158. }
  159. GELOGI("CreateRunContext: data_mem_base_ = %p, weight_mem_base_ = %p, memory_size = %lu, weight_size = %lu",
  160. data_mem_base_, weight_mem_base_, data_mem_size_, weight_mem_size_);
  161. PrintMemInfo();
  162. run_context_ = {rt_model_,
  163. nullptr,
  164. session_id,
  165. data_mem_size_,
  166. data_mem_base_,
  167. mem_type_to_data_mem_size_,
  168. mem_type_to_data_mem_base_,
  169. weight_mem_size_,
  170. weight_mem_base_,
  171. buffer,
  172. stream_list_,
  173. event_list_,
  174. label_list_};
  175. return SUCCESS;
  176. }
  177. void RunContextUtil::PrintMemInfo() {
  178. for (auto iter : mem_type_to_data_mem_base_) {
  179. GELOGD("CreateRunContext: memory type = %ld, data memory base = %p", iter.first, iter.second);
  180. }
  181. for (auto iter : mem_type_to_data_mem_size_) {
  182. GELOGD("CreateRunContext: memory type = %ld, data memory size = %lu", iter.first, iter.second);
  183. }
  184. }
  185. RunContext &RunContextUtil::GetRunContext() { return run_context_; }
  186. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示: