You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; they can include dashes ('-') and can be up to 35 characters long.

aicpu_ext_info.cc 11 kB

4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "hybrid/node_executor/aicpu/aicpu_ext_info.h"
  17. #include "framework/common/util.h"
  18. #include "framework/common/fmk_error_codes.h"
  19. #include "framework/common/debug/log.h"
  20. namespace ge {
  21. namespace hybrid {
  namespace {
  // Sentinel stored right after the last valid dim when a shape has fewer than
  // kMaxShapeDims (8) dims, so that readers know where the dim list ends.
  constexpr int64_t kDimEndFlag = INT64_MIN;
  }  // namespace
  26. Status AicpuExtInfoHandler::Parse(const std::string &ext_info) {
  27. GELOGI("Node[%s] parse ext info start.", node_name_.c_str());
  28. if (ext_info.empty()) {
  29. GELOGE(PARAM_INVALID, "Node[%s] parse ext info failed as ext info is empty.", node_name_.c_str());
  30. return PARAM_INVALID;
  31. }
  32. ext_info_len_ = ext_info.size();
  33. ext_info_.reset(new(std::nothrow)uint8_t[ext_info_len_]);
  34. GE_CHECK_NOTNULL(ext_info_);
  35. if (memcpy_s(ext_info_.get(), ext_info_len_, ext_info.c_str(), ext_info.size()) != EOK) {
  36. GELOGE(FAILED, "[%s] Failed to coy ext info", node_name_.c_str());
  37. return FAILED;
  38. }
  39. input_shape_and_type_.clear();
  40. output_shape_and_type_.clear();
  41. auto ext_info_data = ext_info_.get();
  42. size_t offset = 0;
  43. while (offset + sizeof(AicpuExtInfo) <= ext_info_len_) {
  44. auto aicpu_ext_info = reinterpret_cast<AicpuExtInfo *>(ext_info_data + offset);
  45. GELOGD("Ext infoType=%d, infoLen=%u.", aicpu_ext_info->infoType, aicpu_ext_info->infoLen);
  46. switch (aicpu_ext_info->infoType) {
  47. case aicpu::FWKAdapter::FWK_ADPT_EXT_SHAPE_TYPE:
  48. GE_CHK_STATUS_RET(ParseExtShapeType(aicpu_ext_info), "Parse ext shape type failed.");
  49. break;
  50. case aicpu::FWKAdapter::FWK_ADPT_EXT_INPUT_SHAPE:
  51. GE_CHK_STATUS_RET(ParseExtInputShape(aicpu_ext_info), "Parse ext input shape failed.");
  52. break;
  53. case aicpu::FWKAdapter::FWK_ADPT_EXT_OUTPUT_SHAPE:
  54. GE_CHK_STATUS_RET(ParseExtOutputShape(aicpu_ext_info), "Parse ext output shape failed.");
  55. break;
  56. case aicpu::FWKAdapter::FWK_ADPT_EXT_SESSION_INFO:
  57. GE_CHK_STATUS_RET(ParseExtSessionInfo(aicpu_ext_info), "Parse ext session info failed.");
  58. break;
  59. default:
  60. GELOGD("Node[%s] ignore infoType=%d, infoLen=%u.",
  61. node_name_.c_str(), aicpu_ext_info->infoType, aicpu_ext_info->infoLen);
  62. break;
  63. }
  64. offset += sizeof(AicpuExtInfo);
  65. offset += aicpu_ext_info->infoLen;
  66. }
  67. GE_CHK_BOOL_RET_STATUS(offset == ext_info_len_, PARAM_INVALID,
  68. "Node[%s] ext_info format error, parse not reach end, offset=%zu, ext_info_len=%zu.",
  69. node_name_.c_str(), offset, ext_info_len_);
  70. GELOGI("Node[%s] parse ext info end.", node_name_.c_str());
  71. return SUCCESS;
  72. }
  73. Status AicpuExtInfoHandler::ParseExtShapeType(AicpuExtInfo *aicpu_ext_info) {
  74. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == sizeof(int32_t), PARAM_INVALID,
  75. "Node[%s] parse ext shape type failed as infoLen must be %zu but %u.",
  76. node_name_.c_str(), sizeof(int32_t), aicpu_ext_info->infoLen);
  77. auto type = reinterpret_cast<const int32_t *>(aicpu_ext_info->infoMsg);
  78. GE_CHK_BOOL_RET_STATUS(*type == unknown_type_, PARAM_INVALID,
  79. "Node[%s] parse ext shape type failed as need %d but %d.",
  80. node_name_.c_str(), unknown_type_, *type);
  81. GELOGI("Node[%s] parse ext shape type success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  82. return SUCCESS;
  83. }
  84. Status AicpuExtInfoHandler::ParseExtInputShape(AicpuExtInfo *aicpu_ext_info) {
  85. auto need_len = input_num_ * sizeof(AicpuShapeAndType);
  86. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID,
  87. "Node[%s] parse ext input shape failed as infoLen must be "
  88. "input_num[%u]*sizeof(ShapeAndType)[%zu] but %u.",
  89. node_name_.c_str(), input_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen);
  90. auto input = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg);
  91. for (uint32_t index = 0; index < input_num_; ++index) {
  92. input_shape_and_type_.emplace_back(&input[index]);
  93. }
  94. GELOGI("Node[%s] parse ext input shape success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  95. return SUCCESS;
  96. }
  97. Status AicpuExtInfoHandler::ParseExtOutputShape(AicpuExtInfo *aicpu_ext_info) {
  98. if (unknown_type_ == DEPEND_COMPUTE) {
  99. GELOGD("Node[%s] is depend compute type no need ext output shape, ignore it, infoLen=%u.",
  100. node_name_.c_str(), aicpu_ext_info->infoLen);
  101. return SUCCESS;
  102. }
  103. auto need_len = output_num_ * sizeof(AicpuShapeAndType);
  104. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == need_len, PARAM_INVALID,
  105. "Node[%s] parse ext output shape failed as infoLen must be "
  106. "output_num[%u]*sizeof(ShapeAndType)[%zu] but %u.",
  107. node_name_.c_str(), output_num_, sizeof(AicpuShapeAndType), aicpu_ext_info->infoLen);
  108. auto output = reinterpret_cast<AicpuShapeAndType *>(aicpu_ext_info->infoMsg);
  109. for (uint32_t index = 0; index < output_num_; ++index) {
  110. output_shape_and_type_.emplace_back(&output[index]);
  111. }
  112. GELOGI("Node[%s] parse ext output shape success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  113. return SUCCESS;
  114. }
  115. Status AicpuExtInfoHandler::ParseExtSessionInfo(AicpuExtInfo *aicpu_ext_info) {
  116. GE_CHK_BOOL_RET_STATUS(aicpu_ext_info->infoLen == sizeof(AicpuSessionInfo), PARAM_INVALID,
  117. "Node[%s] parse ext session info failed as infoLen must be %zu but %u.",
  118. node_name_.c_str(), sizeof(SessionInfo), aicpu_ext_info->infoLen);
  119. session_info_ = reinterpret_cast<AicpuSessionInfo *>(aicpu_ext_info->infoMsg);
  120. GELOGI("Node[%s] parse session info success infoLen=%u.", node_name_.c_str(), aicpu_ext_info->infoLen);
  121. return SUCCESS;
  122. }
  123. Status AicpuExtInfoHandler::UpdateSessionInfo(uint64_t session_id, uint64_t kernel_id, bool sess_flag) {
  124. if (session_info_ == nullptr) {
  125. GELOGD("There is no session info in ext_info, no need update.");
  126. return SUCCESS;
  127. }
  128. session_info_->sessionId = session_id;
  129. session_info_->kernelId = kernel_id;
  130. session_info_->sessFlag = sess_flag;
  131. return SUCCESS;
  132. }
  133. Status AicpuExtInfoHandler::UpdateSessionInfoSessionId(uint64_t session_id) {
  134. if (session_info_ == nullptr) {
  135. GELOGD("There is no session info in ext_info, no need update.");
  136. return SUCCESS;
  137. }
  138. session_info_->sessionId = session_id;
  139. session_info_->sessFlag = true;
  140. return SUCCESS;
  141. }
  142. Status AicpuExtInfoHandler::UpdateInputShapeAndType(uint32_t input_index, const GeTensorDesc &input_desc) {
  143. GE_CHECK_LE(input_index, input_num_);
  144. const auto &shape = input_desc.GetShape();
  145. GE_CHK_STATUS_RET(UpdateShapeAndType(shape, input_desc.GetDataType(), input_shape_and_type_[input_index]),
  146. "Node[%s] input[%u] update input shape and type failed.",
  147. node_name_.c_str(), input_index);
  148. return SUCCESS;
  149. }
  150. Status AicpuExtInfoHandler::UpdateOutputShapeAndType(uint32_t output_index, const GeTensorDesc &output_desc) {
  151. GE_CHK_BOOL_RET_STATUS((unknown_type_ != DEPEND_COMPUTE), INTERNAL_ERROR,
  152. "Node[%s] is depend compute is no need update output shape and type by ext.",
  153. node_name_.c_str());
  154. GE_CHECK_LE(output_index, output_num_);
  155. auto shape = output_desc.GetShape();
  156. // shape range need use range update shape
  157. if (unknown_type_ == DEPEND_SHAPE_RANGE) {
  158. std::vector<std::pair<int64_t, int64_t>> range;
  159. auto range_ret = output_desc.GetShapeRange(range);
  160. GE_CHK_BOOL_RET_STATUS(range_ret == GRAPH_SUCCESS, INTERNAL_ERROR,
  161. "Node[%s] is shape range type but get GetShapeRange failed, ret=%u.",
  162. node_name_.c_str(), range_ret);
  163. for (size_t k = 0; k < range.size(); ++k) {
  164. if (shape.GetDim(k) < 0 && k < range.size()) {
  165. GELOGD("Node[%s] output[%u] update dim[%zu] from %ld to range max %ld.",
  166. node_name_.c_str(), output_index, k, shape.GetDim(k), range[k].second);
  167. shape.SetDim(k, range[k].second);
  168. }
  169. }
  170. }
  171. return UpdateShapeAndType(shape, output_desc.GetDataType(), output_shape_and_type_[output_index]);
  172. }
  173. Status AicpuExtInfoHandler::GetOutputShapeAndType(uint32_t output_index, GeShape &shape, DataType &data_type) {
  174. GE_CHK_BOOL_RET_STATUS((unknown_type_ != DEPEND_COMPUTE), INTERNAL_ERROR,
  175. "Node[%s] is depend compute type can not get output shape and type by ext.",
  176. node_name_.c_str());
  177. GetShapeAndType(output_shape_and_type_[output_index], shape, data_type);
  178. return SUCCESS;
  179. }
  180. Status AicpuExtInfoHandler::UpdateShapeAndType(const GeShape &shape, DataType data_type,
  181. AicpuShapeAndType *shape_and_type) {
  182. auto dim_num = shape.GetDimNum();
  183. if (dim_num > aicpu::FWKAdapter::kMaxShapeDims) {
  184. GELOGE(PARAM_INVALID, "Update shape and type failed, as dim_num %zu is over max shape dims %u.",
  185. dim_num, aicpu::FWKAdapter::kMaxShapeDims);
  186. return PARAM_INVALID;
  187. }
  188. size_t index = 0;
  189. for (; index < dim_num; ++index) {
  190. shape_and_type->dims[index] = shape.GetDim(index);
  191. }
  192. if (index < aicpu::FWKAdapter::kMaxShapeDims) {
  193. shape_and_type->dims[index] = kDimEndFlag;
  194. }
  195. // now only support update shape, type is not support
  196. return SUCCESS;
  197. }
  198. void AicpuExtInfoHandler::GetShapeAndType(const AicpuShapeAndType *shape_and_type,
  199. GeShape &shape,
  200. DataType &data_type) {
  201. std::vector<int64_t> dims;
  202. for (uint32_t index = 0; index < aicpu::FWKAdapter::kMaxShapeDims; ++index) {
  203. auto tmpDim = shape_and_type->dims[index];
  204. if (tmpDim == kDimEndFlag) {
  205. break;
  206. }
  207. dims.emplace_back(tmpDim);
  208. }
  209. data_type = static_cast<DataType>(shape_and_type->type);
  210. shape = GeShape(dims);
  211. }
  212. } // namespace hybrid
  213. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。