You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ge_executor.cc 40 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <ctime>
  19. #include <iostream>
  20. #include "common/debug/log.h"
  21. #include "common/ge/ge_util.h"
  22. #include "common/helper/model_helper.h"
  23. #include "common/profiling/profiling_manager.h"
  24. #include "common/dump/dump_manager.h"
  25. #include "graph/execute/graph_execute.h"
  26. #include "graph/load/graph_loader.h"
  27. #include "graph/load/model_manager/model_manager.h"
  28. #include "graph/manager/graph_mem_allocator.h"
  29. #include "single_op/single_op_manager.h"
  30. #include "graph/load/model_manager/davinci_model.h"
  31. #include "opskernel_manager/ops_kernel_builder_manager.h"
  32. using std::string;
  33. using std::vector;
  34. namespace {
  // Number of entries expected in one gear of a dynamic-batch model.
  constexpr size_t kDynamicBatchSizeVecSize = 1;
  // NOTE(review): not referenced in the visible part of this file.
  constexpr size_t kStaticBatchInfoSize = 1;
  // Number of entries expected in one gear of a dynamic-image-size model (height, width).
  constexpr size_t kDynamicImageSizeVecSize = 2;
  // Number of values copied to the device for a dynamic image size (height, width).
  constexpr size_t kDynamicImageSizeInputSize = 2;
  // Prefix of the batch label; the index of the matched gear is appended to it.
  constexpr const char *kBatchLabel = "Batch_";
  40. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  41. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  42. const std::vector<uint32_t> &formats) {
  43. uint32_t idx = 0;
  44. for (auto desc_item : domi_descs) {
  45. ge::TensorDesc ge_desc;
  46. ge_desc.SetName(desc_item.name.c_str());
  47. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  48. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  49. std::vector<int64_t> shape_dims;
  50. for (auto dim : desc_item.shape_info.dims) {
  51. shape_dims.push_back(dim);
  52. }
  53. ge::Shape ge_shape(shape_dims);
  54. ge_desc.SetShape(ge_shape);
  55. ge_desc.SetSize(desc_item.size);
  56. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  57. ge_descs.emplace_back(ge_desc);
  58. ++idx;
  59. }
  60. }
  61. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  62. inputs.index = input_data.index;
  63. inputs.model_id = input_data.modelId;
  64. inputs.timestamp = input_data.timestamp;
  65. inputs.timeout = input_data.timeout;
  66. inputs.request_id = input_data.request_id;
  67. for (const auto &data_item : input_data.blobs) {
  68. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  69. inputs.blobs.emplace_back(dataBuf);
  70. }
  71. }
  72. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  73. outputs.index = output_data.index;
  74. outputs.model_id = output_data.modelId;
  75. for (const auto &data_item : output_data.blobs) {
  76. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  77. outputs.blobs.emplace_back(dataBuf);
  78. }
  79. }
  80. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  81. ge::InputData &inputs) {
  82. inputs.is_dynamic_batch = true;
  83. std::string batch_label;
  84. size_t match_idx = 0;
  85. for (size_t i = 0; i < batch_info.size(); ++i) {
  86. // dynamic_dims
  87. if (input_data.dynamic_dims.size() != 0) {
  88. bool is_match = true;
  89. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  90. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  91. is_match = false;
  92. break;
  93. }
  94. }
  95. if (is_match) {
  96. match_idx = i;
  97. break;
  98. }
  99. // dynamic_batch_size
  100. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  101. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  102. match_idx = i;
  103. break;
  104. // dynamic_image_size
  105. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  106. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  107. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  108. match_idx = i;
  109. break;
  110. }
  111. }
  112. batch_label = kBatchLabel + std::to_string(match_idx);
  113. inputs.batch_label = batch_label;
  114. GELOGI("current batch label:%s", batch_label.c_str());
  115. }
  116. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  117. if (batch_info.empty()) {
  118. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  119. return false;
  120. }
  121. for (auto batch : batch_info) {
  122. if (batch.size() != kDynamicBatchSizeVecSize) {
  123. GELOGE(ge::FAILED, "Dynamic batch param num is %zu, current batch size is %zu.", kDynamicBatchSizeVecSize,
  124. batch.size());
  125. return false;
  126. }
  127. if (batch[0] == static_cast<int64_t>(batch_size)) {
  128. return true;
  129. }
  130. }
  131. GELOGE(ge::FAILED, "Dynamic batch %lu can not match the gear of model.", batch_size);
  132. return false;
  133. }
  134. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  135. const vector<std::vector<int64_t>> &batch_info) {
  136. if (batch_info.empty()) {
  137. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  138. return false;
  139. }
  140. for (auto resolution : batch_info) {
  141. if (resolution.size() != kDynamicImageSizeVecSize) {
  142. GELOGE(ge::FAILED, "Dynamic resolution param num is %zu, current resolution size is %zu.",
  143. kDynamicImageSizeVecSize, resolution.size());
  144. return false;
  145. }
  146. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  147. return true;
  148. }
  149. }
  150. GELOGE(ge::FAILED, "Dynamic resolution (%lu,%lu) can not match the gear of model.", image_height, image_width);
  151. return false;
  152. }
  153. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims,
  154. const vector<vector<int64_t>> &batch_info) {
  155. if (batch_info.empty()) {
  156. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "Dynamic batch info is empty.");
  157. return false;
  158. }
  159. bool find_match = false;
  160. for (auto resolution : batch_info) {
  161. if (cur_dynamic_dims.size() != resolution.size()) {
  162. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "Cur dynamic dims param num is %zu, current resolution size is %zu.",
  163. cur_dynamic_dims.size(), resolution.size());
  164. return false;
  165. }
  166. bool flag = true;
  167. for (std::size_t i = 0; i < resolution.size(); ++i) {
  168. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  169. flag = false;
  170. break;
  171. }
  172. }
  173. if (flag) {
  174. find_match = true;
  175. break;
  176. }
  177. }
  178. if (!find_match) {
  179. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "choose dynamic dims can not match the gear of model.");
  180. }
  181. return find_match;
  182. }
  183. } // namespace
  184. namespace ge {
  185. bool GeExecutor::isInit_ = false;
  186. GeExecutor::GeExecutor() {}
  187. Status GeExecutor::Initialize() {
  188. GELOGI("Init GeExecutor begin.");
  189. if (isInit_) {
  190. GELOGW("Already initialized, no need to be initialized again.");
  191. return ge::SUCCESS;
  192. }
  193. std::vector<rtMemType_t> mem_type(1, RT_MEMORY_HBM);
  194. mem_type.push_back(RT_MEMORY_P2P_DDR);
  195. auto ret = MemManager::Instance().Initialize(mem_type);
  196. if (ret != SUCCESS) {
  197. GELOGE(ret, "Memory Manager init failed.");
  198. return ret;
  199. }
  200. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  201. "Failed to initialize OpsKernelBuilders.");
  202. // Start profiling
  203. Options profiling_options;
  204. profiling_options.device_id = 0;
  205. // job id need to be set, the value is meaningless;
  206. profiling_options.job_id = "1";
  207. ProfilingManager::Instance().Init(profiling_options);
  208. isInit_ = true;
  209. GELOGI("Init GeExecutor over.");
  210. return ge::SUCCESS;
  211. }
  212. Status GeExecutor::Finalize() {
  213. GELOGI("Uninit GeExecutor begin.");
  214. if (isInit_ == false) {
  215. GELOGW("GeExecutor has not been initialized.");
  216. return ge::SUCCESS;
  217. }
  218. (void) OpsKernelBuilderManager::Instance().Finalize();
  219. // Stop profiling
  220. if (ProfilingManager::Instance().ProfilingOn()) {
  221. ProfilingManager::Instance().StopProfiling();
  222. ProfilingManager::Instance().PluginUnInit();
  223. }
  224. GELOGI("Uninit GeExecutor over.");
  225. return ge::SUCCESS;
  226. }
  227. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  228. uint64_t batch_size) {
  229. if (dynamic_input_addr == nullptr) {
  230. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  231. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  232. }
  233. uint64_t size = sizeof(uint32_t);
  234. if (length < size) {
  235. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size [%lu] is less than [%lu]!", length, size);
  236. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  237. }
  238. if (length >= sizeof(uint64_t)) {
  239. size = sizeof(uint64_t);
  240. }
  241. // Verify whether the input dynamic batch matches the model gear
  242. std::vector<std::vector<int64_t>> batch_info;
  243. std::vector<uint64_t> batch_num{batch_size};
  244. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  245. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  246. if (ret != SUCCESS) {
  247. GELOGE(ret, "Get dynamic input info failed.");
  248. return ret;
  249. }
  250. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  251. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  252. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  253. }
  254. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  255. if (ret != SUCCESS) {
  256. GELOGE(ret, "Set dynamic size failed");
  257. return ret;
  258. }
  259. // memcpy dynamic_batch_size from host to device
  260. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  261. if (rt_ret != RT_ERROR_NONE) {
  262. GELOGE(rt_ret, "memcpy dynamic batch input data failed! ret: 0x%X", rt_ret);
  263. return RT_ERROR_TO_GE_STATUS(rt_ret);
  264. }
  265. return SUCCESS;
  266. }
  267. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  268. uint64_t image_height, uint64_t image_width) {
  269. if (dynamic_input_addr == nullptr) {
  270. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  271. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  272. }
  273. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  274. if (length < dynamic_input_size) {
  275. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  276. "Dynamic input size [%lu] is less than [%lu]!", length, dynamic_input_size);
  277. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  278. }
  279. uint64_t size = sizeof(uint32_t);
  280. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  281. size = sizeof(uint64_t);
  282. }
  283. // Verify whether the input dynamic resolution matches the model gear
  284. std::vector<std::vector<int64_t>> batch_info;
  285. std::vector<uint64_t> batch_num{image_height, image_width};
  286. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  287. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  288. if (ret != SUCCESS) {
  289. GELOGE(ret, "Get dynamic input info failed.");
  290. return ret;
  291. }
  292. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  293. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  294. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  295. }
  296. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  297. if (ret != SUCCESS) {
  298. GELOGE(ret, "Set dynamic size failed");
  299. return ret;
  300. }
  301. // Memcpy dynamic resolution height from host to device
  302. rtError_t rt_ret =
  303. rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  304. if (rt_ret != RT_ERROR_NONE) {
  305. GELOGE(rt_ret, "memcpy dynamic resolution input data failed! ret: 0x%X", rt_ret);
  306. return RT_ERROR_TO_GE_STATUS(rt_ret);
  307. }
  308. uint64_t remain_size = length - size;
  309. // Memcpy dynamic resolution width from host to device
  310. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size),
  311. remain_size, &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  312. if (rt_ret != RT_ERROR_NONE) {
  313. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  314. return RT_ERROR_TO_GE_STATUS(rt_ret);
  315. }
  316. return SUCCESS;
  317. }
  318. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  319. const vector<uint64_t> &dynamic_dims) {
  320. if (dynamic_input_addr == nullptr) {
  321. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  322. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  323. }
  324. vector<uint64_t> cur_dynamic_dims;
  325. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  326. if (ret != SUCCESS) {
  327. GELOGE(ret, "Set cur gear dynamic dims failed");
  328. return ret;
  329. }
  330. std::vector<std::vector<int64_t>> batch_info;
  331. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  332. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  333. if (ret != SUCCESS) {
  334. GELOGE(ret, "Get dynamic input info failed.");
  335. return ret;
  336. }
  337. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  338. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  339. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  340. }
  341. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  342. if (ret != SUCCESS) {
  343. GELOGE(ret, "Set dynamic size failed");
  344. return ret;
  345. }
  346. size_t dynamic_dim_num = cur_dynamic_dims.size();
  347. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  348. if (length < dynamic_input_size) {
  349. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  350. "Dynamic input size [%lu] is less than [%lu]!", length, dynamic_input_size);
  351. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  352. }
  353. uint64_t size = sizeof(uint32_t);
  354. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  355. size = sizeof(uint64_t);
  356. }
  357. rtError_t rt_ret;
  358. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  359. // Memcpy dynamic dim[i] from host to device
  360. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  361. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  362. if (rt_ret != RT_ERROR_NONE) {
  363. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  364. return RT_ERROR_TO_GE_STATUS(rt_ret);
  365. }
  366. }
  367. return SUCCESS;
  368. }
  369. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  370. vector<uint64_t> &cur_dynamic_dims) {
  371. cur_dynamic_dims.clear();
  372. vector<ge::TensorDesc> input_desc;
  373. vector<ge::TensorDesc> output_desc;
  374. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  375. if (ret != ge::SUCCESS) {
  376. GELOGE(ret, "GetModelDescInfo failed.");
  377. return ret;
  378. }
  379. vector<string> user_designate_shape_order;
  380. vector<int64_t> all_data_dims;
  381. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  382. if (ret != ge::SUCCESS) {
  383. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  384. return ret;
  385. }
  386. for (auto &data_name : user_designate_shape_order) {
  387. for (auto &desc : input_desc) {
  388. if (desc.GetName() == data_name) {
  389. for (auto dim : desc.GetShape().GetDims()) {
  390. all_data_dims.push_back(dim);
  391. }
  392. break;
  393. }
  394. }
  395. }
  396. if (dynamic_dims.size() != all_data_dims.size()){
  397. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  398. "Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  399. dynamic_dims.size(), all_data_dims.size());
  400. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  401. }
  402. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  403. if (all_data_dims[i] < 0) {
  404. cur_dynamic_dims.push_back(dynamic_dims[i]);
  405. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  406. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  407. "Static dims should be same, index: %zu value: %lu should be %ld",
  408. i, dynamic_dims[i], all_data_dims[i]);
  409. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  410. }
  411. }
  412. return SUCCESS;
  413. }
  414. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  415. GELOGI("Begin to get current shape");
  416. if (!isInit_) {
  417. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  418. return ACL_ERROR_GE_EXEC_NOT_INIT;
  419. }
  420. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  421. if (ret != SUCCESS) {
  422. GELOGE(ret, "Get current shape failed");
  423. return ret;
  424. }
  425. return SUCCESS;
  426. }
  427. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  428. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  429. const kAippDynamicPara &aippParms) {
  430. GELOGI("Enter to SetDynamicAippData.");
  431. if (dynamic_input_addr == nullptr) {
  432. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic aipp input addr is nullptr!");
  433. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  434. }
  435. if (aippBatchPara.empty()) {
  436. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "aippBatchPara is empty.");
  437. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  438. }
  439. uint64_t batch_num = aippBatchPara.size();
  440. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  441. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  442. GELOGI(
  443. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  444. "batch num is %lu, struct_len is %lu",
  445. model_id, length, batch_num, struct_len);
  446. if (struct_len > length) {
  447. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  448. "input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]", struct_len, length);
  449. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  450. }
  451. // Memcpy real kAippDynamicBatchPara from host to device
  452. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  453. if (rt_ret != RT_ERROR_NONE) {
  454. GELOGE(rt_ret, "memcpy real_aippParms_size failed! ret: 0x%X", rt_ret);
  455. return RT_ERROR_TO_GE_STATUS(rt_ret);
  456. }
  457. uint64_t remain_len = length - real_aippParms_size;
  458. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  459. for (uint64_t i = 0; i < batch_num; ++i) {
  460. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  461. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  462. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  463. if (rt_ret != RT_ERROR_NONE) {
  464. GELOGE(rt_ret, "memcpy kAippDynamicBatchPara input data failed! ret: 0x%X", rt_ret);
  465. return RT_ERROR_TO_GE_STATUS(rt_ret);
  466. }
  467. }
  468. return SUCCESS;
  469. }
  470. Status GeExecutor::UnloadModel(uint32_t model_id) {
  471. GELOGD("unload model %u begin.", model_id);
  472. if (!isInit_) {
  473. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  474. return ACL_ERROR_GE_EXEC_NOT_INIT;
  475. }
  476. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  477. if (ret != SUCCESS) {
  478. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  479. return ret;
  480. }
  481. std::shared_ptr<hybrid::HybridDavinciModel> hybrid_davinci_model =
  482. ModelManager::GetInstance()->GetHybridModel(model_id);
  483. if (hybrid_davinci_model != nullptr) {
  484. uint64_t session_id = hybrid_davinci_model->GetSessionId();
  485. VarManagerPool::Instance().RemoveVarManager(session_id);
  486. } else {
  487. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  488. if (davinci_model != nullptr) {
  489. uint64_t session_id = davinci_model->GetSessionId();
  490. VarManagerPool::Instance().RemoveVarManager(session_id);
  491. }
  492. }
  493. ret = GraphLoader::UnloadModel(model_id);
  494. if (ret != SUCCESS) {
  495. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  496. return ret;
  497. }
  498. return SUCCESS;
  499. }
  500. // Get input and output descriptor
  501. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  502. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  503. if (!isInit_) {
  504. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  505. return ACL_ERROR_GE_EXEC_NOT_INIT;
  506. }
  507. std::vector<InputOutputDescInfo> input_desc_infos;
  508. std::vector<InputOutputDescInfo> output_desc_infos;
  509. std::vector<uint32_t> input_formats;
  510. std::vector<uint32_t> output_formats;
  511. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  512. output_formats, new_model_desc);
  513. if (ret != domi::SUCCESS) {
  514. GELOGE(ret, "GetInputOutputDescInfo failed. ret = %u", ret);
  515. return ACL_ERROR_GE_GET_TENSOR_INFO;
  516. }
  517. if (input_formats.size() != input_desc_infos.size()) {
  518. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  519. "input_formats size %zu is not equal to input_desc_infos size %zu.",
  520. input_formats.size(), input_desc_infos.size());
  521. return ACL_ERROR_GE_PARAM_INVALID;
  522. }
  523. if (output_formats.size() != output_desc_infos.size()) {
  524. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "output_formats size %zu is not equal to output_desc_infos size %zu.",
  525. output_formats.size(), output_desc_infos.size());
  526. return ACL_ERROR_GE_PARAM_INVALID;
  527. }
  528. // Transfer data to TensorDesc
  529. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  530. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  531. return ge::SUCCESS;
  532. }
  533. ///
  534. /// @ingroup ge
  535. /// @brief Get dynamic batch_info
  536. /// @param [in] model_id
  537. /// @param [out] batch_info
  538. /// @param [out] dynamic_type
  539. /// @return execute result
  540. ///
  541. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  542. int32_t &dynamic_type) {
  543. if (!isInit_) {
  544. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  545. return ACL_ERROR_GE_EXEC_NOT_INIT;
  546. }
  547. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  548. if (ret != SUCCESS) {
  549. GELOGE(ret, "GetDynamicBatchInfo failed.");
  550. return ret;
  551. }
  552. return SUCCESS;
  553. }
  554. ///
  555. /// @ingroup ge
  556. /// @brief Get combined dynamic dims info
  557. /// @param [in] model_id
  558. /// @param [out] batch_info
  559. /// @return execute result
  560. ///
  561. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  562. GELOGI("Begin to get combined dynamic dims info.");
  563. if (!isInit_) {
  564. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  565. return ACL_ERROR_GE_EXEC_NOT_INIT;
  566. }
  567. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  568. if (ret != SUCCESS) {
  569. GELOGE(ret, "GetCombinedDynamicDims failed.");
  570. return ret;
  571. }
  572. GELOGI("Get combined dynamic dims succ.");
  573. return SUCCESS;
  574. }
  575. ///
  576. /// @ingroup ge
  577. /// @brief Get user designeate shape order
  578. /// @param [in] model_id
  579. /// @param [out] user_designate_shape_order
  580. /// @return execute result
  581. ///
  582. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  583. if (!isInit_) {
  584. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  585. return ACL_ERROR_GE_EXEC_NOT_INIT;
  586. }
  587. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  588. if (ret != SUCCESS) {
  589. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  590. return ret;
  591. }
  592. return SUCCESS;
  593. }
  594. ///
  595. /// @ingroup ge
  596. /// @brief Get AIPP input format
  597. /// @param [in] model_id
  598. /// @param [in] index
  599. /// @param [out] input_format
  600. /// @return execute result
  601. ///
  602. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  603. GELOGI("Begin to GetAIPPInfo.");
  604. if (!isInit_) {
  605. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  606. return ACL_ERROR_GE_EXEC_NOT_INIT;
  607. }
  608. Status ret = GraphExecutor::GetAippInfo(model_id, index, aipp_info);
  609. if (ret != SUCCESS) {
  610. GELOGW("GetAIPPInfo is not success.");
  611. return ret;
  612. }
  613. GELOGI("GetAIPPInfo succ.");
  614. return SUCCESS;
  615. }
  616. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  617. GELOGI("Begin to get aipp type.");
  618. if (!isInit_) {
  619. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  620. return ACL_ERROR_GE_EXEC_NOT_INIT;
  621. }
  622. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  623. if (ret != SUCCESS) {
  624. GELOGW("Get aipp type is not success.");
  625. return ret;
  626. }
  627. GELOGI("Get aipp type success.");
  628. return SUCCESS;
  629. }
  630. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  631. if (!isInit_) {
  632. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  633. return ACL_ERROR_GE_EXEC_NOT_INIT;
  634. }
  635. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  636. if (ret != SUCCESS) {
  637. GELOGE(ret, "Get dynamic batch output shape info failed.");
  638. return ret;
  639. }
  640. return SUCCESS;
  641. }
  642. Status GeExecutor::CommandHandle(const Command &command) {
  643. Status ret = GraphLoader::CommandHandle(command);
  644. if (ret != SUCCESS) {
  645. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "CommandHandle: Command Handle failed.");
  646. return ACL_ERROR_GE_COMMAND_HANDLE;
  647. }
  648. return SUCCESS;
  649. }
  650. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  651. GELOGI("Get max used memory begin.");
  652. if (!isInit_) {
  653. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  654. return ACL_ERROR_GE_EXEC_NOT_INIT;
  655. }
  656. uint64_t max_mem_size = 0;
  657. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  658. max_size = static_cast<uint32_t>(max_mem_size);
  659. return ret;
  660. }
  661. /**
  662. * @ingroup ge
  663. * @brief Load data from model file to memory
  664. * @param [in] const std::string &path: Offline model file path
  665. * @param [out] domi::ModelData &model_data: Offline model memory data
  666. * @return SUCCESS handle successfully / others handle failed
  667. */
  668. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  669. GELOGI("Load data from file begin.");
  670. if (!isInit_) {
  671. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  672. return ACL_ERROR_GE_EXEC_NOT_INIT;
  673. }
  674. string filePath = RealPath(path.c_str());
  675. if (filePath.empty()) {
  676. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  677. "File path is invalid. please check your text file '%s'.", path.c_str());
  678. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  679. }
  680. GELOGI("load modelData from file: %s.", path.c_str());
  681. std::string key_path;
  682. int32_t priority = 0;
  683. Status ret = GraphLoader::LoadDataFromFile(path, key_path, priority, model_data);
  684. if (ret != SUCCESS) {
  685. if (model_data.model_data != nullptr) {
  686. delete[] static_cast<char *>(model_data.model_data);
  687. model_data.model_data = nullptr;
  688. }
  689. }
  690. return ret;
  691. }
  692. /**
  693. * @ingroup ge
  694. * @brief Load model from offline model memory data
  695. * @param [in] domi::ModelData &model_data: Offline model data
  696. void *dev_ptr: Input/Output memory start address
  697. size_t memsize: Input/Output memory length
  698. void *weight_ptr: Weight memory start address
  699. size_t weightsize: Weight memory length
  700. * @param [out] uint32_t &model_id: identification after model loading
  701. * @return SUCCESS handle successfully / others handle failed
  702. */
  703. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  704. void *weight_ptr, size_t weight_size) {
  705. if (!isInit_) {
  706. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  707. return ACL_ERROR_GE_EXEC_NOT_INIT;
  708. }
  709. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  710. }
  711. /**
  712. * @ingroup ge
  713. * @brief Load task list from ModelData with queue.
  714. * @param [out] model_id: model id allocate from manager.
  715. * @param [in] ge_model_data: Model data load from offline model.
  716. * @param [in] input_queue_ids: input queue ids create from user.
  717. * @param [in] output_queue_ids: input queue ids create from user.
  718. * @return: 0 for success / others for fail
  719. */
  720. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  721. const std::vector<uint32_t> &input_queue_ids,
  722. const std::vector<uint32_t> &output_queue_ids) {
  723. GELOGI("Load model with queue begin.");
  724. if (!isInit_) {
  725. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  726. return ACL_ERROR_GE_EXEC_NOT_INIT;
  727. }
  728. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  729. }
  730. /**
  731. * @ingroup ge
  732. * @brief Synchronous execution of offline model(Do not create thread)
  733. * @param [in] uint32_t model_id: Model ID to execute
  734. void* stream: stream to execute
  735. const domi::InputData *input_data: Model input data
  736. bool async_mode: is asynchronize mode.
  737. * @param [out] domi::OutputData *output_data: Model output data
  738. * @return SUCCESS handle successfully / others handle failed
  739. */
  740. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  741. ge::RunModelData &run_output_data, bool async_mode) {
  742. std::vector<GeTensorDesc> input_desc = {};
  743. std::vector<GeTensorDesc> output_desc = {};
  744. return ExecModel(model_id, stream, run_input_data, input_desc, run_output_data, output_desc, async_mode);
  745. }
  746. /**
  747. * @ingroup ge
  748. * @brief Synchronous execution of offline model(Do not create thread)
  749. * @param [in] uint32_t model_id: Model ID to execute
  750. void* stream: stream to execute
  751. const domi::InputData *input_data: Model input data
  752. const std::vector<GeTensorDesc> &input_desc: Description of model input data
  753. bool async_mode: is asynchronize mode
  754. * @param [out] domi::OutputData *output_data: Model output data
  755. * @param [out] std::vector<GeTensorDesc> &output_desc: Description of model output data
  756. * @return SUCCESS handle successfully / others handle failed
  757. */
  758. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  759. const std::vector<GeTensorDesc> &input_desc, ge::RunModelData &run_output_data,
  760. std::vector<GeTensorDesc> &output_desc, bool async_mode) {
  761. if (!isInit_) {
  762. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  763. return ACL_ERROR_GE_EXEC_NOT_INIT;
  764. }
  765. InputData input_data;
  766. OutputData output_data;
  767. GetDomiInputData(run_input_data, input_data);
  768. GetDomiOutputData(run_output_data, output_data);
  769. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  770. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  771. std::vector<std::vector<int64_t>> batch_info;
  772. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  773. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  774. if (ret != SUCCESS) {
  775. GELOGE(ret, "Get dynamic input info failed.");
  776. return ret;
  777. }
  778. if (!batch_info.empty()) {
  779. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  780. }
  781. }
  782. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, input_desc, output_data, output_desc);
  783. }
  784. /**
  785. * @ingroup ge
  786. * @brief Get weight memory size from model file
  787. * @param [in] const std::string &path: Offline model file path
  788. * @param [out] size_t &mem_size Execution memory size
  789. size_t &weight_size Weight memory space size
  790. * @return SUCCESS handle successfully / others handle failed
  791. */
  792. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  793. GELOGI("Get memory and weight size from file begin.");
  794. if (!isInit_) {
  795. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  796. return ACL_ERROR_GE_EXEC_NOT_INIT;
  797. }
  798. ModelData model;
  799. std::string key;
  800. Status ret = ge::GraphLoader::LoadDataFromFile(path, key, 0, model);
  801. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  802. GELOGE(ret, "Load data from file failed. ret = %d", ret);
  803. return ret;
  804. }
  805. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  806. delete[] static_cast<char *>(model.model_data);
  807. model.model_data = nullptr;
  808. return ret;
  809. }
  810. /**
  811. * @ingroup ge
  812. * @brief Get weight memory size from model file
  813. * @param [in] const void *model_data Offline model buffer
  814. size_t model_size Offline model buffer length
  815. * @param [out] size_t &mem_size Execution memory size
  816. size_t &weight_size Weight memory space size
  817. * @return SUCCESS handle successfully / others handle failed
  818. */
  819. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  820. size_t &weight_size) {
  821. GELOGI("Get memory and weight size from data begin.");
  822. if (!isInit_) {
  823. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  824. return ACL_ERROR_GE_EXEC_NOT_INIT;
  825. }
  826. if (model_data == nullptr) {
  827. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "invalid model data!");
  828. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  829. }
  830. ModelData model;
  831. model.model_data = const_cast<void *>(model_data);
  832. model.model_len = static_cast<uint32_t>(model_size);
  833. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  834. }
  835. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  836. SingleOp **single_op) {
  837. return LoadSingleOpV2(model_name, modelData, stream, single_op, 0);
  838. }
  839. Status GeExecutor::LoadSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  840. SingleOp **single_op, const uint64_t model_id) {
  841. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op, model_id);
  842. }
  843. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  844. DynamicSingleOp **single_op) {
  845. return LoadDynamicSingleOpV2(model_name, modelData, stream, single_op, 0);
  846. }
  847. Status GeExecutor::LoadDynamicSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  848. DynamicSingleOp **single_op, const uint64_t model_id) {
  849. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op, model_id);
  850. }
  851. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  852. std::vector<DataBuffer> &outputs) {
  853. if (executor == nullptr) {
  854. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "param is NULL");
  855. return ACL_ERROR_GE_EXEC_NOT_INIT;
  856. }
  857. return executor->ExecuteAsync(inputs, outputs);
  858. }
  859. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  860. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  861. vector<DataBuffer> &outputs) {
  862. GE_CHECK_NOTNULL(executor);
  863. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  864. }
  865. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  866. ModelManager::GetInstance()->ClearAicpuSo();
  867. return SingleOpManager::GetInstance().ReleaseResource(stream);
  868. }
  869. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  870. auto model_manager = ModelManager::GetInstance();
  871. GE_CHECK_NOTNULL(model_manager);
  872. auto davinci_model = model_manager->GetModel(model_id);
  873. if (davinci_model == nullptr) {
  874. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID, "Model id: %d is invaild or model is not loaded.", model_id);
  875. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  876. }
  877. device_id = davinci_model->GetDeviceId();
  878. return SUCCESS;
  879. }
  880. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  881. std::vector<std::vector<int64_t>> batch_info;
  882. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  883. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  884. if (ret != SUCCESS) {
  885. GELOGE(ret, "Calc batch info size failed. ret = %d", ret);
  886. return ret;
  887. }
  888. if (batch_info.empty()) {
  889. shape_count = kStaticBatchInfoSize;
  890. } else {
  891. shape_count = batch_info.size();
  892. }
  893. return SUCCESS;
  894. }
  895. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  896. GELOGI("Begin to GetOrigInputInfo.");
  897. if (!isInit_) {
  898. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  899. return ACL_ERROR_GE_EXEC_NOT_INIT;
  900. }
  901. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  902. if (ret != SUCCESS) {
  903. GELOGE(ret, "GetOrigInputInfo failed.");
  904. return ret;
  905. }
  906. GELOGI("GetOrigInputInfo succ.");
  907. return SUCCESS;
  908. }
  909. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  910. std::vector<InputOutputDims> &input_dims,
  911. std::vector<InputOutputDims> &output_dims) {
  912. GELOGI("Begin to GetAllAippInputOutputDims.");
  913. if (!isInit_) {
  914. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  915. return ACL_ERROR_GE_EXEC_NOT_INIT;
  916. }
  917. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  918. if (ret != SUCCESS) {
  919. GELOGE(ret, "GetAllAippInputOutputDims failed.");
  920. return ret;
  921. }
  922. GELOGI("GetAllAippInputOutputDims succ.");
  923. return SUCCESS;
  924. }
  925. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  926. GELOGI("Begin to GetOpDescInfo.");
  927. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  928. if (ret != SUCCESS) {
  929. GELOGE(ret, "GetOpDescInfo failed.");
  930. return ret;
  931. }
  932. GELOGI("GetOpDescInfo succ.");
  933. return SUCCESS;
  934. }
  935. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  936. GELOGI("Start to set dump config");
  937. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  938. if (ret != SUCCESS) {
  939. GELOGE(ret, "Set dump conf failed");
  940. return ret;
  941. }
  942. GELOGI("Set dump config successfully");
  943. return SUCCESS;
  944. }
  945. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示