You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ge_executor.cc 51 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201120212031204120512061207
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "framework/executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <ctime>
  19. #include <iostream>
  20. #include "framework/common/debug/log.h"
  21. #include "common/ge/ge_util.h"
  22. #include "framework/common/helper/model_helper.h"
  23. #include "common/profiling/profiling_manager.h"
  24. #include "common/dump/dump_manager.h"
  25. #include "graph/execute/graph_execute.h"
  26. #include "graph/load/graph_loader.h"
  27. #include "graph/load/model_manager/model_manager.h"
  28. #include "graph/manager/graph_mem_manager.h"
  29. #include "single_op/single_op_manager.h"
  30. #include "graph/load/model_manager/davinci_model.h"
  31. #include "opskernel_manager/ops_kernel_builder_manager.h"
  32. #include "graph/opsproto_manager.h"
  33. #include "ge_local_engine/engine/host_cpu_engine.h"
  34. using std::string;
  35. using std::vector;
  36. namespace {
  // Number of values a gear must hold to be treated as a dynamic-batch gear.
  constexpr size_t kDynamicBatchSizeVecSize = 1;
  // NOTE(review): not referenced in the visible part of this file; presumably used further down.
  constexpr size_t kStaticBatchInfoSize = 1;
  // Number of values (height, width) a gear must hold to be treated as a dynamic-image-size gear.
  constexpr size_t kDynamicImageSizeVecSize = 2;
  // Number of values (height, width) written into the dynamic input buffer for dynamic image size.
  constexpr size_t kDynamicImageSizeInputSize = 2;
  // Prefix of the batch label; the index of the matched gear is appended to it.
  constexpr const char *kBatchLabel = "Batch_";
  42. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  43. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  44. const std::vector<uint32_t> &formats) {
  45. uint32_t idx = 0;
  46. for (auto desc_item : domi_descs) {
  47. ge::TensorDesc ge_desc;
  48. ge_desc.SetName(desc_item.name.c_str());
  49. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  50. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  51. std::vector<int64_t> shape_dims;
  52. for (auto dim : desc_item.shape_info.dims) {
  53. shape_dims.push_back(dim);
  54. }
  55. ge::Shape ge_shape(shape_dims);
  56. ge_desc.SetShape(ge_shape);
  57. ge_desc.SetSize(desc_item.size);
  58. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  59. ge_descs.emplace_back(ge_desc);
  60. ++idx;
  61. }
  62. }
  63. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  64. inputs.index = input_data.index;
  65. inputs.model_id = input_data.modelId;
  66. inputs.timestamp = input_data.timestamp;
  67. inputs.timeout = input_data.timeout;
  68. inputs.request_id = input_data.request_id;
  69. for (const auto &data_item : input_data.blobs) {
  70. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  71. inputs.blobs.emplace_back(dataBuf);
  72. }
  73. }
  74. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  75. outputs.index = output_data.index;
  76. outputs.model_id = output_data.modelId;
  77. for (const auto &data_item : output_data.blobs) {
  78. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  79. outputs.blobs.emplace_back(dataBuf);
  80. }
  81. }
  82. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  83. ge::InputData &inputs) {
  84. inputs.is_dynamic_batch = true;
  85. std::string batch_label;
  86. size_t match_idx = 0;
  87. for (size_t i = 0; i < batch_info.size(); ++i) {
  88. // dynamic_dims
  89. if (input_data.dynamic_dims.size() != 0) {
  90. bool is_match = true;
  91. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  92. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  93. is_match = false;
  94. break;
  95. }
  96. }
  97. if (is_match) {
  98. match_idx = i;
  99. break;
  100. }
  101. // dynamic_batch_size
  102. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  103. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  104. match_idx = i;
  105. break;
  106. // dynamic_image_size
  107. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  108. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  109. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  110. match_idx = i;
  111. break;
  112. }
  113. }
  114. batch_label = kBatchLabel + std::to_string(match_idx);
  115. inputs.batch_label = batch_label;
  116. GELOGI("current batch label:%s", batch_label.c_str());
  117. }
  118. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  119. if (batch_info.empty()) {
  120. REPORT_INNER_ERROR("E19999", "param Dynamic batch info is empty, check invalid.");
  121. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch info is empty.");
  122. return false;
  123. }
  124. for (auto batch : batch_info) {
  125. if (batch.size() != kDynamicBatchSizeVecSize) {
  126. REPORT_INNER_ERROR("E19999", "Dynamic batch param num is %zu, current batch size is %zu.",
  127. kDynamicBatchSizeVecSize, batch.size());
  128. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch param num is %zu, current batch size is %zu.",
  129. kDynamicBatchSizeVecSize, batch.size());
  130. return false;
  131. }
  132. if (batch[0] == static_cast<int64_t>(batch_size)) {
  133. return true;
  134. }
  135. }
  136. REPORT_INNER_ERROR("E19999", "Dynamic batch %lu can not match the gear of model.", batch_size);
  137. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch %lu can not match the gear of model.", batch_size);
  138. return false;
  139. }
  140. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  141. const vector<std::vector<int64_t>> &batch_info) {
  142. if (batch_info.empty()) {
  143. REPORT_INNER_ERROR("E19999", "ParamDynamic batch info is empty. check invalid");
  144. GELOGE(ge::FAILED, "[Check][Param] Dynamic batch info is empty.");
  145. return false;
  146. }
  147. for (auto resolution : batch_info) {
  148. if (resolution.size() != kDynamicImageSizeVecSize) {
  149. REPORT_INNER_ERROR("E19999", "Dynamic resolution param num is %zu, current resolution size is %zu.",
  150. kDynamicImageSizeVecSize, resolution.size());
  151. GELOGE(ge::FAILED, "[Check][Param] Dynamic resolution param num is %zu, current resolution size is %zu.",
  152. kDynamicImageSizeVecSize, resolution.size());
  153. return false;
  154. }
  155. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  156. return true;
  157. }
  158. }
  159. REPORT_INNER_ERROR("E19999", "Dynamic resolution (%lu,%lu) can not match the gear of model.",
  160. image_height, image_width);
  161. GELOGE(ge::FAILED, "[Check][Param]Dynamic resolution (%lu,%lu) can not match the gear of model.",
  162. image_height, image_width);
  163. return false;
  164. }
  165. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims,
  166. const vector<vector<int64_t>> &batch_info) {
  167. if (batch_info.empty()) {
  168. REPORT_INNER_ERROR("E19999", "param batch_info is empty, check invalid");
  169. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "[Check][Param] Dynamic batch info is empty.");
  170. return false;
  171. }
  172. bool find_match = false;
  173. for (auto resolution : batch_info) {
  174. if (cur_dynamic_dims.size() != resolution.size()) {
  175. REPORT_INNER_ERROR("E19999", "Cur dynamic dims param num is %zu, current resolution size is %zu.",
  176. cur_dynamic_dims.size(), resolution.size());
  177. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  178. "[Check][Param] Cur dynamic dims param num is %zu, current resolution size is %zu.",
  179. cur_dynamic_dims.size(), resolution.size());
  180. return false;
  181. }
  182. bool flag = true;
  183. for (std::size_t i = 0; i < resolution.size(); ++i) {
  184. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  185. flag = false;
  186. break;
  187. }
  188. }
  189. if (flag) {
  190. find_match = true;
  191. break;
  192. }
  193. }
  194. if (!find_match) {
  195. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "[Check][Param] choose dynamic dims can not match the gear of model.");
  196. }
  197. return find_match;
  198. }
  199. } // namespace
  200. namespace ge {
  201. bool GeExecutor::isInit_ = false;
  202. static void InitOpsProtoManager() {
  203. string opsproto_path;
  204. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  205. if (path_env != nullptr) {
  206. string path = path_env;
  207. string file_path = RealPath(path.c_str());
  208. if (file_path.empty()) {
  209. GELOGE(FAILED, "[Check][EnvPath]ASCEND_OPP_PATH path [%s] is invalid.", path.c_str());
  210. REPORT_INPUT_ERROR("E68016", {"ASCEND_OPP_PATH", path});
  211. return;
  212. }
  213. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  214. GELOGI("Get opsproto so path from env : %s", path.c_str());
  215. } else {
  216. string path_base = PluginManager::GetPath();
  217. GELOGI("path_base is %s", path_base.c_str());
  218. path_base = path_base.substr(0, path_base.rfind('/'));
  219. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  220. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  221. }
  222. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  223. OpsProtoManager *manager = OpsProtoManager::Instance();
  224. map<string, string> option_tmp;
  225. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  226. (void)manager->Initialize(option_tmp);
  227. }
  228. GeExecutor::GeExecutor() {}
  229. Status GeExecutor::Initialize() {
  230. GELOGI("Init GeExecutor begin.");
  231. if (isInit_) {
  232. GELOGW("Already initialized, no need to be initialized again.");
  233. return ge::SUCCESS;
  234. }
  235. OpTilingManager::GetInstance().LoadSo();
  236. Status init_hostcpu_engine_status = HostCpuEngine::GetInstance().Initialize();
  237. if (init_hostcpu_engine_status != SUCCESS) {
  238. GELOGE(init_hostcpu_engine_status, "[initialize][HostCpuEngine] failed");
  239. return init_hostcpu_engine_status;
  240. }
  241. InitOpsProtoManager();
  242. std::vector<rtMemType_t> mem_type(1, RT_MEMORY_HBM);
  243. mem_type.push_back(RT_MEMORY_P2P_DDR);
  244. auto ret = MemManager::Instance().Initialize(mem_type);
  245. if (ret != SUCCESS) {
  246. GELOGE(ret, "[Initialize][MemManager] failed.");
  247. return ret;
  248. }
  249. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  250. "[Initialize][OpsKernelBuilderManager] failed.");
  251. // Start profiling
  252. Options profiling_options;
  253. profiling_options.device_id = 0;
  254. // job id need to be set, the value is meaningless;
  255. profiling_options.job_id = "1";
  256. ProfilingManager::Instance().Init(profiling_options);
  257. isInit_ = true;
  258. GELOGI("Init GeExecutor over.");
  259. return ge::SUCCESS;
  260. }
  261. Status GeExecutor::Finalize() {
  262. GELOGI("Uninit GeExecutor begin.");
  263. if (isInit_ == false) {
  264. GELOGW("GeExecutor has not been initialized.");
  265. return ge::SUCCESS;
  266. }
  267. (void) OpsKernelBuilderManager::Instance().Finalize();
  268. // Stop profiling
  269. if (ProfilingManager::Instance().ProfilingOn()) {
  270. ProfilingManager::Instance().StopProfiling();
  271. ProfilingManager::Instance().PluginUnInit();
  272. }
  273. GELOGI("Uninit GeExecutor over.");
  274. return ge::SUCCESS;
  275. }
  276. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  277. uint64_t batch_size) {
  278. if (dynamic_input_addr == nullptr) {
  279. REPORT_INNER_ERROR("E19999", "param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  280. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  281. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  282. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  283. }
  284. uint64_t size = sizeof(uint32_t);
  285. if (length < size) {
  286. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is less than [%lu], check invalid, model id:%u",
  287. length, size, model_id);
  288. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  289. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u", length, size, model_id);
  290. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  291. }
  292. if (length >= sizeof(uint64_t)) {
  293. size = sizeof(uint64_t);
  294. }
  295. // Verify whether the input dynamic batch matches the model gear
  296. std::vector<std::vector<int64_t>> batch_info;
  297. std::vector<uint64_t> batch_num{batch_size};
  298. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  299. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  300. if (ret != SUCCESS) {
  301. REPORT_CALL_ERROR("E19999", "get dynamic batch info failed, model id:%u", model_id);
  302. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  303. return ret;
  304. }
  305. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  306. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  307. "[Check][Param] The current dynamic input does not match the gear of the model(id:%u).", model_id);
  308. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  309. }
  310. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  311. if (ret != SUCCESS) {
  312. REPORT_CALL_ERROR("E19999", "set dynamic size failed, model id:%u, dynamic_type:1", model_id);
  313. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u, dynamic_type:1", model_id);
  314. return ret;
  315. }
  316. // memcpy dynamic_batch_size from host to device
  317. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  318. if (rt_ret != RT_ERROR_NONE) {
  319. REPORT_CALL_ERROR("E19999", "Call rtMemcpy, size:%lu ret:0x%X", length, rt_ret);
  320. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic batch input data failed! size:%lu ret:0x%X", length, rt_ret);
  321. return RT_ERROR_TO_GE_STATUS(rt_ret);
  322. }
  323. return SUCCESS;
  324. }
  325. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  326. uint64_t image_height, uint64_t image_width) {
  327. if (dynamic_input_addr == nullptr) {
  328. REPORT_INNER_ERROR("E19999", "param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  329. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  330. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  331. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  332. }
  333. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  334. if (length < dynamic_input_size) {
  335. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is less than [%lu], check invalid, model id:%u",
  336. length, dynamic_input_size, model_id);
  337. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  338. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u",
  339. length, dynamic_input_size, model_id);
  340. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  341. }
  342. uint64_t size = sizeof(uint32_t);
  343. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  344. size = sizeof(uint64_t);
  345. }
  346. // Verify whether the input dynamic resolution matches the model gear
  347. std::vector<std::vector<int64_t>> batch_info;
  348. std::vector<uint64_t> batch_num{image_height, image_width};
  349. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  350. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  351. if (ret != SUCCESS) {
  352. REPORT_CALL_ERROR("E19999", "Get dynamic input info failed, model id:%u.", model_id);
  353. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  354. return ret;
  355. }
  356. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  357. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  358. "[Check][Param] The current dynamic input does not match the gear of the model, "
  359. "image_height:%lu, image_width:%lu.", image_height, image_width);
  360. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  361. }
  362. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  363. if (ret != SUCCESS) {
  364. REPORT_CALL_ERROR("E19999", "Set dynamic size failed, model id:%u,", model_id);
  365. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u", model_id);
  366. return ret;
  367. }
  368. // Memcpy dynamic resolution height from host to device
  369. rtError_t rt_ret =
  370. rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  371. if (rt_ret != RT_ERROR_NONE) {
  372. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed! size:%lu, ret:0x%X, model id:%u", size, rt_ret, model_id);
  373. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X, model id:%u",
  374. size, rt_ret, model_id);
  375. return RT_ERROR_TO_GE_STATUS(rt_ret);
  376. }
  377. uint64_t remain_size = length - size;
  378. // Memcpy dynamic resolution width from host to device
  379. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size),
  380. remain_size, &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  381. if (rt_ret != RT_ERROR_NONE) {
  382. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed! size:%lu, ret:0x%X, model id:%u",
  383. remain_size, rt_ret, model_id);
  384. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X, model id:%u",
  385. remain_size, rt_ret, model_id);
  386. return RT_ERROR_TO_GE_STATUS(rt_ret);
  387. }
  388. return SUCCESS;
  389. }
  390. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  391. const vector<uint64_t> &dynamic_dims) {
  392. if (dynamic_input_addr == nullptr) {
  393. REPORT_INNER_ERROR("E19999", "Param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  394. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  395. "[Check][Param] Dynamic input addr is nullptr, model id:%u", model_id);
  396. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  397. }
  398. vector<uint64_t> cur_dynamic_dims;
  399. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  400. if (ret != SUCCESS) {
  401. GELOGE(ret, "[Get][CurDynamicDims] failed, model id:%u", model_id);
  402. return ret;
  403. }
  404. std::vector<std::vector<int64_t>> batch_info;
  405. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  406. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  407. if (ret != SUCCESS) {
  408. REPORT_CALL_ERROR("E19999", "Get dynamic input info failed, model id:%u.", model_id);
  409. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  410. return ret;
  411. }
  412. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  413. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID,
  414. "[Check][Param] The current dynamic input does not match the gear of the model, id:%u.", model_id);
  415. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  416. }
  417. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  418. if (ret != SUCCESS) {
  419. REPORT_CALL_ERROR("E19999", "Set dynamic size failed, model id:%u", model_id);
  420. GELOGE(ret, "[Set][DynamicSize] failed, model id:%u", model_id);
  421. return ret;
  422. }
  423. size_t dynamic_dim_num = cur_dynamic_dims.size();
  424. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  425. if (length < dynamic_input_size) {
  426. REPORT_INNER_ERROR("E19999", "input dynamic size [%lu] is less than [%lu], model id:%u",
  427. length, dynamic_input_size, model_id);
  428. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  429. "[Check][Param] Dynamic input size [%lu] is less than [%lu], model id:%u",
  430. length, dynamic_input_size, model_id);
  431. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  432. }
  433. uint64_t size = sizeof(uint32_t);
  434. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  435. size = sizeof(uint64_t);
  436. }
  437. rtError_t rt_ret;
  438. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  439. // Memcpy dynamic dim[i] from host to device
  440. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  441. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  442. if (rt_ret != RT_ERROR_NONE) {
  443. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, size:%lu, ret:0x%X", (length - size * i), rt_ret);
  444. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy dynamic resolution input data failed! size:%lu, ret:0x%X",
  445. length - size * i, rt_ret);
  446. return RT_ERROR_TO_GE_STATUS(rt_ret);
  447. }
  448. }
  449. return SUCCESS;
  450. }
  451. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  452. vector<uint64_t> &cur_dynamic_dims) {
  453. cur_dynamic_dims.clear();
  454. vector<ge::TensorDesc> input_desc;
  455. vector<ge::TensorDesc> output_desc;
  456. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  457. if (ret != ge::SUCCESS) {
  458. GELOGE(ret, "[Get][ModelDescInfo] failed, model id:%u.", model_id);
  459. return ret;
  460. }
  461. vector<string> user_designate_shape_order;
  462. vector<int64_t> all_data_dims;
  463. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  464. if (ret != ge::SUCCESS) {
  465. GELOGE(ret, "[Call][GetUserDesignateShapeOrder] failed, model id:%u.", model_id);
  466. return ret;
  467. }
  468. for (auto &data_name : user_designate_shape_order) {
  469. for (auto &desc : input_desc) {
  470. if (desc.GetName() == data_name) {
  471. for (auto dim : desc.GetShape().GetDims()) {
  472. all_data_dims.push_back(dim);
  473. }
  474. break;
  475. }
  476. }
  477. }
  478. if (dynamic_dims.size() != all_data_dims.size()){
  479. REPORT_INNER_ERROR("E19999", "Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  480. dynamic_dims.size(), all_data_dims.size());
  481. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  482. "[Check][Param] Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  483. dynamic_dims.size(), all_data_dims.size());
  484. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  485. }
  486. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  487. if (all_data_dims[i] < 0) {
  488. cur_dynamic_dims.push_back(dynamic_dims[i]);
  489. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  490. REPORT_INNER_ERROR("E19999", "Static dims should be same, index:%zu value:%lu should be %ld",
  491. i, dynamic_dims[i], all_data_dims[i]);
  492. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  493. "[Check][Param] Static dims should be same, index:%zu value:%lu should be %ld",
  494. i, dynamic_dims[i], all_data_dims[i]);
  495. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  496. }
  497. }
  498. return SUCCESS;
  499. }
  500. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  501. GELOGI("Begin to get current shape");
  502. if (!isInit_) {
  503. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized, model id:%u", model_id);
  504. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized, model id:%u", model_id);
  505. return ACL_ERROR_GE_EXEC_NOT_INIT;
  506. }
  507. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  508. if (ret != SUCCESS) {
  509. REPORT_CALL_ERROR("E19999", "Get Cur Shape failed, model id:%u", model_id);
  510. GELOGE(ret, "[Get][CurShape] failed, model id:%u", model_id);
  511. return ret;
  512. }
  513. return SUCCESS;
  514. }
  515. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  516. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  517. const kAippDynamicPara &aippParms) {
  518. GELOGI("Enter to SetDynamicAippData.");
  519. if (dynamic_input_addr == nullptr) {
  520. REPORT_INNER_ERROR("E19999", "Param dynamic_input_addr is nullptr, check invalid, model id:%u", model_id);
  521. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID,
  522. "[Check][Param] Dynamic aipp input addr is nullptr, model id:%u", model_id);
  523. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  524. }
  525. if (aippBatchPara.empty()) {
  526. REPORT_INNER_ERROR("E19999", "Param aippBatchPara is empty, check invalid, model id:%u", model_id);
  527. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "[Check][Param] aippBatchPara is empty, model id:%u", model_id);
  528. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  529. }
  530. uint64_t batch_num = aippBatchPara.size();
  531. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  532. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  533. GELOGI(
  534. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  535. "batch num is %lu, struct_len is %lu",
  536. model_id, length, batch_num, struct_len);
  537. if (struct_len > length) {
  538. REPORT_INNER_ERROR("E19999", "input dynamic aipp param len:%lu is larger than aipp_data size:%lu",
  539. struct_len, length);
  540. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  541. "[Check][Param] input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]",
  542. struct_len, length);
  543. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  544. }
  545. // Memcpy real kAippDynamicBatchPara from host to device
  546. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  547. if (rt_ret != RT_ERROR_NONE) {
  548. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, size:%lu, ret:0x%X", length, rt_ret);
  549. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy aippParms failed! size:%lu, ret:0x%X", length, rt_ret);
  550. return RT_ERROR_TO_GE_STATUS(rt_ret);
  551. }
  552. uint64_t remain_len = length - real_aippParms_size;
  553. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  554. for (uint64_t i = 0; i < batch_num; ++i) {
  555. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  556. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  557. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  558. if (rt_ret != RT_ERROR_NONE) {
  559. REPORT_CALL_ERROR("E19999", "Call rtMemcpy failed, ret:0x%X", rt_ret);
  560. GELOGE(rt_ret, "[Call][RtMemcpy] memcpy kAippDynamicBatchPara input data failed! ret:0x%X", rt_ret);
  561. return RT_ERROR_TO_GE_STATUS(rt_ret);
  562. }
  563. }
  564. return SUCCESS;
  565. }
  566. Status GeExecutor::UnloadModel(uint32_t model_id) {
  567. GELOGD("unload model %u begin.", model_id);
  568. if (!isInit_) {
  569. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized");
  570. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  571. return ACL_ERROR_GE_EXEC_NOT_INIT;
  572. }
  573. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  574. if (ret != SUCCESS) {
  575. REPORT_CALL_ERROR("E19999", "Destroy Aicpu Session For Infer failed, model id:%u", model_id);
  576. GELOGE(ret, "[Destroy][AicpuSession] For Infer failed. model id:%u", model_id);
  577. return ret;
  578. }
  579. std::shared_ptr<hybrid::HybridDavinciModel> hybrid_davinci_model =
  580. ModelManager::GetInstance()->GetHybridModel(model_id);
  581. if (hybrid_davinci_model != nullptr) {
  582. uint64_t session_id = hybrid_davinci_model->GetSessionId();
  583. VarManagerPool::Instance().RemoveVarManager(session_id);
  584. } else {
  585. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  586. if (davinci_model != nullptr) {
  587. uint64_t session_id = davinci_model->GetSessionId();
  588. VarManagerPool::Instance().RemoveVarManager(session_id);
  589. }
  590. }
  591. ret = GraphLoader::UnloadModel(model_id);
  592. if (ret != SUCCESS) {
  593. REPORT_CALL_ERROR("E19999", "unload model failed, model id:%u", model_id);
  594. GELOGE(ret, "[Unload][Model] failed. model id:%u", model_id);
  595. return ret;
  596. }
  597. return SUCCESS;
  598. }
  599. // Get input and output descriptor
  600. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  601. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  602. if (!isInit_) {
  603. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized, model id:%u", model_id);
  604. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized, model id:%u", model_id);
  605. return ACL_ERROR_GE_EXEC_NOT_INIT;
  606. }
  607. std::vector<InputOutputDescInfo> input_desc_infos;
  608. std::vector<InputOutputDescInfo> output_desc_infos;
  609. std::vector<uint32_t> input_formats;
  610. std::vector<uint32_t> output_formats;
  611. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  612. output_formats, new_model_desc);
  613. if (ret != domi::SUCCESS) {
  614. REPORT_CALL_ERROR("E19999", "get input output desc info failed, ret = %u, model id:%u", ret, model_id);
  615. GELOGE(ret, "[Get][InputOutputDescInfo] failed. ret = %u, model id:%u", ret, model_id);
  616. return ACL_ERROR_GE_GET_TENSOR_INFO;
  617. }
  618. if (input_formats.size() != input_desc_infos.size()) {
  619. REPORT_INNER_ERROR("E19999", "input_formats size %zu is not equal to input_desc_infos size %zu, model id:%u.",
  620. input_formats.size(), input_desc_infos.size(), model_id);
  621. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  622. "[Check][Param] input_formats size %zu is not equal to input_desc_infos size %zu, model id:%u.",
  623. input_formats.size(), input_desc_infos.size(), model_id);
  624. return ACL_ERROR_GE_PARAM_INVALID;
  625. }
  626. if (output_formats.size() != output_desc_infos.size()) {
  627. REPORT_INNER_ERROR("E19999", "output_formats size %zu is not equal to output_desc_infos size %zu, model id:%u.",
  628. output_formats.size(), output_desc_infos.size(), model_id);
  629. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  630. "[Check][Param] output_formats size %zu is not equal to output_desc_infos size %zu, model id:%u.",
  631. output_formats.size(), output_desc_infos.size(), model_id);
  632. return ACL_ERROR_GE_PARAM_INVALID;
  633. }
  634. // Transfer data to TensorDesc
  635. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  636. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  637. return ge::SUCCESS;
  638. }
  639. ///
  640. /// @ingroup ge
  641. /// @brief Get dynamic batch_info
  642. /// @param [in] model_id
  643. /// @param [out] batch_info
  644. /// @param [out] dynamic_type
  645. /// @return execute result
  646. ///
  647. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  648. int32_t &dynamic_type) {
  649. if (!isInit_) {
  650. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  651. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  652. return ACL_ERROR_GE_EXEC_NOT_INIT;
  653. }
  654. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  655. if (ret != SUCCESS) {
  656. REPORT_CALL_ERROR("E19999", "Get Dynamic BatchInfo failed, model id:%u.", model_id);
  657. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  658. return ret;
  659. }
  660. return SUCCESS;
  661. }
  662. ///
  663. /// @ingroup ge
  664. /// @brief Get combined dynamic dims info
  665. /// @param [in] model_id
  666. /// @param [out] batch_info
  667. /// @return execute result
  668. ///
  669. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  670. GELOGI("Begin to get combined dynamic dims info.");
  671. if (!isInit_) {
  672. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  673. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  674. return ACL_ERROR_GE_EXEC_NOT_INIT;
  675. }
  676. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  677. if (ret != SUCCESS) {
  678. REPORT_CALL_ERROR("E19999", "Get Combined DynamicDims failed, model id:%u.", model_id);
  679. GELOGE(ret, "[Get][CombinedDynamicDims] failed, model id:%u.", model_id);
  680. return ret;
  681. }
  682. GELOGI("Get combined dynamic dims succ.");
  683. return SUCCESS;
  684. }
  685. ///
  686. /// @ingroup ge
  687. /// @brief Get user designeate shape order
  688. /// @param [in] model_id
  689. /// @param [out] user_designate_shape_order
  690. /// @return execute result
  691. ///
  692. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  693. if (!isInit_) {
  694. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  695. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  696. return ACL_ERROR_GE_EXEC_NOT_INIT;
  697. }
  698. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  699. if (ret != SUCCESS) {
  700. REPORT_CALL_ERROR("E19999", "GetUserDesignateShapeOrder failed, model id:%u.", model_id);
  701. GELOGE(ret, "[Call][GetUserDesignateShapeOrder] failed, model id:%u.", model_id);
  702. return ret;
  703. }
  704. return SUCCESS;
  705. }
  706. ///
  707. /// @ingroup ge
  708. /// @brief Get AIPP input format
  709. /// @param [in] model_id
  710. /// @param [in] index
  711. /// @param [out] input_format
  712. /// @return execute result
  713. ///
  714. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  715. GELOGI("Begin to GetAIPPInfo.");
  716. if (!isInit_) {
  717. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  718. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor not inited yet!");
  719. return ACL_ERROR_GE_EXEC_NOT_INIT;
  720. }
  721. Status ret = GraphExecutor::GetAippInfo(model_id, index, aipp_info);
  722. if (ret != SUCCESS) {
  723. GELOGW("GetAIPPInfo is not success.");
  724. return ret;
  725. }
  726. GELOGI("GetAIPPInfo succ.");
  727. return SUCCESS;
  728. }
  729. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  730. GELOGI("Begin to get aipp type.");
  731. if (!isInit_) {
  732. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  733. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not inited yet!");
  734. return ACL_ERROR_GE_EXEC_NOT_INIT;
  735. }
  736. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  737. if (ret != SUCCESS) {
  738. GELOGW("Get aipp type is not success.");
  739. return ret;
  740. }
  741. GELOGI("Get aipp type success.");
  742. return SUCCESS;
  743. }
  744. Status GeExecutor::GetOpAttr(uint32_t model_id, const std::string &op_name, const std::string &attr_name,
  745. std::string &attr_value) {
  746. GELOGI("Begin to get op attr.");
  747. if (!isInit_) {
  748. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Init][GeExecutor]Ge executor not inited yet!");
  749. REPORT_INNER_ERROR("E19999", "Ge executor not inited yet!");
  750. return ACL_ERROR_GE_EXEC_NOT_INIT;
  751. }
  752. Status ret = GraphExecutor::GetOpAttr(model_id, op_name, attr_name, attr_value);
  753. if (ret != SUCCESS) {
  754. GELOGE(ret, "[Get][OpAttr]Get op:%s attr:%s failed, model id:%u.",
  755. op_name.c_str(), attr_name.c_str(), model_id);
  756. REPORT_CALL_ERROR("E19999", "Get op:%s attr:%s failed, model id:%u",
  757. op_name.c_str(), attr_name.c_str(), model_id);
  758. return ret;
  759. }
  760. return SUCCESS;
  761. }
  762. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  763. if (!isInit_) {
  764. REPORT_INNER_ERROR("E19999", "GeExecutor has not inited yet!");
  765. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not inited yet!");
  766. return ACL_ERROR_GE_EXEC_NOT_INIT;
  767. }
  768. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  769. if (ret != SUCCESS) {
  770. REPORT_CALL_ERROR("E19999", "Get Model Attr failed, model id:%u.", model_id);
  771. GELOGE(ret, "[Get][ModelAttr] failed, model id:%u.", model_id);
  772. return ret;
  773. }
  774. return SUCCESS;
  775. }
  776. Status GeExecutor::CommandHandle(const Command &command) {
  777. Status ret = GraphLoader::CommandHandle(command);
  778. if (ret != SUCCESS) {
  779. REPORT_CALL_ERROR("E19999", "call CommandHandle failed, ret:%u", ret);
  780. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "[Call][CommandHandle] failed, ret:%u", ret);
  781. return ACL_ERROR_GE_COMMAND_HANDLE;
  782. }
  783. return SUCCESS;
  784. }
  785. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  786. GELOGI("Get max used memory begin.");
  787. if (!isInit_) {
  788. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  789. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  790. return ACL_ERROR_GE_EXEC_NOT_INIT;
  791. }
  792. uint64_t max_mem_size = 0;
  793. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  794. max_size = static_cast<uint32_t>(max_mem_size);
  795. return ret;
  796. }
  797. /**
  798. * @ingroup ge
  799. * @brief Load data from model file to memory
  800. * @param [in] const std::string &path: Offline model file path
  801. * @param [out] domi::ModelData &model_data: Offline model memory data
  802. * @return SUCCESS handle successfully / others handle failed
  803. */
  804. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  805. GELOGI("Load data from file begin.");
  806. if (!isInit_) {
  807. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  808. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  809. return ACL_ERROR_GE_EXEC_NOT_INIT;
  810. }
  811. string filePath = RealPath(path.c_str());
  812. if (filePath.empty()) {
  813. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  814. "[Call][RealPath] File path is invalid. please check your text file '%s'.", path.c_str());
  815. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  816. }
  817. GELOGI("load modelData from file: %s.", path.c_str());
  818. int32_t priority = 0;
  819. Status ret = GraphLoader::LoadDataFromFile(path, priority, model_data);
  820. if (ret != SUCCESS) {
  821. if (model_data.model_data != nullptr) {
  822. delete[] static_cast<char *>(model_data.model_data);
  823. model_data.model_data = nullptr;
  824. }
  825. }
  826. return ret;
  827. }
  828. /**
  829. * @ingroup ge
  830. * @brief Load model from offline model memory data
  831. * @param [in] domi::ModelData &model_data: Offline model data
  832. void *dev_ptr: Input/Output memory start address
  833. size_t memsize: Input/Output memory length
  834. void *weight_ptr: Weight memory start address
  835. size_t weightsize: Weight memory length
  836. * @param [out] uint32_t &model_id: identification after model loading
  837. * @return SUCCESS handle successfully / others handle failed
  838. */
  839. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  840. void *weight_ptr, size_t weight_size) {
  841. if (!isInit_) {
  842. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  843. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not inited yet!");
  844. return ACL_ERROR_GE_EXEC_NOT_INIT;
  845. }
  846. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  847. }
  848. /**
  849. * @ingroup ge
  850. * @brief Load task list from ModelData with queue.
  851. * @param [out] model_id: model id allocate from manager.
  852. * @param [in] ge_model_data: Model data load from offline model.
  853. * @param [in] input_queue_ids: input queue ids create from user.
  854. * @param [in] output_queue_ids: input queue ids create from user.
  855. * @return: 0 for success / others for fail
  856. */
  857. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  858. const std::vector<uint32_t> &input_queue_ids,
  859. const std::vector<uint32_t> &output_queue_ids) {
  860. GELOGI("Load model with queue begin.");
  861. if (!isInit_) {
  862. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  863. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  864. return ACL_ERROR_GE_EXEC_NOT_INIT;
  865. }
  866. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  867. }
  868. /**
  869. * @ingroup ge
  870. * @brief Synchronous execution of offline model(Do not create thread)
  871. * @param [in] uint32_t model_id: Model ID to execute
  872. void* stream: stream to execute
  873. const domi::InputData *input_data: Model input data
  874. bool async_mode: is asynchronize mode.
  875. * @param [out] domi::OutputData *output_data: Model output data
  876. * @return SUCCESS handle successfully / others handle failed
  877. */
  878. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  879. ge::RunModelData &run_output_data, bool async_mode) {
  880. std::vector<GeTensorDesc> input_desc = {};
  881. std::vector<GeTensorDesc> output_desc = {};
  882. return ExecModel(model_id, stream, run_input_data, input_desc, run_output_data, output_desc, async_mode);
  883. }
  884. /**
  885. * @ingroup ge
  886. * @brief Synchronous execution of offline model(Do not create thread)
  887. * @param [in] uint32_t model_id: Model ID to execute
  888. void* stream: stream to execute
  889. const domi::InputData *input_data: Model input data
  890. const std::vector<GeTensorDesc> &input_desc: Description of model input data
  891. bool async_mode: is asynchronize mode
  892. * @param [out] domi::OutputData *output_data: Model output data
  893. * @param [out] std::vector<GeTensorDesc> &output_desc: Description of model output data
  894. * @return SUCCESS handle successfully / others handle failed
  895. */
  896. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  897. const std::vector<GeTensorDesc> &input_desc, ge::RunModelData &run_output_data,
  898. std::vector<GeTensorDesc> &output_desc, bool async_mode) {
  899. if (!isInit_) {
  900. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  901. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  902. return ACL_ERROR_GE_EXEC_NOT_INIT;
  903. }
  904. InputData input_data;
  905. OutputData output_data;
  906. GetDomiInputData(run_input_data, input_data);
  907. GetDomiOutputData(run_output_data, output_data);
  908. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  909. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  910. std::vector<std::vector<int64_t>> batch_info;
  911. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  912. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  913. if (ret != SUCCESS) {
  914. REPORT_CALL_ERROR("E19999", "get dynamic batch info failed, model id:%u.", model_id);
  915. GELOGE(ret, "[Get][DynamicBatchInfo] failed, model id:%u.", model_id);
  916. return ret;
  917. }
  918. if (!batch_info.empty()) {
  919. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  920. }
  921. }
  922. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, input_desc, output_data, output_desc);
  923. }
  924. /**
  925. * @ingroup ge
  926. * @brief Get weight memory size from model file
  927. * @param [in] const std::string &path: Offline model file path
  928. * @param [out] size_t &mem_size Execution memory size
  929. size_t &weight_size Weight memory space size
  930. * @return SUCCESS handle successfully / others handle failed
  931. */
  932. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  933. GELOGI("Get memory and weight size from file begin.");
  934. if (!isInit_) {
  935. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  936. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  937. return ACL_ERROR_GE_EXEC_NOT_INIT;
  938. }
  939. ModelData model;
  940. Status ret = ge::GraphLoader::LoadDataFromFile(path, 0, model);
  941. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  942. REPORT_CALL_ERROR("E19999", "load data from file failed, ret = %d", ret);
  943. GELOGE(ret, "[Load][Data] from file failed. ret = %d", ret);
  944. return ret;
  945. }
  946. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  947. delete[] static_cast<char *>(model.model_data);
  948. model.model_data = nullptr;
  949. return ret;
  950. }
  951. /**
  952. * @ingroup ge
  953. * @brief Get weight memory size from model file
  954. * @param [in] const void *model_data Offline model buffer
  955. size_t model_size Offline model buffer length
  956. * @param [out] size_t &mem_size Execution memory size
  957. size_t &weight_size Weight memory space size
  958. * @return SUCCESS handle successfully / others handle failed
  959. */
  960. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  961. size_t &weight_size) {
  962. GELOGI("Get memory and weight size from data begin.");
  963. if (!isInit_) {
  964. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  965. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  966. return ACL_ERROR_GE_EXEC_NOT_INIT;
  967. }
  968. if (model_data == nullptr) {
  969. REPORT_INNER_ERROR("E19999", "param model_data is nullptr, check invalid!");
  970. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "[Check][Param] invalid model data!");
  971. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  972. }
  973. ModelData model;
  974. model.model_data = const_cast<void *>(model_data);
  975. model.model_len = static_cast<uint32_t>(model_size);
  976. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  977. }
  978. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  979. SingleOp **single_op) {
  980. return LoadSingleOpV2(model_name, modelData, stream, single_op, 0);
  981. }
  982. Status GeExecutor::LoadSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  983. SingleOp **single_op, const uint64_t model_id) {
  984. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op, model_id);
  985. }
  986. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  987. DynamicSingleOp **single_op) {
  988. return LoadDynamicSingleOpV2(model_name, modelData, stream, single_op, 0);
  989. }
  990. Status GeExecutor::LoadDynamicSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  991. DynamicSingleOp **single_op, const uint64_t model_id) {
  992. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op, model_id);
  993. }
  994. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  995. std::vector<DataBuffer> &outputs) {
  996. if (executor == nullptr) {
  997. REPORT_INNER_ERROR("E19999", "Param executor is nullptr, check invalid");
  998. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] param executor is nullptr");
  999. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1000. }
  1001. return executor->ExecuteAsync(inputs, outputs);
  1002. }
  1003. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  1004. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  1005. vector<DataBuffer> &outputs) {
  1006. GE_CHECK_NOTNULL(executor);
  1007. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  1008. }
  1009. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  1010. ModelManager::GetInstance()->ClearAicpuSo();
  1011. return SingleOpManager::GetInstance().ReleaseResource(stream);
  1012. }
  1013. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  1014. auto model_manager = ModelManager::GetInstance();
  1015. GE_CHECK_NOTNULL(model_manager);
  1016. auto davinci_model = model_manager->GetModel(model_id);
  1017. if (davinci_model == nullptr) {
  1018. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID,
  1019. "[Get][Model] failed, Model id:%u is invaild or model is not loaded.", model_id);
  1020. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  1021. }
  1022. device_id = davinci_model->GetDeviceId();
  1023. return SUCCESS;
  1024. }
  1025. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  1026. std::vector<std::vector<int64_t>> batch_info;
  1027. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  1028. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  1029. if (ret != SUCCESS) {
  1030. GELOGE(ret, "[Get][DynamicBatchInfo] failed. ret = %d, model id:%u", ret, model_id);
  1031. return ret;
  1032. }
  1033. if (batch_info.empty()) {
  1034. shape_count = kStaticBatchInfoSize;
  1035. } else {
  1036. shape_count = batch_info.size();
  1037. }
  1038. return SUCCESS;
  1039. }
  1040. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  1041. GELOGI("Begin to GetOrigInputInfo.");
  1042. if (!isInit_) {
  1043. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  1044. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  1045. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1046. }
  1047. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  1048. if (ret != SUCCESS) {
  1049. REPORT_CALL_ERROR("E19999", "Get Orig Input Info failed, model id:%u.", model_id);
  1050. GELOGE(ret, "[Get][OrigInputInfo] failed, model id:%u.", model_id);
  1051. return ret;
  1052. }
  1053. GELOGI("GetOrigInputInfo succ.");
  1054. return SUCCESS;
  1055. }
  1056. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  1057. std::vector<InputOutputDims> &input_dims,
  1058. std::vector<InputOutputDims> &output_dims) {
  1059. GELOGI("Begin to GetAllAippInputOutputDims.");
  1060. if (!isInit_) {
  1061. REPORT_INNER_ERROR("E19999", "GeExecutor has not been initialized!");
  1062. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Check][Param] GeExecutor has not been initialized!");
  1063. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1064. }
  1065. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  1066. if (ret != SUCCESS) {
  1067. REPORT_CALL_ERROR("E19999", "Get All Aipp Input Output Dims failed, model id:%u.", model_id);
  1068. GELOGE(ret, "[Get][AllAippInputOutputDims] failed, model id:%u.", model_id);
  1069. return ret;
  1070. }
  1071. GELOGI("GetAllAippInputOutputDims succ.");
  1072. return SUCCESS;
  1073. }
  1074. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  1075. GELOGI("Begin to GetOpDescInfo.");
  1076. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  1077. if (ret != SUCCESS) {
  1078. REPORT_CALL_ERROR("E19999", "get opdesc info failed, device_id:%u, stream_id:%u, task_id:%u.",
  1079. device_id, stream_id, task_id);
  1080. GELOGE(ret, "[Get][OpDescInfo] failed, device_id:%u, stream_id:%u, task_id:%u.",
  1081. device_id, stream_id, task_id);
  1082. return ret;
  1083. }
  1084. GELOGI("GetOpDescInfo succ.");
  1085. return SUCCESS;
  1086. }
  1087. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  1088. GELOGI("Start to set dump config");
  1089. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  1090. if (ret != SUCCESS) {
  1091. GELOGE(ret, "[Set][DumpConf] failed, ret:%d", ret);
  1092. return ret;
  1093. }
  1094. GELOGI("Set dump config successfully");
  1095. return SUCCESS;
  1096. }
  1097. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。