You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ge_executor.cc 42 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802803804805806807808809810811812813814815816817818819820821822823824825826827828829830831832833834835836837838839840841842843844845846847848849850851852853854855856857858859860861862863864865866867868869870871872873874875876877878879880881882883884885886887888889890891892893894895896897898899900901902903904905906907908909910911912913914915916917918919920921922923924925926927928929930931932933934935936937938939940941942943944945946947948949950951952953954955956957958959960961962963964965966967968969970971972973974975976977978979980981982983984985986987988989990991992993994995996997998999100010011002100310041005100610071008100910101011101210131014101510161017101810191020102110221023102410251026102710281029103010311032103310341035103610371038103910401041104210431044104510461047104810491050105110521053105410551056105710581059106010611062106310641065106610671068106910701071107210731074107510761077107810791080108110821083108410851086108710881089109010911092109310941095109610971098109911001101110211031104110511061107
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <ctime>
  19. #include <iostream>
  20. #include "common/debug/log.h"
  21. #include "common/ge/ge_util.h"
  22. #include "common/helper/model_helper.h"
  23. #include "common/profiling/profiling_manager.h"
  24. #include "common/dump/dump_manager.h"
  25. #include "graph/execute/graph_execute.h"
  26. #include "graph/load/graph_loader.h"
  27. #include "graph/load/model_manager/model_manager.h"
  28. #include "graph/manager/graph_mem_manager.h"
  29. #include "single_op/single_op_manager.h"
  30. #include "graph/load/model_manager/davinci_model.h"
  31. #include "opskernel_manager/ops_kernel_builder_manager.h"
  32. #include "graph/opsproto_manager.h"
  33. #include "ge_local_engine/engine/host_cpu_engine.h"
  34. using std::string;
  35. using std::vector;
  36. namespace {
  // Element count a gear entry must have to be treated as a dynamic-batch entry.
  constexpr size_t kDynamicBatchSizeVecSize = 1;
  // Not referenced in the visible part of this file.
  constexpr size_t kStaticBatchInfoSize = 1;
  // Element count a gear entry must have to be treated as a dynamic-image (height, width) entry.
  constexpr size_t kDynamicImageSizeVecSize = 2;
  // Number of values (height and width) written to the device buffer for dynamic image size.
  constexpr size_t kDynamicImageSizeInputSize = 2;
  // Prefix of the batch label; the index of the matched gear is appended to it.
  constexpr const char *kBatchLabel = "Batch_";
  42. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  43. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  44. const std::vector<uint32_t> &formats) {
  45. uint32_t idx = 0;
  46. for (auto desc_item : domi_descs) {
  47. ge::TensorDesc ge_desc;
  48. ge_desc.SetName(desc_item.name.c_str());
  49. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  50. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  51. std::vector<int64_t> shape_dims;
  52. for (auto dim : desc_item.shape_info.dims) {
  53. shape_dims.push_back(dim);
  54. }
  55. ge::Shape ge_shape(shape_dims);
  56. ge_desc.SetShape(ge_shape);
  57. ge_desc.SetSize(desc_item.size);
  58. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  59. ge_descs.emplace_back(ge_desc);
  60. ++idx;
  61. }
  62. }
  63. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  64. inputs.index = input_data.index;
  65. inputs.model_id = input_data.modelId;
  66. inputs.timestamp = input_data.timestamp;
  67. inputs.timeout = input_data.timeout;
  68. inputs.request_id = input_data.request_id;
  69. for (const auto &data_item : input_data.blobs) {
  70. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  71. inputs.blobs.emplace_back(dataBuf);
  72. }
  73. }
  74. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  75. outputs.index = output_data.index;
  76. outputs.model_id = output_data.modelId;
  77. for (const auto &data_item : output_data.blobs) {
  78. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  79. outputs.blobs.emplace_back(dataBuf);
  80. }
  81. }
  82. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  83. ge::InputData &inputs) {
  84. inputs.is_dynamic_batch = true;
  85. std::string batch_label;
  86. size_t match_idx = 0;
  87. for (size_t i = 0; i < batch_info.size(); ++i) {
  88. // dynamic_dims
  89. if (input_data.dynamic_dims.size() != 0) {
  90. bool is_match = true;
  91. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  92. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  93. is_match = false;
  94. break;
  95. }
  96. }
  97. if (is_match) {
  98. match_idx = i;
  99. break;
  100. }
  101. // dynamic_batch_size
  102. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  103. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  104. match_idx = i;
  105. break;
  106. // dynamic_image_size
  107. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  108. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  109. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  110. match_idx = i;
  111. break;
  112. }
  113. }
  114. batch_label = kBatchLabel + std::to_string(match_idx);
  115. inputs.batch_label = batch_label;
  116. GELOGI("current batch label:%s", batch_label.c_str());
  117. }
  118. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  119. if (batch_info.empty()) {
  120. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  121. return false;
  122. }
  123. for (auto batch : batch_info) {
  124. if (batch.size() != kDynamicBatchSizeVecSize) {
  125. GELOGE(ge::FAILED, "Dynamic batch param num is %zu, current batch size is %zu.", kDynamicBatchSizeVecSize,
  126. batch.size());
  127. return false;
  128. }
  129. if (batch[0] == static_cast<int64_t>(batch_size)) {
  130. return true;
  131. }
  132. }
  133. GELOGE(ge::FAILED, "Dynamic batch %lu can not match the gear of model.", batch_size);
  134. return false;
  135. }
  136. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  137. const vector<std::vector<int64_t>> &batch_info) {
  138. if (batch_info.empty()) {
  139. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  140. return false;
  141. }
  142. for (auto resolution : batch_info) {
  143. if (resolution.size() != kDynamicImageSizeVecSize) {
  144. GELOGE(ge::FAILED, "Dynamic resolution param num is %zu, current resolution size is %zu.",
  145. kDynamicImageSizeVecSize, resolution.size());
  146. return false;
  147. }
  148. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  149. return true;
  150. }
  151. }
  152. GELOGE(ge::FAILED, "Dynamic resolution (%lu,%lu) can not match the gear of model.", image_height, image_width);
  153. return false;
  154. }
  155. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims,
  156. const vector<vector<int64_t>> &batch_info) {
  157. if (batch_info.empty()) {
  158. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "Dynamic batch info is empty.");
  159. return false;
  160. }
  161. bool find_match = false;
  162. for (auto resolution : batch_info) {
  163. if (cur_dynamic_dims.size() != resolution.size()) {
  164. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "Cur dynamic dims param num is %zu, current resolution size is %zu.",
  165. cur_dynamic_dims.size(), resolution.size());
  166. return false;
  167. }
  168. bool flag = true;
  169. for (std::size_t i = 0; i < resolution.size(); ++i) {
  170. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  171. flag = false;
  172. break;
  173. }
  174. }
  175. if (flag) {
  176. find_match = true;
  177. break;
  178. }
  179. }
  180. if (!find_match) {
  181. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "choose dynamic dims can not match the gear of model.");
  182. }
  183. return find_match;
  184. }
  185. } // namespace
  186. namespace ge {
  187. bool GeExecutor::isInit_ = false;
  188. static void InitOpsProtoManager() {
  189. string opsproto_path;
  190. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  191. if (path_env != nullptr) {
  192. string path = path_env;
  193. string file_path = RealPath(path.c_str());
  194. if (file_path.empty()) {
  195. GELOGE(FAILED, "[Check][EnvPath]ASCEND_OPP_PATH path [%s] is invalid.", path.c_str());
  196. REPORT_INPUT_ERROR("E68016", {"ASCEND_OPP_PATH", path});
  197. return;
  198. }
  199. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  200. GELOGI("Get opsproto so path from env : %s", path.c_str());
  201. } else {
  202. string path_base = PluginManager::GetPath();
  203. GELOGI("path_base is %s", path_base.c_str());
  204. path_base = path_base.substr(0, path_base.rfind('/'));
  205. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  206. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  207. }
  208. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  209. OpsProtoManager *manager = OpsProtoManager::Instance();
  210. map<string, string> option_tmp;
  211. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  212. (void)manager->Initialize(option_tmp);
  213. }
  214. GeExecutor::GeExecutor() {}
  215. Status GeExecutor::Initialize() {
  216. GELOGI("Init GeExecutor begin.");
  217. if (isInit_) {
  218. GELOGW("Already initialized, no need to be initialized again.");
  219. return ge::SUCCESS;
  220. }
  221. OpTilingManager::GetInstance().LoadSo();
  222. Status init_hostcpu_engine_status = HostCpuEngine::GetInstance().Initialize();
  223. if (init_hostcpu_engine_status != SUCCESS) {
  224. GELOGE(init_hostcpu_engine_status, "Failed to initialize HostCpuEngine");
  225. return init_hostcpu_engine_status;
  226. }
  227. InitOpsProtoManager();
  228. std::vector<rtMemType_t> mem_type(1, RT_MEMORY_HBM);
  229. mem_type.push_back(RT_MEMORY_P2P_DDR);
  230. auto ret = MemManager::Instance().Initialize(mem_type);
  231. if (ret != SUCCESS) {
  232. GELOGE(ret, "Memory Manager init failed.");
  233. return ret;
  234. }
  235. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  236. "Failed to initialize OpsKernelBuilders.");
  237. // Start profiling
  238. Options profiling_options;
  239. profiling_options.device_id = 0;
  240. // job id need to be set, the value is meaningless;
  241. profiling_options.job_id = "1";
  242. ProfilingManager::Instance().Init(profiling_options);
  243. isInit_ = true;
  244. GELOGI("Init GeExecutor over.");
  245. return ge::SUCCESS;
  246. }
  247. Status GeExecutor::Finalize() {
  248. GELOGI("Uninit GeExecutor begin.");
  249. if (isInit_ == false) {
  250. GELOGW("GeExecutor has not been initialized.");
  251. return ge::SUCCESS;
  252. }
  253. (void) OpsKernelBuilderManager::Instance().Finalize();
  254. // Stop profiling
  255. if (ProfilingManager::Instance().ProfilingOn()) {
  256. ProfilingManager::Instance().StopProfiling();
  257. ProfilingManager::Instance().PluginUnInit();
  258. }
  259. GELOGI("Uninit GeExecutor over.");
  260. return ge::SUCCESS;
  261. }
  262. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  263. uint64_t batch_size) {
  264. if (dynamic_input_addr == nullptr) {
  265. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  266. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  267. }
  268. uint64_t size = sizeof(uint32_t);
  269. if (length < size) {
  270. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size [%lu] is less than [%lu]!", length, size);
  271. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  272. }
  273. if (length >= sizeof(uint64_t)) {
  274. size = sizeof(uint64_t);
  275. }
  276. // Verify whether the input dynamic batch matches the model gear
  277. std::vector<std::vector<int64_t>> batch_info;
  278. std::vector<uint64_t> batch_num{batch_size};
  279. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  280. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  281. if (ret != SUCCESS) {
  282. GELOGE(ret, "Get dynamic input info failed.");
  283. return ret;
  284. }
  285. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  286. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  287. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  288. }
  289. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  290. if (ret != SUCCESS) {
  291. GELOGE(ret, "Set dynamic size failed");
  292. return ret;
  293. }
  294. // memcpy dynamic_batch_size from host to device
  295. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  296. if (rt_ret != RT_ERROR_NONE) {
  297. GELOGE(rt_ret, "memcpy dynamic batch input data failed! ret: 0x%X", rt_ret);
  298. return RT_ERROR_TO_GE_STATUS(rt_ret);
  299. }
  300. return SUCCESS;
  301. }
  302. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  303. uint64_t image_height, uint64_t image_width) {
  304. if (dynamic_input_addr == nullptr) {
  305. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  306. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  307. }
  308. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  309. if (length < dynamic_input_size) {
  310. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  311. "Dynamic input size [%lu] is less than [%lu]!", length, dynamic_input_size);
  312. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  313. }
  314. uint64_t size = sizeof(uint32_t);
  315. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  316. size = sizeof(uint64_t);
  317. }
  318. // Verify whether the input dynamic resolution matches the model gear
  319. std::vector<std::vector<int64_t>> batch_info;
  320. std::vector<uint64_t> batch_num{image_height, image_width};
  321. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  322. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  323. if (ret != SUCCESS) {
  324. GELOGE(ret, "Get dynamic input info failed.");
  325. return ret;
  326. }
  327. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  328. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  329. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  330. }
  331. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  332. if (ret != SUCCESS) {
  333. GELOGE(ret, "Set dynamic size failed");
  334. return ret;
  335. }
  336. // Memcpy dynamic resolution height from host to device
  337. rtError_t rt_ret =
  338. rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  339. if (rt_ret != RT_ERROR_NONE) {
  340. GELOGE(rt_ret, "memcpy dynamic resolution input data failed! ret: 0x%X", rt_ret);
  341. return RT_ERROR_TO_GE_STATUS(rt_ret);
  342. }
  343. uint64_t remain_size = length - size;
  344. // Memcpy dynamic resolution width from host to device
  345. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size),
  346. remain_size, &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  347. if (rt_ret != RT_ERROR_NONE) {
  348. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  349. return RT_ERROR_TO_GE_STATUS(rt_ret);
  350. }
  351. return SUCCESS;
  352. }
  353. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  354. const vector<uint64_t> &dynamic_dims) {
  355. if (dynamic_input_addr == nullptr) {
  356. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  357. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  358. }
  359. vector<uint64_t> cur_dynamic_dims;
  360. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  361. if (ret != SUCCESS) {
  362. GELOGE(ret, "Set cur gear dynamic dims failed");
  363. return ret;
  364. }
  365. std::vector<std::vector<int64_t>> batch_info;
  366. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  367. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  368. if (ret != SUCCESS) {
  369. GELOGE(ret, "Get dynamic input info failed.");
  370. return ret;
  371. }
  372. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  373. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  374. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  375. }
  376. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  377. if (ret != SUCCESS) {
  378. GELOGE(ret, "Set dynamic size failed");
  379. return ret;
  380. }
  381. size_t dynamic_dim_num = cur_dynamic_dims.size();
  382. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  383. if (length < dynamic_input_size) {
  384. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  385. "Dynamic input size [%lu] is less than [%lu]!", length, dynamic_input_size);
  386. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  387. }
  388. uint64_t size = sizeof(uint32_t);
  389. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  390. size = sizeof(uint64_t);
  391. }
  392. rtError_t rt_ret;
  393. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  394. // Memcpy dynamic dim[i] from host to device
  395. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  396. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  397. if (rt_ret != RT_ERROR_NONE) {
  398. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  399. return RT_ERROR_TO_GE_STATUS(rt_ret);
  400. }
  401. }
  402. return SUCCESS;
  403. }
  404. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  405. vector<uint64_t> &cur_dynamic_dims) {
  406. cur_dynamic_dims.clear();
  407. vector<ge::TensorDesc> input_desc;
  408. vector<ge::TensorDesc> output_desc;
  409. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  410. if (ret != ge::SUCCESS) {
  411. GELOGE(ret, "GetModelDescInfo failed.");
  412. return ret;
  413. }
  414. vector<string> user_designate_shape_order;
  415. vector<int64_t> all_data_dims;
  416. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  417. if (ret != ge::SUCCESS) {
  418. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  419. return ret;
  420. }
  421. for (auto &data_name : user_designate_shape_order) {
  422. for (auto &desc : input_desc) {
  423. if (desc.GetName() == data_name) {
  424. for (auto dim : desc.GetShape().GetDims()) {
  425. all_data_dims.push_back(dim);
  426. }
  427. break;
  428. }
  429. }
  430. }
  431. if (dynamic_dims.size() != all_data_dims.size()){
  432. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  433. "Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  434. dynamic_dims.size(), all_data_dims.size());
  435. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  436. }
  437. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  438. if (all_data_dims[i] < 0) {
  439. cur_dynamic_dims.push_back(dynamic_dims[i]);
  440. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  441. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  442. "Static dims should be same, index: %zu value: %lu should be %ld",
  443. i, dynamic_dims[i], all_data_dims[i]);
  444. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  445. }
  446. }
  447. return SUCCESS;
  448. }
  449. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  450. GELOGI("Begin to get current shape");
  451. if (!isInit_) {
  452. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  453. return ACL_ERROR_GE_EXEC_NOT_INIT;
  454. }
  455. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  456. if (ret != SUCCESS) {
  457. GELOGE(ret, "Get current shape failed");
  458. return ret;
  459. }
  460. return SUCCESS;
  461. }
  462. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  463. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  464. const kAippDynamicPara &aippParms) {
  465. GELOGI("Enter to SetDynamicAippData.");
  466. if (dynamic_input_addr == nullptr) {
  467. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic aipp input addr is nullptr!");
  468. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  469. }
  470. if (aippBatchPara.empty()) {
  471. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "aippBatchPara is empty.");
  472. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  473. }
  474. uint64_t batch_num = aippBatchPara.size();
  475. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  476. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  477. GELOGI(
  478. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  479. "batch num is %lu, struct_len is %lu",
  480. model_id, length, batch_num, struct_len);
  481. if (struct_len > length) {
  482. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  483. "input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]", struct_len, length);
  484. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  485. }
  486. // Memcpy real kAippDynamicBatchPara from host to device
  487. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  488. if (rt_ret != RT_ERROR_NONE) {
  489. GELOGE(rt_ret, "memcpy real_aippParms_size failed! ret: 0x%X", rt_ret);
  490. return RT_ERROR_TO_GE_STATUS(rt_ret);
  491. }
  492. uint64_t remain_len = length - real_aippParms_size;
  493. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  494. for (uint64_t i = 0; i < batch_num; ++i) {
  495. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  496. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  497. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  498. if (rt_ret != RT_ERROR_NONE) {
  499. GELOGE(rt_ret, "memcpy kAippDynamicBatchPara input data failed! ret: 0x%X", rt_ret);
  500. return RT_ERROR_TO_GE_STATUS(rt_ret);
  501. }
  502. }
  503. return SUCCESS;
  504. }
  505. Status GeExecutor::UnloadModel(uint32_t model_id) {
  506. GELOGD("unload model %u begin.", model_id);
  507. if (!isInit_) {
  508. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  509. return ACL_ERROR_GE_EXEC_NOT_INIT;
  510. }
  511. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  512. if (ret != SUCCESS) {
  513. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  514. return ret;
  515. }
  516. std::shared_ptr<hybrid::HybridDavinciModel> hybrid_davinci_model =
  517. ModelManager::GetInstance()->GetHybridModel(model_id);
  518. if (hybrid_davinci_model != nullptr) {
  519. uint64_t session_id = hybrid_davinci_model->GetSessionId();
  520. VarManagerPool::Instance().RemoveVarManager(session_id);
  521. } else {
  522. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  523. if (davinci_model != nullptr) {
  524. uint64_t session_id = davinci_model->GetSessionId();
  525. VarManagerPool::Instance().RemoveVarManager(session_id);
  526. }
  527. }
  528. ret = GraphLoader::UnloadModel(model_id);
  529. if (ret != SUCCESS) {
  530. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  531. return ret;
  532. }
  533. return SUCCESS;
  534. }
  535. // Get input and output descriptor
  536. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  537. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  538. if (!isInit_) {
  539. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  540. return ACL_ERROR_GE_EXEC_NOT_INIT;
  541. }
  542. std::vector<InputOutputDescInfo> input_desc_infos;
  543. std::vector<InputOutputDescInfo> output_desc_infos;
  544. std::vector<uint32_t> input_formats;
  545. std::vector<uint32_t> output_formats;
  546. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  547. output_formats, new_model_desc);
  548. if (ret != domi::SUCCESS) {
  549. GELOGE(ret, "GetInputOutputDescInfo failed. ret = %u", ret);
  550. return ACL_ERROR_GE_GET_TENSOR_INFO;
  551. }
  552. if (input_formats.size() != input_desc_infos.size()) {
  553. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  554. "input_formats size %zu is not equal to input_desc_infos size %zu.",
  555. input_formats.size(), input_desc_infos.size());
  556. return ACL_ERROR_GE_PARAM_INVALID;
  557. }
  558. if (output_formats.size() != output_desc_infos.size()) {
  559. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "output_formats size %zu is not equal to output_desc_infos size %zu.",
  560. output_formats.size(), output_desc_infos.size());
  561. return ACL_ERROR_GE_PARAM_INVALID;
  562. }
  563. // Transfer data to TensorDesc
  564. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  565. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  566. return ge::SUCCESS;
  567. }
  568. ///
  569. /// @ingroup ge
  570. /// @brief Get dynamic batch_info
  571. /// @param [in] model_id
  572. /// @param [out] batch_info
  573. /// @param [out] dynamic_type
  574. /// @return execute result
  575. ///
  576. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  577. int32_t &dynamic_type) {
  578. if (!isInit_) {
  579. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  580. return ACL_ERROR_GE_EXEC_NOT_INIT;
  581. }
  582. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  583. if (ret != SUCCESS) {
  584. GELOGE(ret, "GetDynamicBatchInfo failed.");
  585. return ret;
  586. }
  587. return SUCCESS;
  588. }
  589. ///
  590. /// @ingroup ge
  591. /// @brief Get combined dynamic dims info
  592. /// @param [in] model_id
  593. /// @param [out] batch_info
  594. /// @return execute result
  595. ///
  596. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  597. GELOGI("Begin to get combined dynamic dims info.");
  598. if (!isInit_) {
  599. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  600. return ACL_ERROR_GE_EXEC_NOT_INIT;
  601. }
  602. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  603. if (ret != SUCCESS) {
  604. GELOGE(ret, "GetCombinedDynamicDims failed.");
  605. return ret;
  606. }
  607. GELOGI("Get combined dynamic dims succ.");
  608. return SUCCESS;
  609. }
  610. ///
  611. /// @ingroup ge
  612. /// @brief Get user designeate shape order
  613. /// @param [in] model_id
  614. /// @param [out] user_designate_shape_order
  615. /// @return execute result
  616. ///
  617. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  618. if (!isInit_) {
  619. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  620. return ACL_ERROR_GE_EXEC_NOT_INIT;
  621. }
  622. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  623. if (ret != SUCCESS) {
  624. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  625. return ret;
  626. }
  627. return SUCCESS;
  628. }
  629. ///
  630. /// @ingroup ge
  631. /// @brief Get AIPP input format
  632. /// @param [in] model_id
  633. /// @param [in] index
  634. /// @param [out] input_format
  635. /// @return execute result
  636. ///
  637. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  638. GELOGI("Begin to GetAIPPInfo.");
  639. if (!isInit_) {
  640. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  641. return ACL_ERROR_GE_EXEC_NOT_INIT;
  642. }
  643. Status ret = GraphExecutor::GetAippInfo(model_id, index, aipp_info);
  644. if (ret != SUCCESS) {
  645. GELOGW("GetAIPPInfo is not success.");
  646. return ret;
  647. }
  648. GELOGI("GetAIPPInfo succ.");
  649. return SUCCESS;
  650. }
  651. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  652. GELOGI("Begin to get aipp type.");
  653. if (!isInit_) {
  654. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  655. return ACL_ERROR_GE_EXEC_NOT_INIT;
  656. }
  657. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  658. if (ret != SUCCESS) {
  659. GELOGW("Get aipp type is not success.");
  660. return ret;
  661. }
  662. GELOGI("Get aipp type success.");
  663. return SUCCESS;
  664. }
  665. Status GeExecutor::GetOpAttr(uint32_t model_id, const std::string &op_name, const std::string &attr_name,
  666. std::string &attr_value) {
  667. GELOGI("Begin to get op attr.");
  668. if (!isInit_) {
  669. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "[Init][GeExecutor]Ge executor not inited yet!");
  670. REPORT_INNER_ERROR("E19999", "Ge executor not inited yet!");
  671. return ACL_ERROR_GE_EXEC_NOT_INIT;
  672. }
  673. Status ret = GraphExecutor::GetOpAttr(model_id, op_name, attr_name, attr_value);
  674. if (ret != SUCCESS) {
  675. GELOGE(ret, "[Get][OpAttr]Get op:%s attr:%s failed.", op_name.c_str(), attr_name.c_str());
  676. REPORT_CALL_ERROR("E19999", "Get op:%s attr:%s failed.", op_name.c_str(), attr_name.c_str());
  677. return ret;
  678. }
  679. return SUCCESS;
  680. }
  681. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  682. if (!isInit_) {
  683. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  684. return ACL_ERROR_GE_EXEC_NOT_INIT;
  685. }
  686. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  687. if (ret != SUCCESS) {
  688. GELOGE(ret, "Get dynamic batch output shape info failed.");
  689. return ret;
  690. }
  691. return SUCCESS;
  692. }
  693. Status GeExecutor::CommandHandle(const Command &command) {
  694. Status ret = GraphLoader::CommandHandle(command);
  695. if (ret != SUCCESS) {
  696. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "CommandHandle: Command Handle failed.");
  697. return ACL_ERROR_GE_COMMAND_HANDLE;
  698. }
  699. return SUCCESS;
  700. }
  701. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  702. GELOGI("Get max used memory begin.");
  703. if (!isInit_) {
  704. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  705. return ACL_ERROR_GE_EXEC_NOT_INIT;
  706. }
  707. uint64_t max_mem_size = 0;
  708. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  709. max_size = static_cast<uint32_t>(max_mem_size);
  710. return ret;
  711. }
  712. /**
  713. * @ingroup ge
  714. * @brief Load data from model file to memory
  715. * @param [in] const std::string &path: Offline model file path
  716. * @param [out] domi::ModelData &model_data: Offline model memory data
  717. * @return SUCCESS handle successfully / others handle failed
  718. */
  719. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  720. GELOGI("Load data from file begin.");
  721. if (!isInit_) {
  722. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  723. return ACL_ERROR_GE_EXEC_NOT_INIT;
  724. }
  725. string filePath = RealPath(path.c_str());
  726. if (filePath.empty()) {
  727. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  728. "File path is invalid. please check your text file '%s'.", path.c_str());
  729. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  730. }
  731. GELOGI("load modelData from file: %s.", path.c_str());
  732. std::string key_path;
  733. int32_t priority = 0;
  734. Status ret = GraphLoader::LoadDataFromFile(path, key_path, priority, model_data);
  735. if (ret != SUCCESS) {
  736. if (model_data.model_data != nullptr) {
  737. delete[] static_cast<char *>(model_data.model_data);
  738. model_data.model_data = nullptr;
  739. }
  740. }
  741. return ret;
  742. }
  743. /**
  744. * @ingroup ge
  745. * @brief Load model from offline model memory data
  746. * @param [in] domi::ModelData &model_data: Offline model data
  747. void *dev_ptr: Input/Output memory start address
  748. size_t memsize: Input/Output memory length
  749. void *weight_ptr: Weight memory start address
  750. size_t weightsize: Weight memory length
  751. * @param [out] uint32_t &model_id: identification after model loading
  752. * @return SUCCESS handle successfully / others handle failed
  753. */
  754. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  755. void *weight_ptr, size_t weight_size) {
  756. if (!isInit_) {
  757. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  758. return ACL_ERROR_GE_EXEC_NOT_INIT;
  759. }
  760. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  761. }
  762. /**
  763. * @ingroup ge
  764. * @brief Load task list from ModelData with queue.
  765. * @param [out] model_id: model id allocate from manager.
  766. * @param [in] ge_model_data: Model data load from offline model.
  767. * @param [in] input_queue_ids: input queue ids create from user.
  768. * @param [in] output_queue_ids: input queue ids create from user.
  769. * @return: 0 for success / others for fail
  770. */
  771. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  772. const std::vector<uint32_t> &input_queue_ids,
  773. const std::vector<uint32_t> &output_queue_ids) {
  774. GELOGI("Load model with queue begin.");
  775. if (!isInit_) {
  776. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  777. return ACL_ERROR_GE_EXEC_NOT_INIT;
  778. }
  779. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  780. }
  781. /**
  782. * @ingroup ge
  783. * @brief Synchronous execution of offline model(Do not create thread)
  784. * @param [in] uint32_t model_id: Model ID to execute
  785. void* stream: stream to execute
  786. const domi::InputData *input_data: Model input data
  787. bool async_mode: is asynchronize mode.
  788. * @param [out] domi::OutputData *output_data: Model output data
  789. * @return SUCCESS handle successfully / others handle failed
  790. */
  791. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  792. ge::RunModelData &run_output_data, bool async_mode) {
  793. std::vector<GeTensorDesc> input_desc = {};
  794. std::vector<GeTensorDesc> output_desc = {};
  795. return ExecModel(model_id, stream, run_input_data, input_desc, run_output_data, output_desc, async_mode);
  796. }
  797. /**
  798. * @ingroup ge
  799. * @brief Synchronous execution of offline model(Do not create thread)
  800. * @param [in] uint32_t model_id: Model ID to execute
  801. void* stream: stream to execute
  802. const domi::InputData *input_data: Model input data
  803. const std::vector<GeTensorDesc> &input_desc: Description of model input data
  804. bool async_mode: is asynchronize mode
  805. * @param [out] domi::OutputData *output_data: Model output data
  806. * @param [out] std::vector<GeTensorDesc> &output_desc: Description of model output data
  807. * @return SUCCESS handle successfully / others handle failed
  808. */
  809. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  810. const std::vector<GeTensorDesc> &input_desc, ge::RunModelData &run_output_data,
  811. std::vector<GeTensorDesc> &output_desc, bool async_mode) {
  812. if (!isInit_) {
  813. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  814. return ACL_ERROR_GE_EXEC_NOT_INIT;
  815. }
  816. InputData input_data;
  817. OutputData output_data;
  818. GetDomiInputData(run_input_data, input_data);
  819. GetDomiOutputData(run_output_data, output_data);
  820. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  821. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  822. std::vector<std::vector<int64_t>> batch_info;
  823. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  824. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  825. if (ret != SUCCESS) {
  826. GELOGE(ret, "Get dynamic input info failed.");
  827. return ret;
  828. }
  829. if (!batch_info.empty()) {
  830. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  831. }
  832. }
  833. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, input_desc, output_data, output_desc);
  834. }
  835. /**
  836. * @ingroup ge
  837. * @brief Get weight memory size from model file
  838. * @param [in] const std::string &path: Offline model file path
  839. * @param [out] size_t &mem_size Execution memory size
  840. size_t &weight_size Weight memory space size
  841. * @return SUCCESS handle successfully / others handle failed
  842. */
  843. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  844. GELOGI("Get memory and weight size from file begin.");
  845. if (!isInit_) {
  846. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  847. return ACL_ERROR_GE_EXEC_NOT_INIT;
  848. }
  849. ModelData model;
  850. std::string key;
  851. Status ret = ge::GraphLoader::LoadDataFromFile(path, key, 0, model);
  852. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  853. GELOGE(ret, "Load data from file failed. ret = %d", ret);
  854. return ret;
  855. }
  856. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  857. delete[] static_cast<char *>(model.model_data);
  858. model.model_data = nullptr;
  859. return ret;
  860. }
  861. /**
  862. * @ingroup ge
  863. * @brief Get weight memory size from model file
  864. * @param [in] const void *model_data Offline model buffer
  865. size_t model_size Offline model buffer length
  866. * @param [out] size_t &mem_size Execution memory size
  867. size_t &weight_size Weight memory space size
  868. * @return SUCCESS handle successfully / others handle failed
  869. */
  870. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  871. size_t &weight_size) {
  872. GELOGI("Get memory and weight size from data begin.");
  873. if (!isInit_) {
  874. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  875. return ACL_ERROR_GE_EXEC_NOT_INIT;
  876. }
  877. if (model_data == nullptr) {
  878. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "invalid model data!");
  879. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  880. }
  881. ModelData model;
  882. model.model_data = const_cast<void *>(model_data);
  883. model.model_len = static_cast<uint32_t>(model_size);
  884. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  885. }
  886. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  887. SingleOp **single_op) {
  888. return LoadSingleOpV2(model_name, modelData, stream, single_op, 0);
  889. }
  890. Status GeExecutor::LoadSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  891. SingleOp **single_op, const uint64_t model_id) {
  892. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op, model_id);
  893. }
  894. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  895. DynamicSingleOp **single_op) {
  896. return LoadDynamicSingleOpV2(model_name, modelData, stream, single_op, 0);
  897. }
  898. Status GeExecutor::LoadDynamicSingleOpV2(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  899. DynamicSingleOp **single_op, const uint64_t model_id) {
  900. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op, model_id);
  901. }
  902. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  903. std::vector<DataBuffer> &outputs) {
  904. if (executor == nullptr) {
  905. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "param is NULL");
  906. return ACL_ERROR_GE_EXEC_NOT_INIT;
  907. }
  908. return executor->ExecuteAsync(inputs, outputs);
  909. }
  910. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  911. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  912. vector<DataBuffer> &outputs) {
  913. GE_CHECK_NOTNULL(executor);
  914. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  915. }
  916. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  917. ModelManager::GetInstance()->ClearAicpuSo();
  918. return SingleOpManager::GetInstance().ReleaseResource(stream);
  919. }
  920. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  921. auto model_manager = ModelManager::GetInstance();
  922. GE_CHECK_NOTNULL(model_manager);
  923. auto davinci_model = model_manager->GetModel(model_id);
  924. if (davinci_model == nullptr) {
  925. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID, "Model id: %d is invaild or model is not loaded.", model_id);
  926. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  927. }
  928. device_id = davinci_model->GetDeviceId();
  929. return SUCCESS;
  930. }
  931. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  932. std::vector<std::vector<int64_t>> batch_info;
  933. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  934. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  935. if (ret != SUCCESS) {
  936. GELOGE(ret, "Calc batch info size failed. ret = %d", ret);
  937. return ret;
  938. }
  939. if (batch_info.empty()) {
  940. shape_count = kStaticBatchInfoSize;
  941. } else {
  942. shape_count = batch_info.size();
  943. }
  944. return SUCCESS;
  945. }
  946. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  947. GELOGI("Begin to GetOrigInputInfo.");
  948. if (!isInit_) {
  949. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  950. return ACL_ERROR_GE_EXEC_NOT_INIT;
  951. }
  952. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  953. if (ret != SUCCESS) {
  954. GELOGE(ret, "GetOrigInputInfo failed.");
  955. return ret;
  956. }
  957. GELOGI("GetOrigInputInfo succ.");
  958. return SUCCESS;
  959. }
  960. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  961. std::vector<InputOutputDims> &input_dims,
  962. std::vector<InputOutputDims> &output_dims) {
  963. GELOGI("Begin to GetAllAippInputOutputDims.");
  964. if (!isInit_) {
  965. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  966. return ACL_ERROR_GE_EXEC_NOT_INIT;
  967. }
  968. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  969. if (ret != SUCCESS) {
  970. GELOGE(ret, "GetAllAippInputOutputDims failed.");
  971. return ret;
  972. }
  973. GELOGI("GetAllAippInputOutputDims succ.");
  974. return SUCCESS;
  975. }
  976. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  977. GELOGI("Begin to GetOpDescInfo.");
  978. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  979. if (ret != SUCCESS) {
  980. GELOGE(ret, "GetOpDescInfo failed.");
  981. return ret;
  982. }
  983. GELOGI("GetOpDescInfo succ.");
  984. return SUCCESS;
  985. }
  986. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  987. GELOGI("Start to set dump config");
  988. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  989. if (ret != SUCCESS) {
  990. GELOGE(ret, "Set dump conf failed");
  991. return ret;
  992. }
  993. GELOGI("Set dump config successfully");
  994. return SUCCESS;
  995. }
  996. } // namespace ge

图引擎模块（GE）是MindSpore的一个子模块，其代码由C++实现，位于前端模块ME和底层硬件之间，起到承接作用。图引擎模块以ME下发的图作为输入，然后进行一系列的深度图优化操作，最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点，做了特定的优化工作，以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时，GE会被自动调用，用户对此并无感知。GE主要由GE API和GE Core两部分组成，详细的架构图如下所示：