You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

ge_executor.cc 45 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
4 years ago
5 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
370470570670770870971071171271371471571671771871972072172272372472572672772872973073173273373473573673773873974074174274374474574674774874975075175275375475575675775875976076176276376476576676776876977077177277377477577677777877978078178278378478578678778878979079179279379479579679779879980080180280380480580680780880981081181281381481581681781881982082182282382482582682782882983083183283383483583683783883984084184284384484584684784884985085185285385485585685785885986086186286386486586686786886987087187287387487587687787887988088188288388488588688788888989089189289389489589689789889990090190290390490590690790890991091191291391491591691791891992092192292392492592692792892993093193293393493593693793893994094194294394494594694794894995095195295395495595695795895996096196296396496596696796896997097197297397497597697797897998098198298398498598698798898999099199299399499599699799899910001001100210031004100510061007100810091010101110121013101410151016101710181019102010211022102310241025102610271028102910301031103210331034103510361037103810391040104110421043104410451046104710481049105010511052105310541055105610571058105910601061106210631064106510661067106810691070107110721073107410751076107710781079108010811082108310841085108610871088108910901091109210931094109510961097109810991100110111021103110411051106110711081109111011111112111311141115111611171118111911201121112211231124112511261127112811291130113111321133113411351136113711381139114011411142114311441145114611471148114911501151115211531154115511561157115811591160116111621163116411651166116711681169117011711172117311741175117611771178117911801181118211831184118511861187118811891190119111921193119411951196119711981199120012011202120312041205
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include "executor/ge_executor.h"
  17. #include <cce/cce.h>
  18. #include <cce/compiler_stub.h>
  19. #include <ctime>
  20. #include <iostream>
  21. #include "common/debug/log.h"
  22. #include "common/ge/ge_util.h"
  23. #include "common/helper/model_helper.h"
  24. #include "common/profiling/profiling_manager.h"
  25. #include "common/dump/dump_manager.h"
  26. #include "common/util.h"
  27. #include "framework/common/debug/ge_log.h"
  28. #include "framework/common/util.h"
  29. #include "graph/execute/graph_execute.h"
  30. #include "graph/load/graph_loader.h"
  31. #include "graph/load/new_model_manager/davinci_model_parser.h"
  32. #include "graph/load/new_model_manager/model_manager.h"
  33. #include "graph/manager/graph_mem_allocator.h"
  34. #include "graph/model.h"
  35. #include "graph/utils/graph_utils.h"
  36. #include "mmpa/mmpa_api.h"
  37. #include "single_op/single_op_manager.h"
  38. #include "graph/manager/graph_var_manager.h"
  39. #include "graph/load/new_model_manager/davinci_model.h"
  40. #include "opskernel_manager/ops_kernel_builder_manager.h"
  41. #include "graph/opsproto_manager.h"
  42. #include "ge_local_engine/engine/host_cpu_engine.h"
  43. using std::string;
  44. using std::vector;
  45. namespace {
  // Number of values in one gear entry of a dynamic-batch model (the batch size only).
  constexpr size_t kDynamicBatchSizeVecSize = 1;
  // NOTE(review): not referenced in the visible part of this file.
  constexpr size_t kStaticBatchInfoSize = 1;
  // Number of values in one gear entry of a dynamic-image-size model (height, width).
  constexpr size_t kDynamicImageSizeVecSize = 2;
  // Number of values (height and width) SetDynamicImageSize writes to the device buffer.
  constexpr size_t kDynamicImageSizeInputSize = 2;
  // Prefix of the batch label; the index of the matched gear is appended to it.
  constexpr const char *kBatchLabel = "Batch_";
  51. void GetGeTensorDescFromDomiInfo(std::vector<ge::TensorDesc> &ge_descs,
  52. const std::vector<ge::InputOutputDescInfo> &domi_descs,
  53. const std::vector<uint32_t> &formats) {
  54. uint32_t idx = 0;
  55. for (auto desc_item : domi_descs) {
  56. ge::TensorDesc ge_desc;
  57. ge_desc.SetName(desc_item.name);
  58. ge_desc.SetDataType(static_cast<ge::DataType>(desc_item.data_type));
  59. ge_desc.SetFormat(static_cast<ge::Format>(formats[idx]));
  60. std::vector<int64_t> shape_dims;
  61. for (auto dim : desc_item.shape_info.dims) {
  62. shape_dims.push_back(dim);
  63. }
  64. ge::Shape ge_shape(shape_dims);
  65. ge_desc.SetShape(ge_shape);
  66. ge_desc.SetSize(desc_item.size);
  67. ge_desc.SetShapeRange(desc_item.shape_info.shape_ranges);
  68. ge_descs.emplace_back(ge_desc);
  69. ++idx;
  70. }
  71. }
  72. void GetDomiInputData(const ge::RunModelData &input_data, ge::InputData &inputs) {
  73. inputs.index = input_data.index;
  74. inputs.model_id = input_data.modelId;
  75. inputs.timestamp = input_data.timestamp;
  76. inputs.timeout = input_data.timeout;
  77. inputs.request_id = input_data.request_id;
  78. for (const auto &data_item : input_data.blobs) {
  79. ge::DataBuffer dataBuf{data_item.data, data_item.length, data_item.isDataSupportMemShare};
  80. inputs.blobs.emplace_back(dataBuf);
  81. }
  82. }
  83. void GetDomiOutputData(const ge::RunModelData &output_data, ge::OutputData &outputs) {
  84. outputs.index = output_data.index;
  85. outputs.model_id = output_data.modelId;
  86. for (const auto &data_item : output_data.blobs) {
  87. ge::DataBuffer dataBuf(data_item.data, data_item.length, data_item.isDataSupportMemShare);
  88. outputs.blobs.emplace_back(dataBuf);
  89. }
  90. }
  91. void SetDynamicInputDataFlag(const ge::RunModelData &input_data, const std::vector<std::vector<int64_t>> batch_info,
  92. ge::InputData &inputs) {
  93. inputs.is_dynamic_batch = true;
  94. std::string batch_label;
  95. size_t match_idx = 0;
  96. for (size_t i = 0; i < batch_info.size(); ++i) {
  97. // dynamic_dims
  98. if (input_data.dynamic_dims.size() != 0) {
  99. bool is_match = true;
  100. for (size_t j = 0; j < static_cast<size_t>(input_data.dynamic_dims.size()); ++j) {
  101. if (static_cast<uint64_t>(batch_info[i][j]) != input_data.dynamic_dims[j]) {
  102. is_match = false;
  103. break;
  104. }
  105. }
  106. if (is_match) {
  107. match_idx = i;
  108. break;
  109. }
  110. // dynamic_batch_size
  111. } else if (batch_info[i].size() == kDynamicBatchSizeVecSize &&
  112. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_batch_size)) {
  113. match_idx = i;
  114. break;
  115. // dynamic_image_size
  116. } else if (batch_info[i].size() == kDynamicImageSizeVecSize &&
  117. batch_info[i][0] == static_cast<int64_t>(input_data.dynamic_image_height) &&
  118. batch_info[i][1] == static_cast<int64_t>(input_data.dynamic_image_width)) {
  119. match_idx = i;
  120. break;
  121. }
  122. }
  123. batch_label = kBatchLabel + std::to_string(match_idx);
  124. inputs.batch_label = batch_label;
  125. GELOGI("current batch label:%s", batch_label.c_str());
  126. }
  127. bool IsDynamicBatchSizeMatchModel(uint64_t batch_size, const vector<std::vector<int64_t>> &batch_info) {
  128. if (batch_info.empty()) {
  129. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  130. return false;
  131. }
  132. for (auto batch : batch_info) {
  133. if (batch.size() != kDynamicBatchSizeVecSize) {
  134. GELOGE(ge::FAILED, "Dynamic batch param num is %zu, current batch size is %zu.", kDynamicBatchSizeVecSize,
  135. batch.size());
  136. return false;
  137. }
  138. if (batch[0] == static_cast<int64_t>(batch_size)) {
  139. return true;
  140. }
  141. }
  142. GELOGE(ge::FAILED, "Dynamic batch %lu can not match the gear of model.", batch_size);
  143. return false;
  144. }
  145. bool IsDynamicImageSizeMatchModel(uint64_t image_height, uint64_t image_width,
  146. const vector<std::vector<int64_t>> &batch_info) {
  147. if (batch_info.empty()) {
  148. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  149. return false;
  150. }
  151. for (auto resolution : batch_info) {
  152. if (resolution.size() != kDynamicImageSizeVecSize) {
  153. GELOGE(ge::FAILED, "Dynamic resolution param num is %zu, current resolution size is %zu.",
  154. kDynamicImageSizeVecSize, resolution.size());
  155. return false;
  156. }
  157. if (resolution[0] == static_cast<int64_t>(image_height) && resolution[1] == static_cast<int64_t>(image_width)) {
  158. return true;
  159. }
  160. }
  161. GELOGE(ge::FAILED, "Dynamic resolution (%lu,%lu) can not match the gear of model.", image_height, image_width);
  162. return false;
  163. }
  164. bool IsDynmaicDimsSizeMatchModel(const vector<uint64_t> cur_dynamic_dims,
  165. const vector<vector<int64_t>> &batch_info) {
  166. if (batch_info.empty()) {
  167. GELOGE(ge::FAILED, "Dynamic batch info is empty.");
  168. return false;
  169. }
  170. bool find_match = false;
  171. for (auto resolution : batch_info) {
  172. if (cur_dynamic_dims.size() != resolution.size()) {
  173. GELOGE(ge::FAILED, "Cur dynamic dims param num is %zu, current resolution size is %zu.",
  174. cur_dynamic_dims.size(), resolution.size());
  175. return false;
  176. }
  177. bool flag = true;
  178. for (std::size_t i = 0; i < resolution.size(); ++i) {
  179. if (cur_dynamic_dims[i] != static_cast<uint64_t>(resolution[i])) {
  180. flag = false;
  181. break;
  182. }
  183. }
  184. if (flag) {
  185. find_match = true;
  186. break;
  187. }
  188. }
  189. if (!find_match) {
  190. GELOGE(ge::FAILED, "choose dynamic dims can not match the gear of model.");
  191. }
  192. return find_match;
  193. }
  194. } // namespace
  195. namespace ge {
  196. bool GeExecutor::isInit_ = false;
  197. class ModelListenerAdapter : public ModelListener {
  198. public:
  199. domi::Status OnComputeDone(uint32_t model_id, uint32_t dataIndex, uint32_t resultCode,
  200. std::vector<ge::OutputTensorInfo> &outputs) {
  201. if (listener == nullptr) {
  202. GELOGE(ge::FAILED, "listener is null.");
  203. return FAILED;
  204. }
  205. return listener->OnComputeDone(model_id, dataIndex, resultCode, outputs);
  206. }
  207. std::shared_ptr<ge::ModelListener> listener;
  208. };
  209. static void InitOpsProtoManger() {
  210. string opsproto_path;
  211. const char *path_env = std::getenv("ASCEND_OPP_PATH");
  212. if (path_env != nullptr) {
  213. string path = path_env;
  214. string file_path = RealPath(path.c_str());
  215. if (file_path.empty()) {
  216. GELOGE(FAILED, "File path %s is invalid.", path.c_str());
  217. return;
  218. }
  219. opsproto_path = (path + "/op_proto/custom/" + ":") + (path + "/op_proto/built-in/");
  220. GELOGI("Get opsproto so path from env : %s", path.c_str());
  221. } else {
  222. string path_base = PluginManager::GetPath();
  223. GELOGI("path_base is %s", path_base.c_str());
  224. path_base = path_base.substr(0, path_base.rfind('/'));
  225. path_base = path_base.substr(0, path_base.rfind('/') + 1);
  226. opsproto_path = (path_base + "ops/op_proto/custom/" + ":") + (path_base + "ops/op_proto/built-in/");
  227. }
  228. GELOGI("Get opsproto path is %s", opsproto_path.c_str());
  229. OpsProtoManager *manager = OpsProtoManager::Instance();
  230. map<string, string> option_tmp;
  231. option_tmp.emplace(std::pair<string, string>(string("ge.opsProtoLibPath"), opsproto_path));
  232. (void)manager->Initialize(option_tmp);
  233. }
  234. GeExecutor::GeExecutor() {}
  235. Status GeExecutor::Initialize() {
  236. GELOGI("Init GeExecutor begin.");
  237. if (isInit_) {
  238. GELOGW("Already initialized, no need to be initialized again.");
  239. return ge::SUCCESS;
  240. }
  241. OpTilingManager::GetInstance().LoadSo();
  242. Status initHostCpuEngineStatus = HostCpuEngine::GetInstance().Initialize();
  243. if (initHostCpuEngineStatus != SUCCESS) {
  244. GELOGE(initHostCpuEngineStatus, "Failed to initialize HostCpuEngine");
  245. return initHostCpuEngineStatus;
  246. }
  247. InitOpsProtoManger();
  248. std::vector<rtMemType_t> mem_type(1, RT_MEMORY_HBM);
  249. mem_type.push_back(RT_MEMORY_P2P_DDR);
  250. auto ret = MemManager::Instance().Initialize(mem_type);
  251. if (ret != SUCCESS) {
  252. GELOGE(ret, "Memory Manager init failed.");
  253. return ret;
  254. }
  255. GE_CHK_STATUS_RET(OpsKernelBuilderManager::Instance().Initialize({}, false),
  256. "Failed to initialize OpsKernelBuilders");
  257. // Start profiling
  258. Options profiling_options;
  259. profiling_options.device_id = 0;
  260. profiling_options.job_id = "1";
  261. ProfilingManager::Instance().Init(profiling_options);
  262. isInit_ = true;
  263. GELOGI("Init GeExecutor over.");
  264. return ge::SUCCESS;
  265. }
  266. Status GeExecutor::Finalize() {
  267. GELOGI("Uninit GeExecutor begin.");
  268. if (isInit_ == false) {
  269. GELOGW("GeExecutor has not been initialized.");
  270. return ge::SUCCESS;
  271. }
  272. (void) OpsKernelBuilderManager::Instance().Finalize();
  273. // Stop profiling
  274. if (ProfilingManager::Instance().ProfilingOn()) {
  275. ProfilingManager::Instance().StopProfiling();
  276. ProfilingManager::Instance().PluginUnInit(GE_PROFILING_MODULE);
  277. }
  278. GELOGI("Uninit GeExecutor over.");
  279. return ge::SUCCESS;
  280. }
  281. Status GeExecutor::SetDynamicBatchSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  282. uint64_t batch_size) {
  283. if (dynamic_input_addr == nullptr) {
  284. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  285. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  286. }
  287. uint64_t size = sizeof(uint32_t);
  288. if (length < size) {
  289. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Dynamic input size [%lu] is less than [%lu]!", length, size);
  290. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  291. }
  292. if (length >= sizeof(uint64_t)) {
  293. size = sizeof(uint64_t);
  294. }
  295. // Verify whether the input dynamic batch matches the model gear
  296. std::vector<std::vector<int64_t>> batch_info;
  297. std::vector<uint64_t> batch_num{batch_size};
  298. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  299. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  300. if (ret != SUCCESS) {
  301. GELOGE(ret, "Get dynamic input info failed.");
  302. return ret;
  303. }
  304. if (!IsDynamicBatchSizeMatchModel(batch_size, batch_info)) {
  305. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  306. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  307. }
  308. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_BATCH));
  309. if (ret != SUCCESS) {
  310. GELOGE(ret, "Set dynamic size failed");
  311. return ret;
  312. }
  313. // memcpy dynamic_batch_size from host to device
  314. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &batch_size, size, RT_MEMCPY_HOST_TO_DEVICE);
  315. if (rt_ret != RT_ERROR_NONE) {
  316. GELOGE(rt_ret, "memcpy dynamic batch input data failed! ret: 0x%X", rt_ret);
  317. return RT_ERROR_TO_GE_STATUS(rt_ret);
  318. }
  319. return SUCCESS;
  320. }
  321. Status GeExecutor::SetDynamicImageSize(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  322. uint64_t image_height, uint64_t image_width) {
  323. if (dynamic_input_addr == nullptr) {
  324. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  325. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  326. }
  327. uint64_t dynamic_input_size = kDynamicImageSizeInputSize * sizeof(uint32_t);
  328. if (length < dynamic_input_size) {
  329. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  330. "Dynamic input size [%lu] is less than [%lu]!", length, dynamic_input_size);
  331. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  332. }
  333. uint64_t size = sizeof(uint32_t);
  334. if (length >= kDynamicImageSizeInputSize * sizeof(uint64_t)) {
  335. size = sizeof(uint64_t);
  336. }
  337. // Verify whether the input dynamic resolution matches the model gear
  338. std::vector<std::vector<int64_t>> batch_info;
  339. std::vector<uint64_t> batch_num{image_height, image_width};
  340. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  341. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  342. if (ret != SUCCESS) {
  343. GELOGE(ret, "Get dynamic input info failed.");
  344. return ret;
  345. }
  346. if (!IsDynamicImageSizeMatchModel(image_height, image_width, batch_info)) {
  347. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  348. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  349. }
  350. ret = GraphExecutor::SetDynamicSize(model_id, batch_num, static_cast<int32_t>(DYNAMIC_IMAGE));
  351. if (ret != SUCCESS) {
  352. GELOGE(ret, "Set dynamic size failed");
  353. return ret;
  354. }
  355. // Memcpy dynamic resolution height from host to device
  356. rtError_t rt_ret =
  357. rtMemcpy(dynamic_input_addr, size, &image_height, size, RT_MEMCPY_HOST_TO_DEVICE);
  358. if (rt_ret != RT_ERROR_NONE) {
  359. GELOGE(rt_ret, "memcpy dynamic resolution input data failed! ret: 0x%X", rt_ret);
  360. return RT_ERROR_TO_GE_STATUS(rt_ret);
  361. }
  362. uint64_t remain_size = length - size;
  363. // Memcpy dynamic resolution width from host to device
  364. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size),
  365. remain_size, &image_width, size, RT_MEMCPY_HOST_TO_DEVICE);
  366. if (rt_ret != RT_ERROR_NONE) {
  367. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  368. return RT_ERROR_TO_GE_STATUS(rt_ret);
  369. }
  370. return SUCCESS;
  371. }
  372. Status GeExecutor::SetDynamicDims(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  373. const vector<uint64_t> &dynamic_dims) {
  374. if (dynamic_input_addr == nullptr) {
  375. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic input addr is nullptr!");
  376. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  377. }
  378. vector<uint64_t> cur_dynamic_dims;
  379. Status ret = GetCurDynamicDims(model_id, dynamic_dims, cur_dynamic_dims);
  380. if (ret != SUCCESS) {
  381. GELOGE(ret, "Set cur gear dynamic dims failed");
  382. return ret;
  383. }
  384. std::vector<std::vector<int64_t>> batch_info;
  385. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  386. ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  387. if (ret != SUCCESS) {
  388. GELOGE(ret, "Get dynamic input info failed.");
  389. return ret;
  390. }
  391. if (!IsDynmaicDimsSizeMatchModel(cur_dynamic_dims, batch_info)) {
  392. GELOGE(ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID, "The current dynamic input does not match the gear of the model.");
  393. return ACL_ERROR_GE_DYNAMIC_BATCH_SIZE_INVALID;
  394. }
  395. ret = GraphExecutor::SetDynamicSize(model_id, cur_dynamic_dims, static_cast<int32_t>(DYNAMIC_DIMS));
  396. if (ret != SUCCESS) {
  397. GELOGE(ret, "Set dynamic size failed");
  398. return ret;
  399. }
  400. size_t dynamic_dim_num = cur_dynamic_dims.size();
  401. uint64_t dynamic_input_size = static_cast<uint64_t>(dynamic_dim_num * sizeof(uint32_t));
  402. if (length < dynamic_input_size) {
  403. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  404. "Dynamic input size [%lu] is less than [%lu]!", length, dynamic_input_size);
  405. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  406. }
  407. uint64_t size = sizeof(uint32_t);
  408. if (length >= dynamic_dim_num * sizeof(uint64_t)) {
  409. size = sizeof(uint64_t);
  410. }
  411. rtError_t rt_ret;
  412. for (uint32_t i = 0; i < dynamic_dim_num; ++i) {
  413. // Memcpy dynamic dim[i] from host to device
  414. rt_ret = rtMemcpy(reinterpret_cast<void *>(reinterpret_cast<uint8_t *>(dynamic_input_addr) + size * i),
  415. length - size * i, &cur_dynamic_dims[i], size, RT_MEMCPY_HOST_TO_DEVICE);
  416. if (rt_ret != RT_ERROR_NONE) {
  417. GELOGE(rt_ret, "memcpy dynamic resolution input data failed!");
  418. return RT_ERROR_TO_GE_STATUS(rt_ret);
  419. }
  420. }
  421. return SUCCESS;
  422. }
  423. Status GeExecutor::GetCurDynamicDims(uint32_t model_id, const vector<uint64_t> &dynamic_dims,
  424. vector<uint64_t> &cur_dynamic_dims) {
  425. cur_dynamic_dims.clear();
  426. vector<ge::TensorDesc> input_desc;
  427. vector<ge::TensorDesc> output_desc;
  428. auto ret = GetModelDescInfo(model_id, input_desc, output_desc);
  429. if (ret != ge::SUCCESS) {
  430. GELOGE(ret, "GetModelDescInfo failed.");
  431. return ret;
  432. }
  433. vector<string> user_designate_shape_order;
  434. vector<int64_t> all_data_dims;
  435. ret = GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  436. if (ret != ge::SUCCESS) {
  437. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  438. return ret;
  439. }
  440. for (auto &data_name : user_designate_shape_order) {
  441. for (auto &desc : input_desc) {
  442. if (desc.GetName() == data_name) {
  443. for (auto dim : desc.GetShape().GetDims()) {
  444. all_data_dims.push_back(dim);
  445. }
  446. break;
  447. }
  448. }
  449. }
  450. if (dynamic_dims.size() != all_data_dims.size()){
  451. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  452. "Dynamic input size [%lu] is not equal with all data dims size [%lu]!",
  453. dynamic_dims.size(), all_data_dims.size());
  454. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  455. }
  456. for (std::size_t i = 0; i < all_data_dims.size(); ++i) {
  457. if (all_data_dims[i] < 0) {
  458. cur_dynamic_dims.push_back(dynamic_dims[i]);
  459. } else if (static_cast<uint64_t>(all_data_dims[i]) != dynamic_dims[i]) {
  460. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID, "Static dims should be same, index: %zu value: %d should be %d",
  461. i, dynamic_dims[i], all_data_dims[i]);
  462. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  463. }
  464. }
  465. return SUCCESS;
  466. }
  467. Status GeExecutor::GetCurShape(const uint32_t model_id, std::vector<int64_t> &batch_info, int32_t &dynamic_type) {
  468. GELOGI("Begin to get current shape");
  469. if (!isInit_) {
  470. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  471. return ACL_ERROR_GE_EXEC_NOT_INIT;
  472. }
  473. Status ret = GraphExecutor::GetCurShape(model_id, batch_info, dynamic_type);
  474. if (ret != SUCCESS) {
  475. GELOGE(ret, "Get current shape failed");
  476. return ret;
  477. }
  478. return SUCCESS;
  479. }
  480. Status GeExecutor::SetDynamicAippData(uint32_t model_id, void *dynamic_input_addr, uint64_t length,
  481. const std::vector<kAippDynamicBatchPara> &aippBatchPara,
  482. const kAippDynamicPara &aippParms) {
  483. GELOGI("Enter to SetDynamicAippData.");
  484. if (dynamic_input_addr == nullptr) {
  485. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID, "Dynamic aipp input addr is nullptr!");
  486. return ACL_ERROR_GE_DYNAMIC_INPUT_ADDR_INVALID;
  487. }
  488. if (aippBatchPara.empty()) {
  489. GELOGE(ACL_ERROR_GE_AIPP_BATCH_EMPTY, "aippBatchPara is empty.");
  490. return ACL_ERROR_GE_AIPP_BATCH_EMPTY;
  491. }
  492. uint64_t batch_num = aippBatchPara.size();
  493. uint64_t real_aippParms_size = sizeof(kAippDynamicPara) - sizeof(kAippDynamicBatchPara);
  494. uint64_t struct_len = batch_num * sizeof(kAippDynamicBatchPara) + real_aippParms_size;
  495. GELOGI(
  496. "Get acl input dynamic aipp data, model_id is %u, length is %lu,"
  497. "batch num is %lu, struct_len is %lu",
  498. model_id, length, batch_num, struct_len);
  499. if (struct_len > length) {
  500. GELOGE(ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID,
  501. "input dynamic aipp param len [%lu] is larger than aipp_data size [%lu]", struct_len, length);
  502. return ACL_ERROR_GE_DYNAMIC_INPUT_LENGTH_INVALID;
  503. }
  504. // Memcpy real kAippDynamicBatchPara from host to device
  505. rtError_t rt_ret = rtMemcpy(dynamic_input_addr, length, &aippParms, real_aippParms_size, RT_MEMCPY_HOST_TO_DEVICE);
  506. if (rt_ret != RT_ERROR_NONE) {
  507. GELOGE(rt_ret, "memcpy real_aippParms_size failed! ret: 0x%X", rt_ret);
  508. return RT_ERROR_TO_GE_STATUS(rt_ret);
  509. }
  510. uint64_t remain_len = length - real_aippParms_size;
  511. uint8_t *aipp_batch_para_dev = reinterpret_cast<uint8_t *>(dynamic_input_addr) + real_aippParms_size;
  512. for (uint64_t i = 0; i < batch_num; ++i) {
  513. rt_ret = rtMemcpy(reinterpret_cast<void *>(aipp_batch_para_dev + i * sizeof(kAippDynamicBatchPara)),
  514. (remain_len - i * sizeof(kAippDynamicBatchPara)), &(aippBatchPara[i]),
  515. sizeof(kAippDynamicBatchPara), RT_MEMCPY_HOST_TO_DEVICE);
  516. if (rt_ret != RT_ERROR_NONE) {
  517. GELOGE(rt_ret, "memcpy kAippDynamicBatchPara input data failed! ret: 0x%X", rt_ret);
  518. return RT_ERROR_TO_GE_STATUS(rt_ret);
  519. }
  520. }
  521. return SUCCESS;
  522. }
  523. // Load model
  524. Status GeExecutor::LoadModelOffline(uint32_t &model_id, const std::string &path, const std::string &key,
  525. int32_t priority, std::shared_ptr<ge::ModelListener> listener) {
  526. GELOGI("load model offline begin.");
  527. if (!isInit_) {
  528. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  529. return ACL_ERROR_GE_EXEC_NOT_INIT;
  530. }
  531. string filePath = RealPath(path.c_str());
  532. if (filePath.empty()) {
  533. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  534. "File path is invalid. please check your text file '%s'.", path.c_str());
  535. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  536. }
  537. std::shared_ptr<ModelListenerAdapter> listener_adapter = MakeShared<ModelListenerAdapter>();
  538. if (listener_adapter == nullptr) {
  539. GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "ModelListenerAdapter make shared failed!");
  540. return ACL_ERROR_GE_MEMORY_ALLOCATION;
  541. }
  542. listener_adapter->listener = listener;
  543. Status ret = GraphLoader::LoadModelFromFile(path, key, priority, listener_adapter, model_id);
  544. if (ret != SUCCESS) {
  545. GELOGE(ret, "[GeExecutor] LoadModelFromFile failed");
  546. return ACL_ERROR_GE_LOAD_MODEL;
  547. }
  548. return SUCCESS;
  549. }
  550. Status GeExecutor::LoadModel(uint32_t &model_id, const ModelData &model_data,
  551. std::shared_ptr<ge::ModelListener> listener) {
  552. GELOGI("Load model begin.");
  553. if (!isInit_) {
  554. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  555. return ACL_ERROR_GE_EXEC_NOT_INIT;
  556. }
  557. std::shared_ptr<ModelListenerAdapter> listener_adapter = MakeShared<ModelListenerAdapter>();
  558. if (listener_adapter == nullptr) {
  559. GELOGE(ACL_ERROR_GE_MEMORY_ALLOCATION, "ModelListenerAdapter make shared failed!");
  560. return ACL_ERROR_GE_MEMORY_ALLOCATION;
  561. }
  562. listener_adapter->listener = listener;
  563. Status ret = GraphLoader::LoadModel(model_data, listener_adapter, model_id);
  564. if (ret != SUCCESS) {
  565. GELOGE(ret, "[GeExecutor] LoadModel failed.");
  566. return ACL_ERROR_GE_LOAD_MODEL;
  567. }
  568. return ret;
  569. }
  570. Status GeExecutor::UnloadModel(uint32_t model_id) {
  571. GELOGD("unload model %u begin.", model_id);
  572. if (!isInit_) {
  573. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  574. return ACL_ERROR_GE_EXEC_NOT_INIT;
  575. }
  576. Status ret = GraphLoader::DestroyAicpuSessionForInfer(model_id);
  577. if (ret != SUCCESS) {
  578. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  579. return ACL_ERROR_GE_INTERNAL_ERROR;
  580. }
  581. std::shared_ptr<hybrid::HybridDavinciModel> hybrid_davinci_model = ModelManager::GetInstance()->GetHybridModel(model_id);
  582. if (hybrid_davinci_model != nullptr) {
  583. uint64_t session_id = hybrid_davinci_model->GetSessionId();
  584. VarManagerPool::Instance().RemoveVarManager(session_id);
  585. } else {
  586. std::shared_ptr<DavinciModel> davinci_model = ModelManager::GetInstance()->GetModel(model_id);
  587. if (davinci_model != nullptr) {
  588. uint64_t session_id = davinci_model->GetSessionId();
  589. VarManagerPool::Instance().RemoveVarManager(session_id);
  590. }
  591. }
  592. ret = GraphLoader::UnloadModel(model_id);
  593. if (ret != SUCCESS) {
  594. GELOGE(ret, "[GraphLoader] DestroyAicpuSessionForInfer failed. model id: %u", model_id);
  595. return ACL_ERROR_GE_UNLOAD_MODEL;
  596. }
  597. return SUCCESS;
  598. }
  599. Status GeExecutor::RunModel(const ge::RunModelData &input_data, ge::RunModelData &output_data) {
  600. GELOGI("run model begin.");
  601. if (!isInit_) {
  602. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  603. return ACL_ERROR_GE_EXEC_NOT_INIT;
  604. }
  605. InputData inputs;
  606. GetDomiInputData(input_data, inputs);
  607. OutputData outputs;
  608. GetDomiOutputData(output_data, outputs);
  609. return GraphExecutor::DataInput(inputs, outputs);
  610. }
  611. // Get input and output descriptor
  612. Status GeExecutor::GetModelDescInfo(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  613. std::vector<ge::TensorDesc> &output_desc, bool new_model_desc) {
  614. if (!isInit_) {
  615. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  616. return ACL_ERROR_GE_EXEC_NOT_INIT;
  617. }
  618. std::vector<InputOutputDescInfo> input_desc_infos;
  619. std::vector<InputOutputDescInfo> output_desc_infos;
  620. std::vector<uint32_t> input_formats;
  621. std::vector<uint32_t> output_formats;
  622. Status ret = GraphExecutor::GetInputOutputDescInfo(model_id, input_desc_infos, output_desc_infos, input_formats,
  623. output_formats, new_model_desc);
  624. if (ret != domi::SUCCESS) {
  625. GELOGE(ret, "GetInputOutputDescInfo failed. ret = %u", ret);
  626. return ACL_ERROR_GE_GET_TENSOR_INFO;
  627. }
  628. if (input_formats.size() != input_desc_infos.size()) {
  629. GELOGE(ACL_ERROR_GE_PARAM_INVALID,
  630. "input_formats size %zu is not equal to input_desc_infos size %zu.",
  631. input_formats.size(), input_desc_infos.size());
  632. return ACL_ERROR_GE_PARAM_INVALID;
  633. }
  634. if (output_formats.size() != output_desc_infos.size()) {
  635. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "output_formats size %zu is not equal to output_desc_infos size %zu.",
  636. output_formats.size(), output_desc_infos.size());
  637. return ACL_ERROR_GE_PARAM_INVALID;
  638. }
  639. // Transfer data to TensorDesc
  640. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  641. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  642. return ge::SUCCESS;
  643. }
  644. ///
  645. /// @ingroup ge
  646. /// @brief Get dynamic batch_info
  647. /// @param [in] model_id
  648. /// @param [out] batch_info
  649. /// @param [out] dynamic_type
  650. /// @return execute result
  651. ///
  652. Status GeExecutor::GetDynamicBatchInfo(uint32_t model_id, std::vector<std::vector<int64_t>> &batch_info,
  653. int32_t &dynamic_type) {
  654. if (!isInit_) {
  655. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  656. return ACL_ERROR_GE_EXEC_NOT_INIT;
  657. }
  658. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  659. if (ret != SUCCESS) {
  660. GELOGE(ret, "GetDynamicBatchInfo failed.");
  661. return ret;
  662. }
  663. return SUCCESS;
  664. }
  665. ///
  666. /// @ingroup ge
  667. /// @brief Get combined dynamic dims info
  668. /// @param [in] model_id
  669. /// @param [out] batch_info
  670. /// @return execute result
  671. ///
  672. Status GeExecutor::GetCombinedDynamicDims(uint32_t model_id, vector<vector<int64_t>> &batch_info) {
  673. GELOGI("Begin to get combined dynamic dims info.");
  674. if (!isInit_) {
  675. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  676. return ACL_ERROR_GE_EXEC_NOT_INIT;
  677. }
  678. Status ret = GraphExecutor::GetCombinedDynamicDims(model_id, batch_info);
  679. if (ret != SUCCESS) {
  680. GELOGE(ret, "GetCombinedDynamicDims failed.");
  681. return ret;
  682. }
  683. GELOGI("Get combined dynamic dims succ.");
  684. return SUCCESS;
  685. }
  686. ///
  687. /// @ingroup ge
  688. /// @brief Get user designeate shape order
  689. /// @param [in] model_id
  690. /// @param [out] user_designate_shape_order
  691. /// @return execute result
  692. ///
  693. Status GeExecutor::GetUserDesignateShapeOrder(uint32_t model_id, vector<string> &user_designate_shape_order) {
  694. if (!isInit_) {
  695. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  696. return ACL_ERROR_GE_EXEC_NOT_INIT;
  697. }
  698. Status ret = GraphExecutor::GetUserDesignateShapeOrder(model_id, user_designate_shape_order);
  699. if (ret != SUCCESS) {
  700. GELOGE(ret, "GetUserDesignateShapeOrder failed.");
  701. return ret;
  702. }
  703. return SUCCESS;
  704. }
  705. ///
  706. /// @ingroup ge
  707. /// @brief Get AIPP input format
  708. /// @param [in] model_id
  709. /// @param [in] index
  710. /// @param [out] input_format
  711. /// @return execute result
  712. ///
  713. Status GeExecutor::GetAIPPInfo(uint32_t model_id, uint32_t index, AippConfigInfo &aipp_info) {
  714. GELOGI("Begin to GetAIPPInfo.");
  715. if (!isInit_) {
  716. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  717. return ACL_ERROR_GE_EXEC_NOT_INIT;
  718. }
  719. Status ret = GraphExecutor::GetAIPPInfo(model_id, index, aipp_info);
  720. if (ret != SUCCESS) {
  721. GELOGW("GetAIPPInfo is not success.");
  722. return ret;
  723. }
  724. GELOGI("GetAIPPInfo succ.");
  725. return SUCCESS;
  726. }
  727. Status GeExecutor::GetAippType(uint32_t model_id, uint32_t index, InputAippType &type, size_t &aipp_index) {
  728. GELOGI("Begin to get aipp type.");
  729. if (!isInit_) {
  730. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  731. return ACL_ERROR_GE_EXEC_NOT_INIT;
  732. }
  733. Status ret = GraphExecutor::GetAippType(model_id, index, type, aipp_index);
  734. if (ret != SUCCESS) {
  735. GELOGW("Get aipp type is not success.");
  736. return ret;
  737. }
  738. GELOGI("Get aipp type success.");
  739. return SUCCESS;
  740. }
  741. Status GeExecutor::GetModelAttr(uint32_t model_id, std::vector<std::string> &dynamic_output_shape_info) {
  742. if (!isInit_) {
  743. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  744. return ACL_ERROR_GE_EXEC_NOT_INIT;
  745. }
  746. Status ret = GraphExecutor::GetModelAttr(model_id, dynamic_output_shape_info);
  747. if (ret != SUCCESS) {
  748. GELOGE(ret, "Get dynamic batch output shape info failed.");
  749. return ret;
  750. }
  751. return SUCCESS;
  752. }
  753. Status GeExecutor::GetModelDescInfoForZeroCopy(uint32_t model_id, std::vector<ge::TensorDesc> &input_desc,
  754. std::vector<TensorDesc> &output_desc) {
  755. GELOGI("get model desc info for zero copy begin.");
  756. if (!isInit_) {
  757. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  758. return ACL_ERROR_GE_EXEC_NOT_INIT;
  759. }
  760. std::vector<InputOutputDescInfo> input_desc_infos;
  761. std::vector<InputOutputDescInfo> output_desc_infos;
  762. std::vector<uint32_t> input_formats;
  763. std::vector<uint32_t> output_formats;
  764. Status ret = GraphExecutor::GetInputOutputDescInfoForZeroCopy(model_id, input_desc_infos, output_desc_infos,
  765. input_formats, output_formats);
  766. if (ret != domi::SUCCESS) {
  767. GELOGE(ret, "Get DescInfo from zero copy failed. ret = %u", ret);
  768. return ACL_ERROR_GE_GET_TENSOR_INFO;
  769. }
  770. if (input_formats.size() != input_desc_infos.size()) {
  771. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "input_formats.size() != input_desc_infos.size().");
  772. return ACL_ERROR_GE_PARAM_INVALID;
  773. }
  774. if (output_formats.size() != output_desc_infos.size()) {
  775. GELOGE(ACL_ERROR_GE_PARAM_INVALID, "output_formats.size() != output_desc_infos.size().");
  776. return ACL_ERROR_GE_PARAM_INVALID;
  777. }
  778. GetGeTensorDescFromDomiInfo(input_desc, input_desc_infos, input_formats);
  779. GetGeTensorDescFromDomiInfo(output_desc, output_desc_infos, output_formats);
  780. GELOGI("get model desc info from zero copy end.");
  781. return ge::SUCCESS;
  782. }
  783. Status GeExecutor::CommandHandle(const Command &command) {
  784. Status ret = GraphLoader::CommandHandle(command);
  785. if (ret != SUCCESS) {
  786. GELOGE(ACL_ERROR_GE_COMMAND_HANDLE, "CommandHandle: Command Handle failed.");
  787. return ACL_ERROR_GE_COMMAND_HANDLE;
  788. }
  789. return SUCCESS;
  790. }
  791. Status GeExecutor::GetMaxUsedMemory(uint32_t model_id, uint32_t &max_size) {
  792. GELOGI("Get max used memory begin.");
  793. if (!isInit_) {
  794. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  795. return ACL_ERROR_GE_EXEC_NOT_INIT;
  796. }
  797. uint64_t max_mem_size = 0;
  798. Status ret = GraphLoader::GetMaxUsedMemory(model_id, max_mem_size);
  799. max_size = static_cast<uint32_t>(max_mem_size);
  800. return ret;
  801. }
  802. /**
  803. * @ingroup ge
  804. * @brief Load data from model file to memory
  805. * @param [in] const std::string &path: Offline model file path
  806. * @param [out] domi::ModelData &model_data: Offline model memory data
  807. * @return SUCCESS handle successfully / others handle failed
  808. */
  809. Status GeExecutor::LoadDataFromFile(const std::string &path, ModelData &model_data) {
  810. GELOGI("Load data from file begin.");
  811. if (!isInit_) {
  812. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  813. return ACL_ERROR_GE_EXEC_NOT_INIT;
  814. }
  815. string filePath = RealPath(path.c_str());
  816. if (filePath.empty()) {
  817. GELOGE(ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID,
  818. "File path is invalid. please check your text file '%s'.", path.c_str());
  819. return ACL_ERROR_GE_EXEC_MODEL_PATH_INVALID;
  820. }
  821. GELOGI("load modelData from file: %s.", path.c_str());
  822. std::string key_path;
  823. int32_t priority = 0;
  824. Status ret = GraphLoader::LoadDataFromFile(path, key_path, priority, model_data);
  825. if (ret != SUCCESS) {
  826. if (model_data.model_data != nullptr) {
  827. delete[] static_cast<char *>(model_data.model_data);
  828. model_data.model_data = nullptr;
  829. }
  830. }
  831. return ret;
  832. }
  833. /**
  834. * @ingroup ge
  835. * @brief Load model from offline model memory data
  836. * @param [in] domi::ModelData &model_data: Offline model data
  837. void *dev_ptr: Input/Output memory start address
  838. size_t memsize: Input/Output memory length
  839. void *weight_ptr: Weight memory start address
  840. size_t weightsize: Weight memory length
  841. * @param [out] uint32_t &model_id: identification after model loading
  842. * @return SUCCESS handle successfully / others handle failed
  843. */
  844. Status GeExecutor::LoadModelFromData(uint32_t &model_id, const ModelData &model_data, void *dev_ptr, size_t mem_size,
  845. void *weight_ptr, size_t weight_size) {
  846. if (!isInit_) {
  847. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  848. return ACL_ERROR_GE_EXEC_NOT_INIT;
  849. }
  850. return GraphLoader::LoadModelFromData(model_id, model_data, dev_ptr, mem_size, weight_ptr, weight_size);
  851. }
  852. /**
  853. * @ingroup ge
  854. * @brief Load task list from ModelData with queue.
  855. * @param [out] model_id: model id allocate from manager.
  856. * @param [in] ge_model_data: Model data load from offline model.
  857. * @param [in] input_queue_ids: input queue ids create from user.
  858. * @param [in] output_queue_ids: input queue ids create from user.
  859. * @return: 0 for success / others for fail
  860. */
  861. Status GeExecutor::LoadModelWithQ(uint32_t &model_id, const ModelData &model_data,
  862. const std::vector<uint32_t> &input_queue_ids,
  863. const std::vector<uint32_t> &output_queue_ids) {
  864. GELOGI("Load model with queue begin.");
  865. if (!isInit_) {
  866. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  867. return ACL_ERROR_GE_EXEC_NOT_INIT;
  868. }
  869. return GraphLoader::LoadModelWithQ(model_id, model_data, input_queue_ids, output_queue_ids);
  870. }
  871. /**
  872. * @ingroup ge
  873. * @brief Synchronous execution of offline model(Do not create thread)
  874. * @param [in] uint32_t model_id: Model ID to execute
  875. void* stream: stream to execute
  876. const domi::InputData *input_data: Model input data
  877. bool async_mode: is asynchronize mode.
  878. * @param [out] domi::OutputData *output_data: Model output data
  879. * @return SUCCESS handle successfully / others handle failed
  880. */
  881. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  882. ge::RunModelData &run_output_data, bool async_mode) {
  883. std::vector<GeTensorDesc> input_desc = {};
  884. std::vector<GeTensorDesc> output_desc = {};
  885. return ExecModel(model_id, stream, run_input_data, input_desc, run_output_data, output_desc, async_mode);
  886. }
  887. /**
  888. * @ingroup ge
  889. * @brief Synchronous execution of offline model(Do not create thread)
  890. * @param [in] uint32_t model_id: Model ID to execute
  891. void* stream: stream to execute
  892. const domi::InputData *input_data: Model input data
  893. const std::vector<GeTensorDesc> &input_desc: Description of model input data
  894. bool async_mode: is asynchronize mode
  895. * @param [out] domi::OutputData *output_data: Model output data
  896. * @param [out] std::vector<GeTensorDesc> &output_desc: Description of model output data
  897. * @return SUCCESS handle successfully / others handle failed
  898. */
  899. Status GeExecutor::ExecModel(uint32_t model_id, void *stream, const ge::RunModelData &run_input_data,
  900. const std::vector<GeTensorDesc> &input_desc, ge::RunModelData &run_output_data,
  901. std::vector<GeTensorDesc> &output_desc, bool async_mode) {
  902. if (!isInit_) {
  903. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  904. return ACL_ERROR_GE_EXEC_NOT_INIT;
  905. }
  906. InputData input_data;
  907. OutputData output_data;
  908. GetDomiInputData(run_input_data, input_data);
  909. GetDomiOutputData(run_output_data, output_data);
  910. if ((run_input_data.dynamic_batch_size != 0) || (run_input_data.dynamic_image_width != 0) ||
  911. (run_input_data.dynamic_image_height != 0) || (run_input_data.dynamic_dims.size() != 0)) {
  912. std::vector<std::vector<int64_t>> batch_info;
  913. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  914. Status ret = GraphExecutor::GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  915. if (ret != SUCCESS) {
  916. GELOGE(ret, "Get dynamic input info failed.");
  917. return ret;
  918. }
  919. if (!batch_info.empty()) {
  920. SetDynamicInputDataFlag(run_input_data, batch_info, input_data);
  921. }
  922. }
  923. return GraphLoader::ExecuteModel(model_id, stream, async_mode, input_data, input_desc, output_data, output_desc);
  924. }
  925. /**
  926. * @ingroup ge
  927. * @brief Get weight memory size from model file
  928. * @param [in] const std::string &path: Offline model file path
  929. * @param [out] size_t &mem_size Execution memory size
  930. size_t &weight_size Weight memory space size
  931. * @return SUCCESS handle successfully / others handle failed
  932. */
  933. Status GeExecutor::GetMemAndWeightSize(const std::string &path, size_t &mem_size, size_t &weight_size) {
  934. GELOGI("Get memory and weight size from file begin.");
  935. if (!isInit_) {
  936. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  937. return ACL_ERROR_GE_EXEC_NOT_INIT;
  938. }
  939. ModelData model;
  940. std::string key;
  941. Status ret = ge::GraphLoader::LoadDataFromFile(path, key, 0, model);
  942. if ((ret != SUCCESS) || (model.model_data == nullptr)) {
  943. GELOGE(ret, "Load data from file failed. ret = %d", ret);
  944. return ret;
  945. }
  946. ret = ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  947. delete[] static_cast<char *>(model.model_data);
  948. model.model_data = nullptr;
  949. return ret;
  950. }
  951. /**
  952. * @ingroup ge
  953. * @brief Get weight memory size from model file
  954. * @param [in] const void *model_data Offline model buffer
  955. size_t model_size Offline model buffer length
  956. * @param [out] size_t &mem_size Execution memory size
  957. size_t &weight_size Weight memory space size
  958. * @return SUCCESS handle successfully / others handle failed
  959. */
  960. Status GeExecutor::GetMemAndWeightSize(const void *model_data, size_t model_size, size_t &mem_size,
  961. size_t &weight_size) {
  962. GELOGI("Get memory and weight size from data begin.");
  963. if (!isInit_) {
  964. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "GeExecutor has not been initialized!");
  965. return ACL_ERROR_GE_EXEC_NOT_INIT;
  966. }
  967. if (model_data == nullptr) {
  968. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID, "invalid model data!");
  969. return ACL_ERROR_GE_EXEC_MODEL_ADDR_INVALID;
  970. }
  971. ModelData model;
  972. model.model_data = const_cast<void *>(model_data);
  973. model.model_len = static_cast<uint32_t>(model_size);
  974. return ge::ModelManager::GetModelMemAndWeightSize(model, mem_size, weight_size);
  975. }
  976. Status GeExecutor::LoadSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  977. SingleOp **single_op) {
  978. return SingleOpManager::GetInstance().GetOpFromModel(model_name, modelData, stream, single_op);
  979. }
  980. Status GeExecutor::LoadDynamicSingleOp(const std::string &model_name, const ge::ModelData &modelData, void *stream,
  981. DynamicSingleOp **single_op) {
  982. return SingleOpManager::GetInstance().GetDynamicOpFromModel(model_name, modelData, stream, single_op);
  983. }
  984. Status GeExecutor::ExecuteAsync(SingleOp *executor, const std::vector<DataBuffer> &inputs,
  985. std::vector<DataBuffer> &outputs) {
  986. if (executor == nullptr) {
  987. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "param is NULL");
  988. return ACL_ERROR_GE_EXEC_NOT_INIT;
  989. }
  990. return executor->ExecuteAsync(inputs, outputs);
  991. }
  992. ge::Status GeExecutor::ExecuteAsync(DynamicSingleOp *executor, const vector<GeTensorDesc> &input_desc,
  993. const vector<DataBuffer> &inputs, vector<GeTensorDesc> &output_desc,
  994. vector<DataBuffer> &outputs) {
  995. GE_CHECK_NOTNULL(executor);
  996. return executor->ExecuteAsync(input_desc, inputs, output_desc, outputs);
  997. }
  998. Status GeExecutor::ReleaseSingleOpResource(void *stream) {
  999. ModelManager::GetInstance()->ClearAicpuSo();
  1000. return SingleOpManager::GetInstance().ReleaseResource(stream);
  1001. }
  1002. Status GeExecutor::GetDeviceIdByModelId(uint32_t model_id, uint32_t &device_id) {
  1003. auto model_manager = ModelManager::GetInstance();
  1004. GE_CHECK_NOTNULL(model_manager);
  1005. auto davinci_model = model_manager->GetModel(model_id);
  1006. if (davinci_model == nullptr) {
  1007. GELOGE(ACL_ERROR_GE_EXEC_MODEL_ID_INVALID, "Model id: %d is invaild or model is not loaded.", model_id);
  1008. return ACL_ERROR_GE_EXEC_MODEL_ID_INVALID;
  1009. }
  1010. device_id = davinci_model->GetDeviceId();
  1011. return SUCCESS;
  1012. }
  1013. Status GeExecutor::GetBatchInfoSize(uint32_t model_id, size_t &shape_count) {
  1014. std::vector<std::vector<int64_t>> batch_info;
  1015. int32_t dynamic_type = static_cast<int32_t>(FIXED);
  1016. Status ret = GetDynamicBatchInfo(model_id, batch_info, dynamic_type);
  1017. if (ret != SUCCESS) {
  1018. GELOGE(ret, "Calc batch info size failed. ret = %d", ret);
  1019. return ret;
  1020. }
  1021. if (batch_info.empty()) {
  1022. shape_count = kStaticBatchInfoSize;
  1023. } else {
  1024. shape_count = batch_info.size();
  1025. }
  1026. return SUCCESS;
  1027. }
  1028. Status GeExecutor::GetOrigInputInfo(uint32_t model_id, uint32_t index, OriginInputInfo &orig_input_info) {
  1029. GELOGI("Begin to GetOrigInputInfo.");
  1030. if (!isInit_) {
  1031. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  1032. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1033. }
  1034. Status ret = GraphExecutor::GetOrigInputInfo(model_id, index, orig_input_info);
  1035. if (ret != SUCCESS) {
  1036. GELOGE(ret, "GetOrigInputInfo failed.");
  1037. return ret;
  1038. }
  1039. GELOGI("GetOrigInputInfo succ.");
  1040. return SUCCESS;
  1041. }
  1042. Status GeExecutor::GetAllAippInputOutputDims(uint32_t model_id, uint32_t index,
  1043. std::vector<InputOutputDims> &input_dims,
  1044. std::vector<InputOutputDims> &output_dims) {
  1045. GELOGI("Begin to GetAllAippInputOutputDims.");
  1046. if (!isInit_) {
  1047. GELOGE(ACL_ERROR_GE_EXEC_NOT_INIT, "not inited yet!");
  1048. return ACL_ERROR_GE_EXEC_NOT_INIT;
  1049. }
  1050. Status ret = GraphExecutor::GetAllAippInputOutputDims(model_id, index, input_dims, output_dims);
  1051. if (ret != SUCCESS) {
  1052. GELOGE(ret, "GetAllAippInputOutputDims failed.");
  1053. return ret;
  1054. }
  1055. GELOGI("GetAllAippInputOutputDims succ.");
  1056. return SUCCESS;
  1057. }
  1058. Status GeExecutor::GetOpDescInfo(uint32_t device_id, uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) {
  1059. GELOGI("Begin to GetOpDescInfo.");
  1060. Status ret = GraphExecutor::GetOpDescInfo(device_id, stream_id, task_id, op_desc_info);
  1061. if (ret != SUCCESS) {
  1062. GELOGE(ret, "GetOpDescInfo failed.");
  1063. return ret;
  1064. }
  1065. GELOGI("GetOpDescInfo succ.");
  1066. return SUCCESS;
  1067. }
  1068. Status GeExecutor::SetDump(const DumpConfig &dump_config) {
  1069. GELOGI("Start to set dump config");
  1070. auto ret = DumpManager::GetInstance().SetDumpConf(dump_config);
  1071. if (ret != SUCCESS) {
  1072. GELOGE(ret, "Set dump conf failed");
  1073. return ret;
  1074. }
  1075. GELOGI("Set dump config successfully");
  1076. return SUCCESS;
  1077. }
  1078. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示