You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

kernel_task_info_unittest.cc 38 kB

4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
4 years ago
12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
37047057067077087097107117127137147157167177187197207217227237247257267277287297307317327337347357367377387397407417427437447457467477487497507517527537547557567577587597607617627637647657667677687697707717727737747757767777787797807817827837847857867877887897907917927937947957967977987998008018028038048058068078088098108118128138148158168178188198208218228238248258268278288298308318328338348358368378388398408418428438448458468478488498508518528538548558568578588598608618628638648658668678688698708718728738748758768778788798808818828838848858868878888898908918928938948958968978988999009019029039049059069079089099109119129139149159169179189199209219229239249259269279289299309319329339349359369379389399409419429439449459469479489499509519529539549559569579589599609619629639649659669679689699709719729739749759769779789799809819829839849859869879889899909919929939949959969979989991000100110021003100410051006100710081009101010111012101310141015101610171018101910201021102210231024102510261027102810291030103110321033103410351036103710381039104010411042104310441045104610471048104910501051105210531054105510561057105810591060106110621063106410651066106710681069107010711072107310741075107610771078107910801081108210831084108510861087108810891090109110921093109410951096109710981099110011011102110311041105110611071108110911101111111211131114111511161117111811191120112111221123112411251126112711281129113011311132113311341135113611371138113911401141114211431144114511461147114811491150115111521153115411551156115711581159116011611162116311641165116611671168116911701171117211731174117511761177117811791180118111821183118411851186118711881189119011911192119311941195119611971198119912001201
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <gtest/gtest.h>
  17. #define private public
  18. #define protected public
  19. #include "graph/load/model_manager/davinci_model.h"
  20. #include "graph/load/model_manager/task_info/kernel_task_info.h"
  21. #include "graph/load/model_manager/task_info/hccl_task_info.h"
  22. namespace ge {
  23. extern OpDescPtr CreateOpDesc(string name, string type);
  24. class UtestKernelTaskInfo : public testing::Test {
  25. protected:
  26. void SetUp() {}
  27. void TearDown() {}
  28. };
  29. // test KernelTaskInfo Init.
  30. TEST_F(UtestKernelTaskInfo, success_kernel_taskInfo_not_te) {
  31. DavinciModel model(0, nullptr);
  32. domi::ModelTaskDef model_task_def;
  33. domi::TaskDef *task = model_task_def.add_task();
  34. task->set_type(RT_MODEL_TASK_KERNEL);
  35. TaskInfoPtr task_info = TaskInfoFactory::Instance().Create(static_cast<rtModelTaskType_t>(task->type()));
  36. task->stream_id_ = 0;
  37. rtStream_t stream = nullptr;
  38. rtStreamCreate(&stream, 0);
  39. model.stream_list_ = { stream };
  40. domi::KernelDef *kernel_def = task->mutable_kernel();
  41. domi::KernelContext *ctx = kernel_def->mutable_context();
  42. model.op_list_[0] = CreateOpDesc("relu", RELU);
  43. ctx->set_op_index(0);
  44. EXPECT_EQ(task_info->Init(*task, &model), FAILED);
  45. kernel_def->set_block_dim(10);
  46. kernel_def->set_args("args111111", 10);
  47. kernel_def->set_args_size(10);
  48. ctx->set_kernel_type(0);
  49. EXPECT_EQ(task_info->Init(*task, &model), INTERNAL_ERROR);
  50. task_info->Release();
  51. }
  52. TEST_F(UtestKernelTaskInfo, success_init_kernel_task_info_fail) {
  53. DavinciModel model(0, nullptr);
  54. KernelTaskInfo kernel_task_info;
  55. domi::TaskDef task_def;
  56. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  57. domi::KernelContext *ctx = kernel_def->mutable_context();
  58. model.op_list_[0] = CreateOpDesc("relu", RELU);
  59. ctx->set_op_index(0);
  60. rtStream_t stream = nullptr;
  61. rtStreamCreate(&stream, 0);
  62. model.stream_list_ = { stream };
  63. // Failed by rtGetFunctionByName.
  64. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  65. }
  66. // test InitTVMTask failed
  67. TEST_F(UtestKernelTaskInfo, init_tvm_task_fail) {
  68. DavinciModel model(0, nullptr);
  69. domi::TaskDef task_def;
  70. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  71. KernelTaskInfo kernel_task_info;
  72. kernel_task_info.davinci_model_ = &model;
  73. EXPECT_EQ(kernel_task_info.InitTVMTask(0, *kernel_def), PARAM_INVALID);
  74. task_def.clear_kernel();
  75. }
  76. // test InitTVMTask with kernel_type is TE
  77. TEST_F(UtestKernelTaskInfo, init_tvm_task_info_with_te_kernel_type) {
  78. DavinciModel model(0, nullptr);
  79. domi::TaskDef task_def;
  80. // DavinciModel is nullptr
  81. KernelTaskInfo kernel_task_info;
  82. EXPECT_EQ(kernel_task_info.Init(task_def, nullptr), PARAM_INVALID);
  83. rtStream_t stream = nullptr;
  84. rtStreamCreate(&stream, 0);
  85. model.stream_list_ = { stream };
  86. model.op_list_[0] = CreateOpDesc("", "");
  87. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  88. rtSmDesc_t l2CtrlInfo;
  89. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  90. kernel_def->set_args("args111111", 10);
  91. kernel_def->set_args_size(10);
  92. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  93. kernel_def->set_flowtable("fl", 2);
  94. kernel_def->set_block_dim(10);
  95. domi::KernelContext *ctx = kernel_def->mutable_context();
  96. ctx->set_kernel_type(2);
  97. ctx->set_op_index(4);
  98. ctx->set_args_offset("\0\0"); // args_offset = 0
  99. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  100. ctx->clear_args_offset();
  101. ctx->set_args_offset("args111111", 10);
  102. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  103. ctx->clear_op_index();
  104. ctx->set_op_index(0);
  105. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  106. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  107. kernel_def->clear_context();
  108. task_def.clear_kernel();
  109. }
  110. // test InitAICPUCustomTask with kernel_type is CUSTOMIZED
  111. TEST_F(UtestKernelTaskInfo, init_kernel_task_info_with_customized_kernel_type) {
  112. DavinciModel model(0, nullptr);
  113. rtStream_t stream = nullptr;
  114. rtStreamCreate(&stream, 0);
  115. model.stream_list_ = { stream };
  116. model.op_list_[0] = CreateOpDesc("", "");
  117. domi::TaskDef task_def;
  118. KernelTaskInfo kernel_task_info;
  119. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  120. rtSmDesc_t l2CtrlInfo;
  121. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  122. kernel_def->set_args("args111111", 10);
  123. kernel_def->set_args_size(10);
  124. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  125. kernel_def->set_flowtable("fl", 2);
  126. kernel_def->set_block_dim(10);
  127. domi::KernelContext *ctx = kernel_def->mutable_context();
  128. ctx->set_kernel_type(3);
  129. ctx->set_op_index(4);
  130. ctx->set_args_offset("\0\0"); // args_offset = 0
  131. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  132. ctx->clear_args_offset();
  133. ctx->set_args_offset("args111111", 10);
  134. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  135. ctx->clear_args_offset();
  136. ctx->set_op_index(0);
  137. const char task[] = "opattr";
  138. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  139. EXPECT_EQ(kernel_task_info.Init(task_def, &model), PARAM_INVALID);
  140. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  141. kernel_def->clear_context();
  142. task_def.clear_kernel();
  143. }
  144. // test InitAICPUCustomTask failed
  145. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed) {
  146. DavinciModel model(0, nullptr);
  147. rtStream_t stream = nullptr;
  148. rtStreamCreate(&stream, 0);
  149. model.stream_list_ = { stream };
  150. model.op_list_[0] = CreateOpDesc("", "");
  151. domi::TaskDef task_def;
  152. KernelTaskInfo kernel_task_info;
  153. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  154. domi::KernelContext *context = kernel_def->mutable_context();
  155. context->set_args_offset("\0\0");
  156. kernel_task_info.davinci_model_ = &model;
  157. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), PARAM_INVALID);
  158. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  159. context->clear_args_offset();
  160. context->set_args_offset("args111111", 10);
  161. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  162. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  163. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  164. kernel_def->clear_context();
  165. task_def.clear_kernel();
  166. }
  167. // test InitAICPUCustomTask failed
  168. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed2) {
  169. DavinciModel model(0, nullptr);
  170. rtStream_t stream = nullptr;
  171. rtStreamCreate(&stream, 0);
  172. model.stream_list_ = { stream };
  173. model.op_list_[0] = CreateOpDesc("", "");
  174. domi::TaskDef task_def;
  175. KernelTaskInfo kernel_task_info;
  176. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  177. domi::KernelContext *context = kernel_def->mutable_context();
  178. kernel_task_info.davinci_model_ = &model;
  179. context->set_args_offset("\0\0");
  180. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  181. // AttrUtils::GetBytes -> true
  182. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), PARAM_INVALID);
  183. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  184. kernel_def->clear_context();
  185. task_def.clear_kernel();
  186. }
  187. // test InitAICPUCustomTask failed
  188. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed3) {
  189. DavinciModel model(0, nullptr);
  190. rtStream_t stream = nullptr;
  191. rtStreamCreate(&stream, 0);
  192. model.stream_list_ = { stream };
  193. model.op_list_[0] = CreateOpDesc("", "");
  194. domi::TaskDef task_def;
  195. KernelTaskInfo kernel_task_info;
  196. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  197. domi::KernelContext *context = kernel_def->mutable_context();
  198. kernel_task_info.davinci_model_ = &model;
  199. context->set_args_offset("\0\0");
  200. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  201. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), PARAM_INVALID);
  202. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  203. kernel_def->clear_context();
  204. task_def.clear_kernel();
  205. }
  206. // test InitAICPUCustomTask failed
  207. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed4) {
  208. DavinciModel model(0, nullptr);
  209. rtStream_t stream = nullptr;
  210. rtStreamCreate(&stream, 0);
  211. model.stream_list_ = { stream };
  212. model.op_list_[0] = CreateOpDesc("", "");
  213. const char task[] = "opattr";
  214. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  215. domi::TaskDef task_def;
  216. KernelTaskInfo kernel_task_info;
  217. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  218. domi::KernelContext *context = kernel_def->mutable_context();
  219. kernel_task_info.davinci_model_ = &model;
  220. context->set_args_offset("args111111", 10);
  221. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  222. // rtMalloc RT_ERROR_NONE
  223. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  224. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  225. kernel_def->clear_context();
  226. task_def.clear_kernel();
  227. }
  228. // test InitAICPUCustomTask failed
  229. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed5) {
  230. DavinciModel model(0, nullptr);
  231. rtStream_t stream = nullptr;
  232. rtStreamCreate(&stream, 0);
  233. model.stream_list_ = { stream };
  234. model.op_list_[0] = CreateOpDesc("", "");
  235. const char task[] = "opattr";
  236. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  237. domi::TaskDef task_def;
  238. KernelTaskInfo kernel_task_info;
  239. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  240. domi::KernelContext *context = kernel_def->mutable_context();
  241. kernel_task_info.davinci_model_ = &model;
  242. context->set_args_offset("args111111", 10);
  243. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  244. // rtMalloc RT_ERROR_NONE
  245. // rtMemcpy RT_ERROR_INVALID_VALIUE
  246. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  247. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  248. kernel_def->clear_context();
  249. task_def.clear_kernel();
  250. }
  251. // test InitAICPUCustomTask failed
  252. TEST_F(UtestKernelTaskInfo, init_aicpu_custom_task_failed6) {
  253. DavinciModel model(0, nullptr);
  254. rtStream_t stream = nullptr;
  255. rtStreamCreate(&stream, 0);
  256. model.stream_list_ = { stream };
  257. model.op_list_[0] = CreateOpDesc("", "");
  258. const char task[] = "opattr";
  259. AttrUtils::SetBytes(model.op_list_[0], ATTR_NAME_OPATTR, Buffer::CopyFrom((uint8_t *)task, sizeof(task)));
  260. domi::TaskDef task_def;
  261. KernelTaskInfo kernel_task_info;
  262. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  263. domi::KernelContext *context = kernel_def->mutable_context();
  264. kernel_task_info.davinci_model_ = &model;
  265. context->set_args_offset("args111111", 10);
  266. // KernelTaskInfo::StoreInputOutputTensor -> SUCCESS
  267. // rtMalloc RT_ERROR_NONE
  268. // rtMemcpy RT_ERROR_NONE
  269. EXPECT_EQ(kernel_task_info.InitAICPUCustomTask(0, *kernel_def), FAILED);
  270. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  271. kernel_def->clear_context();
  272. task_def.clear_kernel();
  273. }
  274. TEST_F(UtestKernelTaskInfo, init_kernel_taskInfo_with_aicpu_kernel_type) {
  275. DavinciModel model(0, nullptr);
  276. rtStream_t stream = nullptr;
  277. rtStreamCreate(&stream, 0);
  278. model.stream_list_ = { stream };
  279. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  280. domi::TaskDef task_def;
  281. KernelTaskInfo kernel_task_info;
  282. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  283. task_def.set_type(RT_MODEL_TASK_KERNEL);
  284. string args;
  285. args.append(100, '1');
  286. kernel_def->set_so_name("libDvpp.so");
  287. kernel_def->set_kernel_name("DvppResize");
  288. kernel_def->set_args(args.data(), 100);
  289. kernel_def->set_args_size(100);
  290. domi::KernelContext *ctx = kernel_def->mutable_context();
  291. ctx->set_kernel_type(6);
  292. ctx->set_op_index(0);
  293. // ModelUtils::GetInputDataAddrs -> ok
  294. // ModelUtils::GetOutputDataAddrs -> ok
  295. // rtMalloc -> RT_ERROR_NONE
  296. // rtMemcpy -> RT_ERROR_NONE
  297. EXPECT_EQ(kernel_task_info.Init(task_def, &model), SUCCESS);
  298. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  299. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  300. kernel_def->clear_context();
  301. task_def.clear_kernel();
  302. }
  303. TEST_F(UtestKernelTaskInfo, init_kernel_taskInfo_with_aicpu_kernel_type_fail) {
  304. DavinciModel model(0, nullptr);
  305. rtStream_t stream = nullptr;
  306. rtStreamCreate(&stream, 0);
  307. model.stream_list_ = { stream };
  308. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  309. domi::TaskDef task_def;
  310. KernelTaskInfo kernel_task_info;
  311. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  312. task_def.set_type(RT_MODEL_TASK_KERNEL);
  313. string args;
  314. args.append(100, '1');
  315. kernel_def->set_so_name("libDvpp.so");
  316. kernel_def->set_kernel_name("DvppResize");
  317. kernel_def->set_args(args.data(), 100);
  318. kernel_def->set_args_size(100);
  319. domi::KernelContext *ctx = kernel_def->mutable_context();
  320. ctx->set_kernel_type(6);
  321. ctx->set_op_index(0);
  322. // ModelUtils::GetInputDataAddrs -> ok
  323. // ModelUtils::GetOutputDataAddrs -> ok
  324. // rtMalloc -> RT_ERROR_NONE
  325. // rtMemcpy -> RT_ERROR_INVALID_VALUE
  326. EXPECT_EQ(kernel_task_info.Init(task_def, &model), SUCCESS);
  327. const string ext_info = {1, 1, 1, 1, 0, 0, 0, 0};
  328. EXPECT_EQ(kernel_task_info.InitAicpuTaskExtInfo(ext_info), SUCCESS);
  329. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  330. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  331. kernel_def->clear_context();
  332. task_def.clear_kernel();
  333. }
  334. TEST_F(UtestKernelTaskInfo, init_kernel_taskInfo_with_aicpu_kernel_type_fail2) {
  335. DavinciModel model(0, nullptr);
  336. rtStream_t stream = nullptr;
  337. rtStreamCreate(&stream, 0);
  338. model.stream_list_ = { stream };
  339. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  340. domi::TaskDef task_def;
  341. KernelTaskInfo kernel_task_info;
  342. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  343. task_def.set_type(RT_MODEL_TASK_KERNEL);
  344. string args;
  345. args.append(100, '1');
  346. kernel_def->set_so_name("libDvpp.so");
  347. kernel_def->set_kernel_name("DvppResize");
  348. kernel_def->set_args(args.data(), 100);
  349. kernel_def->set_args_size(100);
  350. domi::KernelContext *ctx = kernel_def->mutable_context();
  351. ctx->set_kernel_type(6);
  352. ctx->set_op_index(0);
  353. // ModelUtils::GetInputDataAddrs -> ok
  354. // ModelUtils::GetOutputDataAddrs -> ok
  355. // rtMalloc -> RT_ERROR_INVALID_VALUE
  356. // rtMemcpy -> RT_ERROR_NONE
  357. EXPECT_EQ(kernel_task_info.Init(task_def, &model), SUCCESS);
  358. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  359. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  360. kernel_def->clear_context();
  361. task_def.clear_kernel();
  362. }
  363. // test StoreInputOutputTensor failed
  364. TEST_F(UtestKernelTaskInfo, store_input_output_tensor_fail) {
  365. std::vector<void *> input_data_addrs;
  366. std::vector<void *> output_data_addrs;
  367. std::vector<::tagCcAICPUTensor> input_descs;
  368. std::vector<::tagCcAICPUTensor> output_descs;
  369. KernelTaskInfo kernel_task_info;
  370. // rtMalloc -> RT_ERROR_INVALID_VALUE
  371. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  372. }
  373. TEST_F(UtestKernelTaskInfo, store_input_output_tensor_fail2) {
  374. std::vector<void *> input_data_addrs;
  375. std::vector<void *> output_data_addrs;
  376. std::vector<::tagCcAICPUTensor> input_descs;
  377. std::vector<::tagCcAICPUTensor> output_descs;
  378. KernelTaskInfo kernel_task_info;
  379. // rtMalloc -> RT_ERROR_INVALID_VALUE
  380. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  381. }
  382. // test InitCceTask success
  383. TEST_F(UtestKernelTaskInfo, kernel_task_info_init_cce_task) {
  384. DavinciModel model(0, nullptr);
  385. rtStream_t stream = nullptr;
  386. rtStreamCreate(&stream, 0);
  387. model.stream_list_ = { stream };
  388. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  389. domi::TaskDef task_def;
  390. KernelTaskInfo kernel_task_info;
  391. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  392. kernel_task_info.davinci_model_ = &model;
  393. kernel_def->set_flowtable("InitCceTask");
  394. domi::KernelContext *context = kernel_def->mutable_context();
  395. context->set_is_flowtable(true);
  396. rtSmDesc_t l2CtrlInfo;
  397. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  398. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  399. model.runtime_param_.logic_mem_base = 0;
  400. model.runtime_param_.mem_size = 0;
  401. model.runtime_param_.logic_weight_base = 0;
  402. model.runtime_param_.weight_size = 0;
  403. model.runtime_param_.logic_var_base = 0;
  404. model.runtime_param_.var_size = 0;
  405. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  406. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  407. // rtMalloc -> RT_ERROR_NONE
  408. // rtMemcpy -> RT_ERROR_NONE
  409. // rtMemAllocManaged -> RT_ERROR_NONE
  410. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  411. kernel_def->clear_context();
  412. task_def.clear_kernel();
  413. }
  414. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed1) {
  415. DavinciModel model(0, nullptr);
  416. domi::TaskDef task_def;
  417. KernelTaskInfo kernel_task_info;
  418. kernel_task_info.davinci_model_ = &model;
  419. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  420. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  421. task_def.clear_kernel();
  422. }
  423. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed2) {
  424. DavinciModel model(0, nullptr);
  425. rtStream_t stream = nullptr;
  426. rtStreamCreate(&stream, 0);
  427. model.stream_list_ = { stream };
  428. model.op_list_[0] = CreateOpDesc("", "");
  429. domi::TaskDef task_def;
  430. KernelTaskInfo kernel_task_info;
  431. kernel_task_info.davinci_model_ = &model;
  432. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  433. // KernelTaskInfo::SetContext -> SUCCESS
  434. domi::KernelContext *context = kernel_def->mutable_context();
  435. context->set_is_flowtable(true);
  436. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  437. kernel_def->clear_context();
  438. task_def.clear_kernel();
  439. }
  440. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed3) {
  441. DavinciModel model(0, nullptr);
  442. rtStream_t stream = nullptr;
  443. rtStreamCreate(&stream, 0);
  444. model.stream_list_ = { stream };
  445. model.op_list_[0] = CreateOpDesc("", "");
  446. domi::TaskDef task_def;
  447. KernelTaskInfo kernel_task_info;
  448. kernel_task_info.davinci_model_ = &model;
  449. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  450. // KernelTaskInfo::SetContext -> SUCCESS
  451. kernel_def->set_flowtable("InitCceTask");
  452. domi::KernelContext *context = kernel_def->mutable_context();
  453. context->set_is_flowtable(true);
  454. // KernelTaskInfo::UpdateCceArgs -> CCE_FAILED
  455. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  456. kernel_def->clear_context();
  457. task_def.clear_kernel();
  458. }
  459. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed4) {
  460. DavinciModel model(0, nullptr);
  461. rtStream_t stream = nullptr;
  462. rtStreamCreate(&stream, 0);
  463. model.stream_list_ = { stream };
  464. model.op_list_[0] = CreateOpDesc("", "");
  465. domi::TaskDef task_def;
  466. KernelTaskInfo kernel_task_info;
  467. kernel_task_info.davinci_model_ = &model;
  468. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  469. // KernelTaskInfo::SetContext -> SUCCESS
  470. kernel_def->set_flowtable("InitCceTask");
  471. domi::KernelContext *context = kernel_def->mutable_context();
  472. context->set_is_flowtable(true);
  473. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  474. // KernelTaskInfo::SetFlowtable -> RT_FAILED
  475. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  476. kernel_def->clear_context();
  477. task_def.clear_kernel();
  478. }
  479. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed5) {
  480. DavinciModel model(0, nullptr);
  481. rtStream_t stream = nullptr;
  482. rtStreamCreate(&stream, 0);
  483. model.stream_list_ = { stream };
  484. model.op_list_[0] = CreateOpDesc("", "");
  485. domi::TaskDef task_def;
  486. KernelTaskInfo kernel_task_info;
  487. kernel_task_info.davinci_model_ = &model;
  488. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  489. // KernelTaskInfo::SetContext -> SUCCESS
  490. kernel_def->set_flowtable("InitCceTask");
  491. domi::KernelContext *context = kernel_def->mutable_context();
  492. context->set_is_flowtable(true);
  493. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  494. // KernelTaskInfo::SetFlowtable -> SUCCESS
  495. // rtMalloc -> RT_ERROR_INVALID_VALUE
  496. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  497. kernel_def->clear_context();
  498. task_def.clear_kernel();
  499. }
  500. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed6) {
  501. DavinciModel model(0, nullptr);
  502. rtStream_t stream = nullptr;
  503. rtStreamCreate(&stream, 0);
  504. model.stream_list_ = { stream };
  505. model.op_list_[0] = CreateOpDesc("", "");
  506. domi::TaskDef task_def;
  507. KernelTaskInfo kernel_task_info;
  508. kernel_task_info.davinci_model_ = &model;
  509. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  510. // KernelTaskInfo::SetContext -> SUCCESS
  511. kernel_def->set_flowtable("InitCceTask");
  512. domi::KernelContext *context = kernel_def->mutable_context();
  513. context->set_is_flowtable(true);
  514. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  515. // KernelTaskInfo::SetFlowtable -> SUCCESS
  516. // rtMalloc -> RT_ERROR_NONE
  517. // rtMemcpy -> RT_ERROR_INVALID_VALUE
  518. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  519. kernel_def->clear_context();
  520. task_def.clear_kernel();
  521. }
  522. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_cce_task_failed7) {
  523. DavinciModel model(0, nullptr);
  524. rtStream_t stream = nullptr;
  525. rtStreamCreate(&stream, 0);
  526. model.stream_list_ = { stream };
  527. model.op_list_[0] = CreateOpDesc("", "");
  528. domi::TaskDef task_def;
  529. KernelTaskInfo kernel_task_info;
  530. kernel_task_info.davinci_model_ = &model;
  531. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  532. // KernelTaskInfo::SetContext -> SUCCESS
  533. kernel_def->set_flowtable("InitCceTask");
  534. domi::KernelContext *context = kernel_def->mutable_context();
  535. context->set_is_flowtable(true);
  536. // KernelTaskInfo::UpdateCceArgs -> SUCCESS
  537. // KernelTaskInfo::SetFlowtable -> SUCCESS
  538. rtSmDesc_t l2CtrlInfo;
  539. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  540. kernel_def->set_sm_desc(&l2CtrlInfo, sizeof(rtSmDesc_t));
  541. // rtMalloc -> RT_ERROR_NONE
  542. // rtMemcpy -> RT_ERROR_NONE
  543. // rtMemAllocManaged -> RT_ERROR_INVALID_VALUE
  544. EXPECT_EQ(kernel_task_info.InitCceTask(*kernel_def), INTERNAL_ERROR);
  545. kernel_def->clear_context();
  546. task_def.clear_kernel();
  547. }
  548. // test SetContext success
  549. TEST_F(UtestKernelTaskInfo, success_kernel_taskInfo_init_set_context) {
  550. DavinciModel model(0, nullptr);
  551. domi::TaskDef task_def;
  552. KernelTaskInfo kernel_task_info;
  553. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  554. domi::KernelContext *context = kernel_def->mutable_context();
  555. context->set_op_id(1);
  556. context->set_kernel_func_id(1);
  557. context->set_is_flowtable(true);
  558. context->set_args_count(1);
  559. context->set_args_offset("args111111", 10);
  560. EXPECT_EQ(kernel_task_info.SetContext(*kernel_def), SUCCESS);
  561. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  562. kernel_def->clear_context();
  563. task_def.clear_kernel();
  564. }
  565. // test SetContext failed
  566. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_set_context_failed1) {
  567. DavinciModel model(0, nullptr);
  568. domi::TaskDef task_def;
  569. KernelTaskInfo kernel_task_info;
  570. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  571. domi::KernelContext *context = kernel_def->mutable_context();
  572. context->set_op_id(1);
  573. context->set_kernel_func_id(1);
  574. context->set_is_flowtable(true);
  575. context->set_args_count(0);
  576. EXPECT_EQ(kernel_task_info.SetContext(*kernel_def), INTERNAL_ERROR);
  577. kernel_def->clear_context();
  578. task_def.clear_kernel();
  579. }
  580. TEST_F(UtestKernelTaskInfo, kernel_taskInfo_init_set_context_failed2) {
  581. DavinciModel model(0, nullptr);
  582. domi::TaskDef task_def;
  583. KernelTaskInfo kernel_task_info;
  584. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  585. domi::KernelContext *context = kernel_def->mutable_context();
  586. context->set_op_id(1);
  587. context->set_kernel_func_id(1);
  588. context->set_is_flowtable(true);
  589. context->set_args_count(5);
  590. context->set_args_offset("\0\0"); // args_offset = 0
  591. EXPECT_EQ(kernel_task_info.SetContext(*kernel_def), PARAM_INVALID);
  592. kernel_def->clear_context();
  593. task_def.clear_kernel();
  594. }
  595. // test UpdateCceArgs success
  596. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_cce_args) {
  597. DavinciModel model(0, nullptr);
  598. rtStream_t stream = nullptr;
  599. rtStreamCreate(&stream, 0);
  600. model.stream_list_ = { stream };
  601. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  602. domi::TaskDef task_def;
  603. KernelTaskInfo kernel_task_info;
  604. kernel_task_info.davinci_model_ = &model;
  605. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  606. domi::KernelContext *context = kernel_def->mutable_context();
  607. string flowtable("InitCceTask");
  608. string sm_desc("args");
  609. uint8_t test = 2;
  610. model.mem_base_ = &test;
  611. model.runtime_param_.logic_mem_base = 0;
  612. model.weights_mem_base_ = &test;
  613. model.runtime_param_.logic_weight_base = 0;
  614. uint8_t test1 = 16;
  615. model.var_mem_base_ = &test1;
  616. model.runtime_param_.logic_var_base = 0;
  617. context->set_is_flowtable(true);
  618. // KernelTaskInfo::CceUpdateKernelArgs ->SUCCESS
  619. EXPECT_EQ(kernel_task_info.UpdateCceArgs(sm_desc, flowtable, *kernel_def), FAILED);
  620. context->clear_is_flowtable();
  621. context->set_is_flowtable(false);
  622. // KernelTaskInfo::CceUpdateKernelArgs ->SUCCESS
  623. EXPECT_EQ(kernel_task_info.UpdateCceArgs(sm_desc, flowtable, *kernel_def), FAILED);
  624. kernel_def->clear_context();
  625. task_def.clear_kernel();
  626. model.mem_base_ = nullptr;
  627. model.weights_mem_base_ = nullptr;
  628. model.var_mem_base_ = nullptr;
  629. }
  630. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_cce_args_failed1) {
  631. DavinciModel model(0, nullptr);
  632. rtStream_t stream = nullptr;
  633. rtStreamCreate(&stream, 0);
  634. model.stream_list_ = { stream };
  635. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  636. domi::TaskDef task_def;
  637. KernelTaskInfo kernel_task_info;
  638. kernel_task_info.davinci_model_ = &model;
  639. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  640. domi::KernelContext *context = kernel_def->mutable_context();
  641. string flowtable("InitCceTask");
  642. string sm_desc("args");
  643. uint8_t test = 2;
  644. model.mem_base_ = &test;
  645. model.runtime_param_.logic_mem_base = 0;
  646. uint8_t test1 = 10;
  647. model.weights_mem_base_ = &test1;
  648. model.runtime_param_.logic_weight_base = 0;
  649. model.var_mem_base_ = &test1;
  650. model.runtime_param_.logic_var_base = 0;
  651. context->set_is_flowtable(true);
  652. // KernelTaskInfo::CceUpdateKernelArgs -> FAILED
  653. EXPECT_EQ(kernel_task_info.UpdateCceArgs(sm_desc, flowtable, *kernel_def), FAILED);
  654. kernel_def->clear_context();
  655. task_def.clear_kernel();
  656. model.mem_base_ = nullptr;
  657. model.weights_mem_base_ = nullptr;
  658. model.var_mem_base_ = nullptr;
  659. }
  660. // test SetFlowtable
  661. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable) {
  662. DavinciModel model(0, nullptr);
  663. rtStream_t stream = nullptr;
  664. rtStreamCreate(&stream, 0);
  665. model.stream_list_ = { stream };
  666. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  667. domi::TaskDef task_def;
  668. KernelTaskInfo kernel_task_info;
  669. kernel_task_info.davinci_model_ = &model;
  670. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  671. domi::KernelContext *context = kernel_def->mutable_context();
  672. string flowtable("InitCceTask");
  673. context->set_is_flowtable(false);
  674. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), SUCCESS);
  675. context->clear_is_flowtable();
  676. context->set_is_flowtable(true);
  677. // rtMalloc ->RT_ERROR_NONE
  678. // rtMemcpy ->RT_ERROR_NONE
  679. kernel_def->set_args("args111111", 10);
  680. context->set_args_offset("\0\0");
  681. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), SUCCESS);
  682. kernel_def->clear_context();
  683. task_def.clear_kernel();
  684. }
  685. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable_failed1) {
  686. DavinciModel model(0, nullptr);
  687. rtStream_t stream = nullptr;
  688. rtStreamCreate(&stream, 0);
  689. model.stream_list_ = { stream };
  690. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  691. domi::TaskDef task_def;
  692. KernelTaskInfo kernel_task_info;
  693. kernel_task_info.davinci_model_ = &model;
  694. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  695. domi::KernelContext *context = kernel_def->mutable_context();
  696. string flowtable("SetFlowtable");
  697. context->set_is_flowtable(true);
  698. // rtMalloc -> RT_ERROR_INVALID_VALUE
  699. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), FAILED);
  700. kernel_def->clear_context();
  701. task_def.clear_kernel();
  702. }
  703. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable_failed2) {
  704. DavinciModel model(0, nullptr);
  705. rtStream_t stream = nullptr;
  706. rtStreamCreate(&stream, 0);
  707. model.stream_list_ = { stream };
  708. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  709. domi::TaskDef task_def;
  710. KernelTaskInfo kernel_task_info;
  711. kernel_task_info.davinci_model_ = &model;
  712. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  713. domi::KernelContext *context = kernel_def->mutable_context();
  714. string flowtable("SetFlowtable");
  715. context->set_is_flowtable(true);
  716. // rtMalloc ->RT_ERROR_NONE
  717. // rtMemcpy ->RT_ERROR_INVALID_VALUE
  718. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), FAILED);
  719. kernel_def->clear_context();
  720. task_def.clear_kernel();
  721. }
  722. TEST_F(UtestKernelTaskInfo, kernel_task_info_set_flowtable_failed3) {
  723. DavinciModel model(0, nullptr);
  724. rtStream_t stream = nullptr;
  725. rtStreamCreate(&stream, 0);
  726. model.stream_list_ = { stream };
  727. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  728. domi::TaskDef task_def;
  729. KernelTaskInfo kernel_task_info;
  730. kernel_task_info.davinci_model_ = &model;
  731. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  732. domi::KernelContext *context = kernel_def->mutable_context();
  733. string flowtable("SetFlowtable");
  734. context->set_is_flowtable(true);
  735. // rtMalloc ->RT_ERROR_NONE
  736. // rtMemcpy ->RT_ERROR_NONE
  737. kernel_def->set_args("args", 4);
  738. context->set_args_offset("args111111", 10);
  739. EXPECT_EQ(kernel_task_info.SetFlowtable(flowtable, *kernel_def), FAILED);
  740. kernel_def->clear_context();
  741. task_def.clear_kernel();
  742. }
  743. TEST_F(UtestKernelTaskInfo, distribute_failed) {
  744. KernelTaskInfo kernel_task_info;
  745. DavinciModel model(0, nullptr);
  746. domi::TaskDef task_def;
  747. // Failed for SetStream
  748. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  749. // rtKernelLaunchWithFlag -> RT_ERROR_INVALID_VALUE
  750. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  751. }
  752. TEST_F(UtestKernelTaskInfo, distribute_success) {
  753. KernelTaskInfo kernel_task_info;
  754. DavinciModel model(0, nullptr);
  755. model.op_list_[0] = CreateOpDesc("FrameworkOp", "FrameworkOp");
  756. domi::TaskDef task_def;
  757. // rtModelGetTaskId -> RT_ERROR_INVALID_VALUE
  758. rtModel_t rt_model_handle = (rtModel_t *)0x12345678;
  759. model.rt_model_handle_ = rt_model_handle;
  760. // Failed for SetStream
  761. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  762. // rtKernelLaunchWithFlag -> RT_ERROR_INVALID_VALUE
  763. EXPECT_EQ(kernel_task_info.Distribute(), SUCCESS);
  764. model.rt_model_handle_ = nullptr;
  765. }
  766. // test success DistributeDumpTask
  767. TEST_F(UtestKernelTaskInfo, success_distribute_dump_task) {
  768. DavinciModel model(0, nullptr);
  769. domi::TaskDef task_def;
  770. KernelTaskInfo kernel_task_info;
  771. kernel_task_info.davinci_model_ = &model;
  772. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  773. kernel_def->set_stub_func("kerneltaskinfo");
  774. kernel_def->set_block_dim(10);
  775. kernel_def->set_args("args111111", 10);
  776. kernel_def->set_args_size(10);
  777. rtSmDesc_t l2CtrlInfo;
  778. l2CtrlInfo.data[0].L2_mirror_addr = 1024;
  779. kernel_def->set_sm_desc((void *)&l2CtrlInfo, sizeof(rtSmDesc_t));
  780. // for SetStream
  781. rtStream_t stream = nullptr;
  782. rtStreamCreate(&stream, 0);
  783. std::vector<rtStream_t> stream_list = { stream };
  784. EXPECT_EQ(kernel_task_info.SetStream(0, stream_list), SUCCESS);
  785. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  786. rtStreamDestroy(stream);
  787. task_def.clear_kernel();
  788. }
  789. // test success GetTaskID
  790. TEST_F(UtestKernelTaskInfo, success_get_task_id) {
  791. domi::ModelTaskDef model_task_def;
  792. domi::TaskDef *task = model_task_def.add_task();
  793. task->set_type(RT_MODEL_TASK_KERNEL);
  794. TaskInfoPtr task_info = TaskInfoFactory::Instance().Create(static_cast<rtModelTaskType_t>(task->type()));
  795. EXPECT_EQ(task_info->GetTaskID(), 0);
  796. KernelTaskInfo kernel_task_info;
  797. EXPECT_EQ(kernel_task_info.GetTaskID(), 0);
  798. HcclTaskInfo hccl_task_info;
  799. EXPECT_EQ(hccl_task_info.GetTaskID(), 0);
  800. }
  801. // test StoreInputOutputTensor success
  802. TEST_F(UtestKernelTaskInfo, success_store_input_output_tensor) {
  803. DavinciModel model(0, nullptr);
  804. domi::TaskDef task_def;
  805. KernelTaskInfo kernel_task_info;
  806. kernel_task_info.davinci_model_ = &model;
  807. std::vector<void *> input_data_addrs;
  808. std::vector<void *> output_data_addrs;
  809. std::vector<::tagCcAICPUTensor> input_descs;
  810. std::vector<::tagCcAICPUTensor> output_descs;
  811. int test = 1;
  812. int *addr = &test;
  813. void *input = addr;
  814. void *output = addr;
  815. input_data_addrs.push_back(input);
  816. output_data_addrs.push_back(output);
  817. tagCcAICPUTensor input_desc;
  818. tagCcAICPUTensor output_desc;
  819. input_descs.push_back(input_desc);
  820. output_descs.push_back(output_desc);
  821. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  822. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  823. }
  824. // test KernelTaskInfo release fail
  825. TEST_F(UtestKernelTaskInfo, fail_release) {
  826. DavinciModel model(0, nullptr);
  827. domi::TaskDef task_def;
  828. KernelTaskInfo kernel_task_info;
  829. kernel_task_info.davinci_model_ = &model;
  830. std::vector<void *> input_data_addrs;
  831. std::vector<void *> output_data_addrs;
  832. std::vector<::tagCcAICPUTensor> input_descs;
  833. std::vector<::tagCcAICPUTensor> output_descs;
  834. int test = 1;
  835. int *addr = &test;
  836. void *input = addr;
  837. void *output = addr;
  838. input_data_addrs.push_back(input);
  839. output_data_addrs.push_back(output);
  840. tagCcAICPUTensor input_desc;
  841. tagCcAICPUTensor output_desc;
  842. input_descs.push_back(input_desc);
  843. output_descs.push_back(output_desc);
  844. EXPECT_EQ(kernel_task_info.StoreInputOutputTensor(input_data_addrs, output_data_addrs, input_descs, output_descs), SUCCESS);
  845. // rtMemFreeManaged -> RT_ERROR_INVALID_VALUE
  846. EXPECT_EQ(kernel_task_info.Release(), SUCCESS);
  847. }
  848. // test KernelTaskInfo release fail
  849. TEST_F(UtestKernelTaskInfo, update_l2data_success) {
  850. DavinciModel model(0, nullptr);
  851. KernelTaskInfo kernel_task_info;
  852. kernel_task_info.davinci_model_ = &model;
  853. domi::KernelDef kernel_def;
  854. EXPECT_EQ(kernel_task_info.UpdateL2Data(kernel_def), SUCCESS);
  855. }
  856. // test fusion_end_task Init
  857. TEST_F(UtestKernelTaskInfo, kernel_task_info_init_success) {
  858. rtStream_t stream = nullptr;
  859. rtStreamCreate(&stream, 0);
  860. DavinciModel model(0, nullptr);
  861. auto model_def = MakeShared<domi::ModelTaskDef>();
  862. model.model_id_ = 1;
  863. model.name_ = "test";
  864. model.version_ = 0x01;
  865. model.stream_list_ = { stream };
  866. model.ge_model_ = MakeShared<GeModel>();
  867. model.ge_model_->SetModelTaskDef(model_def);
  868. auto op_desc = CreateOpDesc("data", DATA);
  869. op_desc->SetInputOffset({1});
  870. op_desc->SetOutputOffset({100});
  871. GeTensorDesc descin(GeShape({1, 1, 1, 1}), FORMAT_NCHW, DT_FLOAT);
  872. TensorUtils::SetSize(descin, 4);
  873. op_desc->AddInputDesc(descin);
  874. GeTensorDesc descout(GeShape({1, 1, 1, 1}), FORMAT_NCHW, DT_FLOAT16);
  875. TensorUtils::SetSize(descout, 32);
  876. op_desc->AddOutputDesc(descout);
  877. op_desc->SetId(0);
  878. model.op_list_[0] = op_desc;
  879. domi::TaskDef task_def;
  880. task_def.set_stream_id(0);
  881. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  882. domi::KernelContext *ctx = kernel_def->mutable_context();
  883. ctx->set_op_index(0);
  884. vector<string> original_op_names = { "conv", "add" };
  885. AttrUtils::GetListStr(op_desc, ATTR_NAME_DATA_DUMP_ORIGIN_OP_NAMES, original_op_names);
  886. KernelTaskInfo kernel_task_info;
  887. EXPECT_EQ(kernel_task_info.Init(task_def, &model), FAILED);
  888. }
  889. TEST_F(UtestKernelTaskInfo, kernel_task_info_calculate_args_te) {
  890. DavinciModel model(0, nullptr);
  891. domi::TaskDef task_def;
  892. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  893. domi::KernelContext *ctx = kernel_def->mutable_context();
  894. ctx->set_kernel_type(2);
  895. KernelTaskInfo kernel_task_info;
  896. EXPECT_EQ(kernel_task_info.CalculateArgs(task_def, &model), SUCCESS);
  897. }
  898. TEST_F(UtestKernelTaskInfo, kernel_task_info_calculate_args_aicpu) {
  899. DavinciModel model(0, nullptr);
  900. domi::TaskDef task_def;
  901. domi::KernelDef *kernel_def = task_def.mutable_kernel();
  902. domi::KernelContext *ctx = kernel_def->mutable_context();
  903. ctx->set_kernel_type(6);
  904. KernelTaskInfo kernel_task_info;
  905. EXPECT_EQ(kernel_task_info.CalculateArgs(task_def, &model), SUCCESS);
  906. }
  907. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_args_te) {
  908. DavinciModel model(0, nullptr);
  909. KernelTaskInfo kernel_task_info;
  910. kernel_task_info.kernel_type_ = ccKernelType::TE;
  911. kernel_task_info.davinci_model_ = &model;
  912. EXPECT_EQ(kernel_task_info.UpdateArgs(), SUCCESS);
  913. }
  914. TEST_F(UtestKernelTaskInfo, kernel_task_info_update_args_aicpu) {
  915. DavinciModel model(0, nullptr);
  916. KernelTaskInfo kernel_task_info;
  917. kernel_task_info.kernel_type_ = ccKernelType::TE;
  918. kernel_task_info.davinci_model_ = &model;
  919. kernel_task_info.args_size_ = 120;
  920. kernel_task_info.args_addr = std::unique_ptr<uint8_t[]>(new (std::nothrow) uint8_t[kernel_task_info.args_size_]);
  921. kernel_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  922. rtMalloc(&kernel_task_info.args_, kernel_task_info.args_size_, RT_MEMORY_HBM);
  923. EXPECT_EQ(kernel_task_info.UpdateArgs(), SUCCESS);
  924. }
  925. TEST_F(UtestKernelTaskInfo, kernel_task_info_super_kernel_info) {
  926. DavinciModel model(0, nullptr);
  927. KernelTaskInfo kernel_task_info;
  928. kernel_task_info.davinci_model_ = &model;
  929. EXPECT_EQ(kernel_task_info.SaveSuperKernelInfo(), SUCCESS);
  930. kernel_task_info.UpdateSKTTaskId();
  931. EXPECT_EQ(kernel_task_info.SKTFinalize(), SUCCESS);
  932. }
  933. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用,用户无需感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。