You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

ffts_task_info_unittest.cc 9.2 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212
  1. /**
  2. * Copyright 2021 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <gtest/gtest.h>
  17. #define private public
  18. #define protected public
  19. #include "graph/load/model_manager/task_info/ffts_task_info.h"
  20. #include "cce/aicpu_engine_struct.h"
  21. #include "common/ge/ge_util.h"
  22. #include "common/properties_manager.h"
  23. #include "framework/common/debug/ge_log.h"
  24. #include "framework/common/fmk_error_codes.h"
  25. #include "graph/attr_value.h"
  26. #include "graph/load/model_manager/davinci_model.h"
  27. #include "graph/load/model_manager/model_manager.h"
  28. #include "runtime/rt_ffts.h"
  29. namespace ge {
  30. extern OpDescPtr CreateOpDesc(string name, string type);
  31. class UtestFftsTaskInfo : public testing::Test {
  32. protected:
  33. void SetUp() {}
  34. void TearDown() {}
  35. public:
  36. void CreateFftsTaskInfo(DavinciModel &davinci_model, domi::TaskDef &task_def, FftsTaskInfo &ffts_task_info) {
  37. rtStream_t stream = nullptr;
  38. rtStreamCreate(&stream, 0);
  39. davinci_model.stream_list_ = { stream };
  40. task_def.set_stream_id(0);
  41. domi::FftsTaskDef *ffts_task_def = task_def.mutable_ffts_task();
  42. davinci_model.op_list_[0] = CreateOpDesc("test", PARTITIONEDCALL);
  43. ffts_task_def->set_op_index(0);
  44. ffts_task_def->set_addr_size(2);
  45. domi::FftsDescInfoDef *ffts_desc = ffts_task_def->mutable_ffts_desc();
  46. ffts_desc->set_tm(0);
  47. rtFftsTaskInfo_t sub_task_info;
  48. ffts_task_info.sub_task_info_ = sub_task_info;
  49. ffts_task_def->set_ffts_type(RT_FFTS_TYPE_AUTO_THREAD);
  50. }
  51. };
  52. // test FftsTaskInfo Init with no subtask and no ticket cache
  53. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_without_subtask) {
  54. DavinciModel davinci_model(0, nullptr);
  55. rtStream_t stream = nullptr;
  56. rtStreamCreate(&stream, 0);
  57. davinci_model.stream_list_ = { stream };
  58. domi::TaskDef task_def;
  59. task_def.set_stream_id(0);
  60. domi::FftsTaskDef *ffts_task_def = task_def.mutable_ffts_task();
  61. FftsTaskInfo ffts_task_info;
  62. // init failed when model without op_desc
  63. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), PARAM_INVALID);
  64. davinci_model.op_list_[0] = CreateOpDesc("test", PARTITIONEDCALL);
  65. ffts_task_def->set_op_index(0);
  66. ffts_task_def->set_addr_size(2);
  67. domi::FftsDescInfoDef *ffts_desc = ffts_task_def->mutable_ffts_desc();
  68. ffts_desc->set_tm(0);
  69. rtFftsTaskInfo_t sub_task_info;
  70. ffts_task_info.sub_task_info_ = sub_task_info;
  71. ffts_task_def->set_ffts_type(RT_FFTS_TYPE_AUTO_THREAD);
  72. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  73. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), SUCCESS);
  74. }
  75. // test FftsTaskInfo Init with subtask and no ticket cache: AutoThreadAicAivDef
  76. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_with_auto_thread_subgraph) {
  77. DavinciModel davinci_model(0, nullptr);
  78. domi::TaskDef task_def;
  79. FftsTaskInfo ffts_task_info;
  80. CreateFftsTaskInfo(davinci_model, task_def, ffts_task_info);
  81. domi::FftsSubTaskDef *ffts_sub_task_def = task_def.mutable_ffts_task()->add_sub_task();
  82. ffts_sub_task_def->set_thread_dim(static_cast<uint32_t>(1));
  83. //sub_task_def.has_auto_thread_aic_aiv() == sub_task_def.has_manual_thread_aic_aiv()
  84. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), FAILED);
  85. domi::AutoThreadAicAivDef *auto_thread_aic_aiv_def = ffts_sub_task_def->mutable_auto_thread_aic_aiv();
  86. domi::AutoThreadPrefetchDef *src_prefetch = auto_thread_aic_aiv_def->add_src_prefetch();
  87. // without InitIoAddrs
  88. ffts_task_info.thread_dim_ = 0;
  89. RuntimeParam runtime_param;
  90. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  91. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), SUCCESS);
  92. }
  93. // test FftsTaskInfo Init with subtask and no ticket cache: ManualThreadAicAivDef
  94. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_with_manual_thread_subgraph) {
  95. DavinciModel davinci_model(0, nullptr);
  96. domi::TaskDef task_def;
  97. FftsTaskInfo ffts_task_info;
  98. CreateFftsTaskInfo(davinci_model, task_def, ffts_task_info);
  99. domi::FftsSubTaskDef *ffts_sub_task_def = task_def.mutable_ffts_task()->add_sub_task();
  100. ffts_sub_task_def->set_thread_dim(static_cast<uint32_t>(1));
  101. //sub_task_def.has_auto_thread_aic_aiv() == sub_task_def.has_manual_thread_aic_aiv()
  102. domi::ManualThreadAicAivDef *manual_thread_aic_aiv_def = ffts_sub_task_def->mutable_manual_thread_aic_aiv();
  103. manual_thread_aic_aiv_def->add_thread_prefetch_dmu_idx(static_cast<uint32_t>(0));
  104. manual_thread_aic_aiv_def->add_thread_blk_dim(static_cast<uint32_t>(0));
  105. manual_thread_aic_aiv_def->add_thread_task_func_stub("ffts");
  106. domi::ManualThreadDmuDef *prefetch_list = manual_thread_aic_aiv_def->add_prefetch_list();
  107. prefetch_list->set_data_addr(static_cast<uint64_t>(0));
  108. // without InitIoAddrs
  109. ffts_task_info.thread_dim_ = 0;
  110. RuntimeParam runtime_param;
  111. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  112. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), SUCCESS);
  113. }
  114. // test FftsTaskInfo Init with subtask and no ticket cache: ManualThreadNopDef
  115. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_with_manual_thread_nop_subgraph) {
  116. DavinciModel davinci_model(0, nullptr);
  117. domi::TaskDef task_def;
  118. FftsTaskInfo ffts_task_info;
  119. CreateFftsTaskInfo(davinci_model, task_def, ffts_task_info);
  120. domi::FftsSubTaskDef *ffts_sub_task_def = task_def.mutable_ffts_task()->add_sub_task();
  121. ffts_sub_task_def->set_thread_dim(static_cast<uint32_t>(1));
  122. domi::AutoThreadAicAivDef *auto_thread_aic_aiv_def = ffts_sub_task_def->mutable_auto_thread_aic_aiv();
  123. domi::ManualThreadNopDef *manual_thread_nop = ffts_sub_task_def->mutable_manual_thread_nop();
  124. domi::ManualThreadDependencyDef *src_dep_tbl = manual_thread_nop->add_src_dep_tbl();
  125. src_dep_tbl->add_dependency(static_cast<uint32_t>(0));
  126. // without InitIoAddrs
  127. ffts_task_info.thread_dim_ = 0;
  128. RuntimeParam runtime_param;
  129. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  130. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), SUCCESS);
  131. }
  132. // test FftsTaskInfo Init with no subtask and ticket cache:AutoThreadCacheDef
  133. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_with_auto_thread_ticket_cache) {
  134. DavinciModel davinci_model(0, nullptr);
  135. domi::TaskDef task_def;
  136. FftsTaskInfo ffts_task_info;
  137. CreateFftsTaskInfo(davinci_model, task_def, ffts_task_info);
  138. domi::TicketCacheDef *ticket_cache_def = task_def.mutable_ffts_task()->add_ticket_cache();
  139. //ticket_cache_def.has_auto_thread_cache() == ticket_cache_def.has_manual_thread_cache()
  140. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), FAILED);
  141. domi::AutoThreadCacheDef *auto_thread_cache = ticket_cache_def->mutable_auto_thread_cache();
  142. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  143. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), SUCCESS);
  144. }
  145. // test FftsTaskInfo Init with no subtask and ticket cache:ManualThreadCacheDef
  146. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_with_manual_thread_ticket_cache) {
  147. DavinciModel davinci_model(0, nullptr);
  148. domi::TaskDef task_def;
  149. FftsTaskInfo ffts_task_info;
  150. CreateFftsTaskInfo(davinci_model, task_def, ffts_task_info);
  151. domi::TicketCacheDef *ticket_cache_def = task_def.mutable_ffts_task()->add_ticket_cache();
  152. domi::ManualThreadCacheDef *manual_thread_cache = ticket_cache_def->mutable_manual_thread_cache();
  153. manual_thread_cache->add_slice_dmu_idx(static_cast<uint32_t>(0));
  154. manual_thread_cache->add_ticket_cache_ref_cnt_tbl(static_cast<uint32_t>(0));
  155. domi::ManualThreadDmuDef *dmu_list = manual_thread_cache->add_dmu_list();
  156. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  157. EXPECT_EQ(ffts_task_info.Init(task_def, &davinci_model), SUCCESS);
  158. }
  159. // test FftsTaskInfo UpdateArgs
  160. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_update_args) {
  161. DavinciModel davinci_model(0, nullptr);
  162. FftsTaskInfo ffts_task_info;
  163. ffts_task_info.davinci_model_ = &davinci_model;
  164. ffts_task_info.io_addrs_ = { (void*)0x12345678, (void*)0x22345678 };
  165. EXPECT_EQ(ffts_task_info.UpdateArgs(), SUCCESS);
  166. }
  167. // test FftsTaskInfo CalculateArgs
  168. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_calculate_args) {
  169. DavinciModel davinci_model(0, nullptr);
  170. domi::TaskDef task_def;
  171. FftsTaskInfo ffts_task_info;
  172. EXPECT_EQ(ffts_task_info.CalculateArgs(task_def, &davinci_model), SUCCESS);
  173. }
  174. // test FftsTaskInfo Distribute
  175. TEST_F(UtestFftsTaskInfo, success_ffts_task_info_distribute) {
  176. DavinciModel davinci_model(0, nullptr);
  177. FftsTaskInfo ffts_task_info;
  178. rtFftsTaskInfo_t sub_task_info;
  179. ffts_task_info.sub_task_info_ = sub_task_info;
  180. rtStream_t stream = nullptr;
  181. rtStreamCreate(&stream, 0);
  182. ffts_task_info.stream_ = stream;
  183. EXPECT_EQ(ffts_task_info.Distribute(), SUCCESS);
  184. }
  185. } // namespace ge

图引擎模块(GE)是MindSpore的一个子模块，其代码由C++实现，位于前端模块ME和底层硬件之间，起到承接作用。图引擎模块以ME下发的图作为输入，然后进行一系列的深度图优化操作，最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点，做了特定的优化工作，以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时，GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成，详细的架构图如下所示。