You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

mem_assigner_unittest.cc 30 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483484485486487488489490491492493494495496497498499500501502503504505506507508509510511512513514515516517518519520521522523524525526527528529530531532533534535536537538539540541542543544545546547548549550551552553554555556557558559560561562563564565566567568569570571572573574575576577578579580581582583584585586587588589590591592593594595596597598599600601602603604605606607608609610611612613614615616617618619620621622623624625626627628629630631632633634635636637638639640641642643644645646647648649650651652653654655656657658659660661662663664665666667668669670
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #include <gtest/gtest.h>
  17. #include <memory>
  18. #include "graph/anchor.h"
  19. #include "graph/attr_value.h"
  20. #include "graph/debug/ge_attr_define.h"
  21. #include "graph/utils/graph_utils.h"
  22. #include "graph/utils/node_utils.h"
  23. #include "graph/utils/op_desc_utils.h"
  24. #include "graph/utils/tensor_utils.h"
  25. #include "omg/omg_inner_types.h"
  26. #include "../passes/graph_builder_utils.h"
  27. #define protected public
  28. #define private public
  29. #include "graph/build/memory/binary_block_mem_assigner.h"
  30. #include "graph/build/memory/graph_mem_assigner.h"
  31. #include "graph/build/memory/hybrid_mem_assigner.h"
  32. #include "graph/build/memory/max_block_mem_assigner.h"
  33. #include "graph/manager/graph_var_manager.h"
  34. #undef protected
  35. #undef private
  36. using namespace std;
  37. using namespace testing;
  38. using namespace ge;
  39. using domi::GetContext;
  40. class UtestMemoryAssignerTest : public testing::Test {
  41. public:
  42. ge::OpDescPtr CreateOpWithWsSize(const string &name, int64_t wsByte, const string &type = "some",
  43. int64_t size = 1024) {
  44. ge::OpDescPtr op_def = make_shared<ge::OpDesc>(name, type);
  45. auto desc_temp_ptr = make_shared<ge::GeTensorDesc>();
  46. auto desc_temp = *desc_temp_ptr;
  47. TensorUtils::SetSize(desc_temp, size);
  48. op_def->AddInputDesc(desc_temp);
  49. op_def->AddOutputDesc(desc_temp);
  50. std::vector<int64_t> workspace_bytes;
  51. workspace_bytes.push_back(wsByte);
  52. op_def->SetWorkspaceBytes(workspace_bytes);
  53. return op_def;
  54. }
  55. ge::OpDescPtr CreateRefOpWithWsSize(const string &name, int64_t wsByte, const string &type = "some") {
  56. ge::OpDescPtr op_def = make_shared<ge::OpDesc>(name, type);
  57. auto desc_temp_ptr = make_shared<ge::GeTensorDesc>();
  58. auto desc_temp = *desc_temp_ptr;
  59. TensorUtils::SetSize(desc_temp, 1024);
  60. op_def->AddInputDesc(desc_temp);
  61. auto desc_output_ptr = make_shared<ge::GeTensorDesc>();
  62. auto desc_output = *desc_output_ptr;
  63. TensorUtils::SetSize(desc_output, 6500);
  64. ge::TensorUtils::SetReuseInput(desc_output, true);
  65. ge::TensorUtils::SetReuseInputIndex(desc_output, 0);
  66. op_def->AddOutputDesc(desc_output);
  67. std::vector<int64_t> workspace_bytes;
  68. workspace_bytes.push_back(wsByte);
  69. op_def->SetWorkspaceBytes(workspace_bytes);
  70. return op_def;
  71. }
  72. void MakeGraph(ge::ComputeGraphPtr &graph, const string &type = "some") {
  73. ge::OpDescPtr op_def_a = CreateOpWithWsSize("A", 6000, type);
  74. op_def_a->SetStreamId(0);
  75. ge::OpDescPtr op_def_b = CreateOpWithWsSize("B", 120000);
  76. op_def_b->SetStreamId(0);
  77. ge::OpDescPtr op_def_c = CreateOpWithWsSize("C", 16000);
  78. op_def_c->SetStreamId(1);
  79. ge::OpDescPtr op_def_d = CreateOpWithWsSize("D", 24000);
  80. op_def_d->SetStreamId(2);
  81. ge::OpDescPtr op_def_e = CreateOpWithWsSize("E", 24000);
  82. op_def_e->SetStreamId(3);
  83. ge::OpDescPtr op_def_f = CreateOpWithWsSize("F", 30000);
  84. op_def_f->SetStreamId(2);
  85. ge::OpDescPtr op_def_g = CreateOpWithWsSize("G", 32000);
  86. op_def_g->SetStreamId(3);
  87. ge::OpDescPtr op_def_h = CreateOpWithWsSize("H", 48000);
  88. op_def_h->SetStreamId(2);
  89. ge::OpDescPtr op_def_i = CreateOpWithWsSize("I", 60000);
  90. op_def_i->SetStreamId(2);
  91. ge::OpDescPtr op_def_j = CreateOpWithWsSize("J", 256000, NETOUTPUT);
  92. op_def_j->SetStreamId(3);
  93. // add node
  94. ge::NodePtr node_a = graph->AddNode(op_def_a);
  95. ge::NodePtr node_b = graph->AddNode(op_def_b);
  96. ge::NodePtr node_c = graph->AddNode(op_def_c);
  97. ge::NodePtr node_d = graph->AddNode(op_def_d);
  98. ge::NodePtr node_e = graph->AddNode(op_def_e);
  99. ge::NodePtr node_f = graph->AddNode(op_def_f);
  100. ge::NodePtr node_g = graph->AddNode(op_def_g);
  101. ge::NodePtr node_h = graph->AddNode(op_def_h);
  102. ge::NodePtr node_i = graph->AddNode(op_def_i);
  103. ge::NodePtr node_j = graph->AddNode(op_def_j);
  104. // add edge
  105. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_b->GetInDataAnchor(0));
  106. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_c->GetInDataAnchor(0));
  107. ge::GraphUtils::AddEdge(node_b->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  108. ge::GraphUtils::AddEdge(node_b->GetOutDataAnchor(0), node_e->GetInDataAnchor(0));
  109. ge::GraphUtils::AddEdge(node_c->GetOutDataAnchor(0), node_g->GetInDataAnchor(0));
  110. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_f->GetInDataAnchor(0));
  111. ge::GraphUtils::AddEdge(node_e->GetOutDataAnchor(0), node_g->GetInDataAnchor(1));
  112. ge::GraphUtils::AddEdge(node_f->GetOutDataAnchor(0), node_h->GetInDataAnchor(0));
  113. ge::GraphUtils::AddEdge(node_g->GetOutDataAnchor(0), node_j->GetInDataAnchor(0));
  114. ge::GraphUtils::AddEdge(node_h->GetOutDataAnchor(0), node_i->GetInDataAnchor(0));
  115. ge::GraphUtils::AddEdge(node_i->GetOutDataAnchor(0), node_j->GetInDataAnchor(1));
  116. GetContext().out_nodes_map["H"] = {0};
  117. GetContext().out_nodes_map["I"] = {0};
  118. GetContext().out_nodes_map["J"] = {0};
  119. graph->TopologicalSorting();
  120. }
  121. void MakeReuseGraph(ge::ComputeGraphPtr graph) {
  122. ge::OpDescPtr op_def_a = CreateOpWithWsSize("A", 6000);
  123. ge::OpDescPtr op_def_b = CreateOpWithWsSize("B", 120000);
  124. ge::OpDescPtr op_def_c = CreateRefOpWithWsSize("C", 120000);
  125. ge::OpDescPtr op_def_d = make_shared<ge::OpDesc>("D", "CONSTANT");
  126. ge::NodePtr node_a = graph->AddNode(op_def_a);
  127. ge::NodePtr node_b = graph->AddNode(op_def_b);
  128. ge::NodePtr node_c = graph->AddNode(op_def_c);
  129. ge::NodePtr node_d = graph->AddNode(op_def_d);
  130. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_b->GetInDataAnchor(0));
  131. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_c->GetInDataAnchor(0));
  132. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  133. GetContext().out_nodes_map["B"] = {0};
  134. GetContext().out_nodes_map["C"] = {0};
  135. graph->TopologicalSorting();
  136. }
  137. ComputeGraphPtr MakeCascadeContinuousMemoryGraph() {
  138. ge::ut::GraphBuilder builder("graph");
  139. auto data = builder.AddNode("data", "Data", 1, 1);
  140. auto addn1 = builder.AddNode("addn1", "AddN", 1, 1);
  141. auto addn2 = builder.AddNode("addn2", "AddN", 1, 1);
  142. auto addn3 = builder.AddNode("addn3", "AddN", 1, 1);
  143. auto concat1 = builder.AddNode("concat1", "Concat", 2, 1);
  144. auto concat2 = builder.AddNode("concat2", "Concat", 2, 1);
  145. auto netoutput = builder.AddNode("netoutput", "NetOutput", 2, 0);
  146. ge::AttrUtils::SetBool(concat1->GetOpDesc(), ATTR_NAME_NOPADDING_CONTINUOUS_INPUT, true);
  147. ge::AttrUtils::SetBool(concat1->GetOpDesc(), ATTR_NAME_CONTINUOUS_INPUT_ALLOC, true);
  148. ge::AttrUtils::SetBool(concat1->GetOpDesc(), ATTR_NAME_OUTPUT_REUSE_INPUT, true);
  149. ge::AttrUtils::SetBool(concat2->GetOpDesc(), ATTR_NAME_NOPADDING_CONTINUOUS_INPUT, true);
  150. ge::AttrUtils::SetBool(concat2->GetOpDesc(), ATTR_NAME_CONTINUOUS_INPUT_ALLOC, true);
  151. ge::AttrUtils::SetBool(concat2->GetOpDesc(), ATTR_NAME_OUTPUT_REUSE_INPUT, true);
  152. addn1->GetOpDesc()->SetOutputOffset({100});
  153. addn2->GetOpDesc()->SetOutputOffset({200});
  154. concat1->GetOpDesc()->SetOutputOffset({100});
  155. addn3->GetOpDesc()->SetOutputOffset({700});
  156. concat2->GetOpDesc()->SetOutputOffset({500});
  157. ge::AttrUtils::SetListInt(addn1->GetOpDesc(), ATTR_NAME_OUTPUT_OFFSET_FOR_BUFFER_FUSION, {100});
  158. ge::AttrUtils::SetListInt(addn2->GetOpDesc(), ATTR_NAME_OUTPUT_OFFSET_FOR_BUFFER_FUSION, {100});
  159. ge::AttrUtils::SetListInt(addn3->GetOpDesc(), ATTR_NAME_OUTPUT_OFFSET_FOR_BUFFER_FUSION, {100});
  160. ge::AttrUtils::SetListInt(concat1->GetOpDesc(), ATTR_NAME_OUTPUT_OFFSET_FOR_BUFFER_FUSION, {200});
  161. ge::AttrUtils::SetListInt(concat2->GetOpDesc(), ATTR_NAME_OUTPUT_OFFSET_FOR_BUFFER_FUSION, {300});
  162. builder.AddDataEdge(data, 0, addn1, 0);
  163. builder.AddDataEdge(data, 0, addn2, 0);
  164. builder.AddDataEdge(addn1, 0, concat1, 0);
  165. builder.AddDataEdge(addn2, 0, concat1, 1);
  166. builder.AddDataEdge(concat1, 0, concat2, 0);
  167. builder.AddDataEdge(addn3, 0, concat2, 1);
  168. return builder.GetGraph();
  169. }
  170. ComputeGraphPtr MakeRefNodeGraph() {
  171. ge::ut::GraphBuilder builder("graph");
  172. auto var_input = builder.AddNode("var", "Variable", 1, 1);
  173. auto const_input = builder.AddNode("const", "Const", 1, 1);
  174. auto assign = builder.AddNode("assgin", "Assign", 2, 1);
  175. // add link
  176. builder.AddDataEdge(var_input, 0, assign, 0);
  177. builder.AddDataEdge(const_input, 0, assign, 1);
  178. // set offset
  179. assign->GetOpDesc()->SetInputOffset({100, 0});
  180. assign->GetOpDesc()->SetOutputOffset({10000});
  181. var_input->GetOpDesc()->SetOutputOffset({10000});
  182. const_input->GetOpDesc()->SetOutputOffset({1000});
  183. // set mem type
  184. ge::AttrUtils::SetListInt(assign->GetOpDesc(), ATTR_NAME_INPUT_MEM_TYPE_LIST, {RT_MEMORY_HBM, RT_MEMORY_L1});
  185. // set ref
  186. auto output_tensordesc = assign->GetOpDesc()->MutableOutputDesc(0);
  187. ge::TensorUtils::SetReuseInput(*output_tensordesc, true);
  188. uint32_t reuse_input_index = 0;
  189. ge::TensorUtils::SetReuseInputIndex(*output_tensordesc, reuse_input_index);
  190. return builder.GetGraph();
  191. }
  192. void MakeFftsReuseGraph(ge::ComputeGraphPtr graph, int32_t thread_scope_id_1 = kInvalidThreadScopeId,
  193. int32_t thread_scope_id_2 = kInvalidThreadScopeId) {
  194. ge::OpDescPtr op_def_a = CreateOpWithWsSize("A", 512);
  195. ge::OpDescPtr op_def_b = CreateOpWithWsSize("B", 0);
  196. ge::OpDescPtr op_def_c = CreateOpWithWsSize("C", 512);
  197. ge::OpDescPtr op_def_d = CreateOpWithWsSize("D", 512);
  198. ge::OpDescPtr op_def_e = CreateOpWithWsSize("E", 0);
  199. ge::OpDescPtr op_def_f = CreateOpWithWsSize("F", 512, "some", 2048UL);
  200. ge::OpDescPtr op_def_g = CreateOpWithWsSize("G", 0);
  201. if (thread_scope_id_1 != kInvalidThreadScopeId) {
  202. (void)ge::AttrUtils::SetInt(op_def_a, ATTR_NAME_THREAD_SCOPE_ID, thread_scope_id_1);
  203. (void)ge::AttrUtils::SetInt(op_def_b, ATTR_NAME_THREAD_SCOPE_ID, thread_scope_id_1);
  204. (void)ge::AttrUtils::SetInt(op_def_c, ATTR_NAME_THREAD_SCOPE_ID, thread_scope_id_1);
  205. }
  206. if (thread_scope_id_2 != kInvalidThreadScopeId) {
  207. (void)ge::AttrUtils::SetInt(op_def_d, ATTR_NAME_THREAD_SCOPE_ID, thread_scope_id_2);
  208. (void)ge::AttrUtils::SetInt(op_def_e, ATTR_NAME_THREAD_SCOPE_ID, thread_scope_id_2);
  209. (void)ge::AttrUtils::SetInt(op_def_f, ATTR_NAME_THREAD_SCOPE_ID, thread_scope_id_2);
  210. }
  211. ge::NodePtr node_a = graph->AddNode(op_def_a);
  212. ge::NodePtr node_b = graph->AddNode(op_def_b);
  213. ge::NodePtr node_c = graph->AddNode(op_def_c);
  214. ge::NodePtr node_d = graph->AddNode(op_def_d);
  215. ge::NodePtr node_e = graph->AddNode(op_def_e);
  216. ge::NodePtr node_f = graph->AddNode(op_def_f);
  217. ge::NodePtr node_g = graph->AddNode(op_def_g);
  218. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_b->GetInDataAnchor(0));
  219. ge::GraphUtils::AddEdge(node_b->GetOutDataAnchor(0), node_c->GetInDataAnchor(0));
  220. ge::GraphUtils::AddEdge(node_c->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  221. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_e->GetInDataAnchor(0));
  222. ge::GraphUtils::AddEdge(node_e->GetOutDataAnchor(0), node_f->GetInDataAnchor(0));
  223. ge::GraphUtils::AddEdge(node_f->GetOutDataAnchor(0), node_g->GetInDataAnchor(0));
  224. graph->TopologicalSorting();
  225. }
  226. void MakeSessionScopeReuseGraph(ge::ComputeGraphPtr graph) {
  227. ge::OpDescPtr op_def_a = CreateOpWithWsSize("A", 512);
  228. ge::OpDescPtr op_def_b = CreateOpWithWsSize("B", 0);
  229. ge::OpDescPtr op_def_c = CreateOpWithWsSize("C", 512);
  230. ge::OpDescPtr op_def_d = CreateOpWithWsSize("D", 512);
  231. ge::OpDescPtr op_def_e = CreateOpWithWsSize("E", 1024);
  232. ge::OpDescPtr op_def_f = CreateOpWithWsSize("F", 512, "some", 2048UL);
  233. ge::OpDescPtr op_def_g = CreateOpWithWsSize("G", 0);
  234. std::vector<int64_t> workspace_bytes;
  235. workspace_bytes.push_back(1024);
  236. workspace_bytes.push_back(512);
  237. op_def_c->SetWorkspaceBytes(workspace_bytes);
  238. vector<int32_t> workspace_no_reuse_scope = { 0 , 1 };
  239. (void)ge::AttrUtils::SetListInt(op_def_c, ATTR_NAME_WORKSPACE_MEMORY_NO_REUSE_SCOPE, workspace_no_reuse_scope);
  240. vector<int32_t> workspace_no_reuse_scope_e = { 1 };
  241. (void)ge::AttrUtils::SetListInt(op_def_e, ATTR_NAME_WORKSPACE_MEMORY_NO_REUSE_SCOPE, workspace_no_reuse_scope_e);
  242. ge::NodePtr node_a = graph->AddNode(op_def_a);
  243. ge::NodePtr node_b = graph->AddNode(op_def_b);
  244. ge::NodePtr node_c = graph->AddNode(op_def_c);
  245. ge::NodePtr node_d = graph->AddNode(op_def_d);
  246. ge::NodePtr node_e = graph->AddNode(op_def_e);
  247. ge::NodePtr node_f = graph->AddNode(op_def_f);
  248. ge::NodePtr node_g = graph->AddNode(op_def_g);
  249. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_b->GetInDataAnchor(0));
  250. ge::GraphUtils::AddEdge(node_b->GetOutDataAnchor(0), node_c->GetInDataAnchor(0));
  251. ge::GraphUtils::AddEdge(node_c->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  252. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_e->GetInDataAnchor(0));
  253. ge::GraphUtils::AddEdge(node_e->GetOutDataAnchor(0), node_f->GetInDataAnchor(0));
  254. ge::GraphUtils::AddEdge(node_f->GetOutDataAnchor(0), node_g->GetInDataAnchor(0));
  255. graph->TopologicalSorting();
  256. }
  257. void MakeContinuousReuseGraph(ge::ComputeGraphPtr graph, bool nopading = false) {
  258. ge::OpDescPtr op_def_a = CreateOpWithWsSize("A", 512);
  259. ge::OpDescPtr op_def_b = CreateOpWithWsSize("B", 0);
  260. ge::OpDescPtr op_def_c = CreateOpWithWsSize("C", 512);
  261. ge::OpDescPtr op_def_d = CreateOpWithWsSize("D", 512);
  262. ge::OpDescPtr op_def_e = CreateOpWithWsSize("E", 1024);
  263. ge::OpDescPtr op_def_f = CreateOpWithWsSize("F", 512, "some", 2048UL);
  264. ge::OpDescPtr op_def_g = CreateOpWithWsSize("G", 0);
  265. if (nopading) {
  266. (void)ge::AttrUtils::SetBool(op_def_d, ATTR_NAME_NOPADDING_CONTINUOUS_INPUT, true);
  267. (void)ge::AttrUtils::SetBool(op_def_d, ATTR_NAME_NOPADDING_CONTINUOUS_OUTPUT, true);
  268. (void)ge::AttrUtils::SetBool(op_def_d, ATTR_NAME_OUTPUT_REUSE_INPUT, true);
  269. (void)ge::AttrUtils::SetInt(op_def_d, ATTR_NAME_REUSE_INPUT_ON_DIM_INDEX, 0);
  270. } else {
  271. (void)ge::AttrUtils::SetBool(op_def_d, ATTR_NAME_CONTINUOUS_INPUT, true);
  272. (void)ge::AttrUtils::SetBool(op_def_d, ATTR_NAME_CONTINUOUS_OUTPUT, true);
  273. }
  274. ge::NodePtr node_a = graph->AddNode(op_def_a);
  275. ge::NodePtr node_b = graph->AddNode(op_def_b);
  276. ge::NodePtr node_c = graph->AddNode(op_def_c);
  277. ge::NodePtr node_d = graph->AddNode(op_def_d);
  278. ge::NodePtr node_e = graph->AddNode(op_def_e);
  279. ge::NodePtr node_f = graph->AddNode(op_def_f);
  280. ge::NodePtr node_g = graph->AddNode(op_def_g);
  281. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  282. ge::GraphUtils::AddEdge(node_b->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  283. ge::GraphUtils::AddEdge(node_c->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  284. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_e->GetInDataAnchor(0));
  285. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_f->GetInDataAnchor(0));
  286. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_g->GetInDataAnchor(0));
  287. graph->TopologicalSorting();
  288. }
  289. void MakeMultiBatchReuseGraph(ge::ComputeGraphPtr graph) {
  290. ge::OpDescPtr op_def_a = CreateOpWithWsSize("A", 512);
  291. ge::OpDescPtr op_def_b = CreateOpWithWsSize("B", 0);
  292. ge::OpDescPtr op_def_c = CreateOpWithWsSize("C", 512);
  293. ge::OpDescPtr op_def_d = CreateOpWithWsSize("D", 512);
  294. ge::OpDescPtr op_def_e = CreateOpWithWsSize("E", 1024);
  295. ge::OpDescPtr op_def_f = CreateOpWithWsSize("F", 512, "some", 2048UL);
  296. ge::OpDescPtr op_def_g = CreateOpWithWsSize("G", 0);
  297. (void)ge::AttrUtils::SetStr(op_def_b, ATTR_NAME_BATCH_LABEL, "Batch_0");
  298. (void)ge::AttrUtils::SetStr(op_def_c, ATTR_NAME_BATCH_LABEL, "Batch_0");
  299. (void)ge::AttrUtils::SetStr(op_def_e, ATTR_NAME_BATCH_LABEL, "Batch_1");
  300. (void)ge::AttrUtils::SetStr(op_def_f, ATTR_NAME_BATCH_LABEL, "Batch_1");
  301. vector<int32_t> workspace_no_reuse_scope = { 1 };
  302. (void)ge::AttrUtils::SetListInt(op_def_c, ATTR_NAME_WORKSPACE_MEMORY_NO_REUSE_SCOPE, workspace_no_reuse_scope);
  303. (void)ge::AttrUtils::SetListInt(op_def_e, ATTR_NAME_WORKSPACE_MEMORY_NO_REUSE_SCOPE, workspace_no_reuse_scope);
  304. ge::NodePtr node_a = graph->AddNode(op_def_a);
  305. ge::NodePtr node_b = graph->AddNode(op_def_b);
  306. ge::NodePtr node_c = graph->AddNode(op_def_c);
  307. ge::NodePtr node_d = graph->AddNode(op_def_d);
  308. ge::NodePtr node_e = graph->AddNode(op_def_e);
  309. ge::NodePtr node_f = graph->AddNode(op_def_f);
  310. ge::NodePtr node_g = graph->AddNode(op_def_g);
  311. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_b->GetInDataAnchor(0));
  312. ge::GraphUtils::AddEdge(node_b->GetOutDataAnchor(0), node_c->GetInDataAnchor(0));
  313. ge::GraphUtils::AddEdge(node_c->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  314. ge::GraphUtils::AddEdge(node_a->GetOutDataAnchor(0), node_e->GetInDataAnchor(0));
  315. ge::GraphUtils::AddEdge(node_e->GetOutDataAnchor(0), node_f->GetInDataAnchor(0));
  316. ge::GraphUtils::AddEdge(node_f->GetOutDataAnchor(0), node_d->GetInDataAnchor(0));
  317. ge::GraphUtils::AddEdge(node_d->GetOutDataAnchor(0), node_g->GetInDataAnchor(0));
  318. graph->TopologicalSorting();
  319. }
  320. protected:
  321. void SetUp() {}
  322. void TearDown() { GetContext().out_nodes_map.clear(); }
  323. };
  324. namespace ge {
  325. class MockBlockMemAssigner : public BlockMemAssigner {
  326. public:
  327. explicit MockBlockMemAssigner(ge::ComputeGraphPtr compute_graph, const std::map<std::string, std::string> &anchor_to_symbol, const std::map<std::string, std::list<NodeIndexIO>> &symbol_to_anchors) : BlockMemAssigner(compute_graph, anchor_to_symbol, symbol_to_anchors) {};
  328. virtual ~MockBlockMemAssigner(){};
  329. Status GetMemoryRanges(std::vector<int64_t> &ranges) override { return FAILED; }
  330. };
  331. } // namespace ge
  332. // when check GetMemoryRanges return fail, Assign return fail
  333. TEST_F(UtestMemoryAssignerTest, Mock_block_mem_assigner_failed) {
  334. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  335. MakeGraph(graph);
  336. std::map<std::string, std::string> anchor_to_symbol;
  337. std::map<std::string, std::list<NodeIndexIO>> symbol_to_anchors;
  338. EXPECT_EQ(GraphUtils::GetRefMapping(graph, symbol_to_anchors, anchor_to_symbol), GRAPH_SUCCESS);
  339. MockBlockMemAssigner mock_assigner(graph, anchor_to_symbol, symbol_to_anchors);
  340. EXPECT_EQ(mock_assigner.Assign(), FAILED);
  341. }
  342. TEST_F(UtestMemoryAssignerTest, graph_memory_assign_continuous_input) {
  343. ge::ComputeGraphPtr graph = MakeCascadeContinuousMemoryGraph();
  344. auto addn1 = graph->FindNode("addn1");
  345. auto addn2 = graph->FindNode("addn2");
  346. EXPECT_EQ(addn1->GetOpDesc()->GetOutputOffset()[0], 100);
  347. EXPECT_EQ(addn2->GetOpDesc()->GetOutputOffset()[0], 200);
  348. GraphMemoryAssigner memoryAssigner(graph);
  349. MemoryOffset memory_offset(RT_MEMORY_HBM, 0);
  350. memoryAssigner.memory_offset_.emplace(RT_MEMORY_HBM, memory_offset);
  351. EXPECT_EQ(memoryAssigner.ReAssignContinuousMemory(false), GRAPH_SUCCESS);
  352. EXPECT_EQ(addn1->GetOpDesc()->GetOutputOffset()[0], 500);
  353. EXPECT_EQ(addn2->GetOpDesc()->GetOutputOffset()[0], 600);
  354. }
  355. TEST_F(UtestMemoryAssignerTest, block_memory_assign_nopading_continuous_memory) {
  356. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  357. MakeContinuousReuseGraph(graph, true);
  358. HybridMemAssigner hybridMemAssigner(graph);
  359. ge::Status ret = hybridMemAssigner.Assign();
  360. size_t offset = 0;
  361. auto it = hybridMemAssigner.GetMemOffsets().find(RT_MEMORY_HBM);
  362. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  363. offset = it->second;
  364. }
  365. EXPECT_EQ(offset, 8192);
  366. EXPECT_EQ(ret, SUCCESS);
  367. }
  368. TEST_F(UtestMemoryAssignerTest, block_memory_assign_continuous_memory) {
  369. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  370. MakeContinuousReuseGraph(graph);
  371. map<uint64_t, size_t> mem_offset;
  372. size_t zero_copy_mem_size = 0;
  373. MemoryAssigner memoryAssigner(graph);
  374. ge::Status ret = memoryAssigner.AssignMemory(false, mem_offset, zero_copy_mem_size);
  375. size_t offset = 0;
  376. auto it = mem_offset.find(RT_MEMORY_HBM);
  377. if (it != mem_offset.end()) {
  378. offset = it->second;
  379. }
  380. EXPECT_EQ(offset, 11264);
  381. EXPECT_EQ(ret, SUCCESS);
  382. }
  383. TEST_F(UtestMemoryAssignerTest, graph_memory_set_last_used_attr) {
  384. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  385. MakeGraph(graph);
  386. auto node_f = graph->FindNode("F");
  387. MemoryAssigner memory_assigner(graph);
  388. map<uint64_t, size_t> mem_offset;
  389. size_t zero_memory_size = 0;
  390. EXPECT_EQ(memory_assigner.AssignMemory(false, mem_offset, zero_memory_size), GRAPH_SUCCESS);
  391. bool flag = 0;
  392. (void) ge::AttrUtils::GetBool(node_f->GetOpDesc()->GetInputDesc(0), ATTR_NAME_IS_END_OF_INPUTMEM_LIFECYCLE, flag);
  393. EXPECT_EQ(flag, true);
  394. }
  395. TEST_F(UtestMemoryAssignerTest, graph_memory_assign_ref_var) {
  396. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  397. MakeGraph(graph, VARIABLE);
  398. auto node_a = graph->FindNode("A");
  399. auto node_b = graph->FindNode("B");
  400. std::string value = "A";
  401. (void) ge::AttrUtils::SetStr(node_b->GetOpDesc()->MutableOutputDesc(0), REF_VAR_SRC_VAR_NAME, value);
  402. MemoryAssigner memory_assigner(graph);
  403. map<uint64_t, size_t> mem_offset;
  404. size_t zero_memory_size = 0;
  405. VarManager::Instance(0)->Init(0, 0, 0, 0);
  406. EXPECT_EQ(memory_assigner.AssignMemory(false, mem_offset, zero_memory_size), GRAPH_SUCCESS);
  407. EXPECT_EQ(node_b->GetOpDesc()->GetOutputOffset()[0], node_a->GetOpDesc()->GetOutputOffset()[0]);
  408. }
  409. TEST_F(UtestMemoryAssignerTest, graph_memory_assign_ref_var_not_found) {
  410. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  411. MakeGraph(graph, VARIABLE);
  412. ge::ComputeGraphPtr sub_graph = make_shared<ge::ComputeGraph>("");
  413. MakeReuseGraph(sub_graph);
  414. graph->AddSubGraph(sub_graph);
  415. auto node_a = graph->FindNode("A");
  416. auto node_b = graph->FindNode("B");
  417. std::string value = "M";
  418. (void) ge::AttrUtils::SetStr(node_b->GetOpDesc()->MutableOutputDesc(0), REF_VAR_SRC_VAR_NAME, value);
  419. MemoryAssigner memory_assigner(graph);
  420. map<uint64_t, size_t> mem_offset;
  421. size_t zero_memory_size = 0;
  422. VarManager::Instance(0)->Init(0, 0, 0, 0);
  423. EXPECT_NE(memory_assigner.AssignMemory(false, mem_offset, zero_memory_size), GRAPH_SUCCESS);
  424. }
  425. TEST_F(UtestMemoryAssignerTest, graph_memory_assign_set_input_offset) {
  426. ge::ComputeGraphPtr graph = MakeRefNodeGraph();
  427. auto assgin = graph->FindNode("assgin");
  428. EXPECT_EQ(assgin->GetOpDesc()->GetOutputOffset()[0], 10000);
  429. EXPECT_EQ(assgin->GetOpDesc()->GetInputOffset()[0], 100);
  430. EXPECT_EQ(assgin->GetOpDesc()->GetInputOffset()[1], 0);
  431. GraphMemoryAssigner memoryAssigner(graph);
  432. MemoryOffset memory_offset(RT_MEMORY_HBM, 0);
  433. memoryAssigner.memory_offset_.emplace(RT_MEMORY_HBM, memory_offset);
  434. EXPECT_EQ(memoryAssigner.SetInputOffset(), GRAPH_SUCCESS);
  435. EXPECT_EQ(assgin->GetOpDesc()->GetOutputOffset()[0], 10100);
  436. EXPECT_EQ(assgin->GetOpDesc()->GetInputOffset()[0], 10100);
  437. EXPECT_EQ(assgin->GetOpDesc()->GetInputOffset()[1], 0);
  438. EXPECT_EQ(memoryAssigner.CheckOffset(), GRAPH_SUCCESS);
  439. }
  440. TEST_F(UtestMemoryAssignerTest, graph_memory_assign_update_ref_op_offset_reverse) {
  441. ge::ut::GraphBuilder builder("graph");
  442. auto data_input = builder.AddNode("data", "Data", 1, 1);
  443. auto const_input = builder.AddNode("const", "Const", 1, 1);
  444. auto add = builder.AddNode("add", "Add", 2, 1);
  445. // add link
  446. builder.AddDataEdge(data_input, 0, add, 0);
  447. builder.AddDataEdge(const_input, 0, add, 1);
  448. // set ref
  449. uint32_t reuse_input_index = 0;
  450. auto output_tensordesc = data_input->GetOpDesc()->MutableOutputDesc(0);
  451. ge::TensorUtils::SetReuseInput(*output_tensordesc, true);
  452. ge::TensorUtils::SetReuseInputIndex(*output_tensordesc, reuse_input_index);
  453. auto output_tensordesc1 = add->GetOpDesc()->MutableOutputDesc(0);
  454. ge::TensorUtils::SetReuseInput(*output_tensordesc1, true);
  455. ge::TensorUtils::SetReuseInputIndex(*output_tensordesc1, reuse_input_index);
  456. ge::ComputeGraphPtr graph = builder.GetGraph();
  457. GraphMemoryAssigner memoryAssigner(graph);
  458. EXPECT_EQ(memoryAssigner.UpdateRefOpOffsetReverse(add), SUCCESS);
  459. }
  460. TEST_F(UtestMemoryAssignerTest, graph_memory_assign_atomic_output_and_workspace) {
  461. ge::ut::GraphBuilder builder("graph");
  462. auto data_input = builder.AddNode("data", "Data", 1, 1);
  463. auto const_input = builder.AddNode("const", "Const", 1, 1);
  464. auto add = builder.AddNode("add", "Add", 2, 1);
  465. // add link
  466. builder.AddDataEdge(data_input, 0, add, 0);
  467. builder.AddDataEdge(const_input, 0, add, 1);
  468. ge::ComputeGraphPtr graph = builder.GetGraph();
  469. auto node = graph->FindNode("add");
  470. EXPECT_NE(node, nullptr);
  471. auto output_tensor_desc = node->GetOpDesc()->MutableOutputDesc(0);
  472. ge::TensorUtils::SetSize(*output_tensor_desc, 100);
  473. vector<int64_t> output_list = {0};
  474. node->GetOpDesc()->SetOutputOffset(output_list);
  475. vector<int64_t> workspace_list = {0};
  476. node->GetOpDesc()->SetWorkspace(workspace_list);
  477. vector<int64_t> atomic_output_index = {0};
  478. bool set_attr = ge::AttrUtils::SetListInt(node->GetOpDesc(), ATOMIC_ATTR_OUTPUT_INDEX, atomic_output_index);
  479. EXPECT_EQ(set_attr, true);
  480. map<string, map<int64_t, int64_t>> workspace_info;
  481. workspace_info["add"][0] = 100;
  482. set_attr = node->GetOpDesc()->SetExtAttr(EXT_ATTR_ATOMIC_WORKSPACE_INFO, workspace_info);
  483. EXPECT_EQ(set_attr, true);
  484. {
  485. bool is_fusion_node = false;
  486. set_attr = ge::AttrUtils::SetBool(node->GetOpDesc(), ATOMIC_ATTR_IS_FUSION_NODE, is_fusion_node);
  487. EXPECT_EQ(set_attr, true);
  488. GraphMemoryAssigner graph_memory_assigner(graph);
  489. graph_memory_assigner.memory_offset_.insert({RT_MEMORY_HBM, MemoryOffset(RT_MEMORY_HBM, 0)});
  490. vector<int64_t> mem_offset_end;
  491. Status ret = graph_memory_assigner.AssignAtomicOutputAndWorkspaceMemory(node, mem_offset_end);
  492. EXPECT_EQ(ret, SUCCESS);
  493. EXPECT_EQ(mem_offset_end.size(), 2);
  494. MemoryOffset mem_offset = graph_memory_assigner.memory_offset_.at(RT_MEMORY_HBM);
  495. EXPECT_EQ(mem_offset.mem_offset_, 1024);
  496. }
  497. {
  498. bool is_fusion_node = true;
  499. set_attr = ge::AttrUtils::SetBool(node->GetOpDesc(), ATOMIC_ATTR_IS_FUSION_NODE, is_fusion_node);
  500. EXPECT_EQ(set_attr, true);
  501. GraphMemoryAssigner graph_memory_assigner(graph);
  502. graph_memory_assigner.memory_offset_.insert({RT_MEMORY_HBM, MemoryOffset(RT_MEMORY_HBM, 0)});
  503. vector<int64_t> mem_offset_end;
  504. Status ret = graph_memory_assigner.AssignAtomicOutputAndWorkspaceMemory(node, mem_offset_end);
  505. EXPECT_EQ(ret, SUCCESS);
  506. EXPECT_EQ(mem_offset_end.size(), 2);
  507. MemoryOffset mem_offset = graph_memory_assigner.memory_offset_.at(RT_MEMORY_HBM);
  508. EXPECT_EQ(mem_offset.mem_offset_, 1024);
  509. }
  510. }
  511. TEST_F(UtestMemoryAssignerTest, Mock_ffts_reuse_no_functinon_op) {
  512. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  513. MakeFftsReuseGraph(graph, kInvalidThreadScopeId, kInvalidThreadScopeId);
  514. HybridMemAssigner hybridMemAssigner(graph);
  515. ge::Status ret = hybridMemAssigner.Assign();
  516. size_t offset = 0;
  517. auto it = hybridMemAssigner.GetMemOffsets().find(RT_MEMORY_HBM);
  518. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  519. offset = it->second;
  520. }
  521. EXPECT_EQ(offset, 5120);
  522. EXPECT_EQ(ret, SUCCESS);
  523. }
  524. TEST_F(UtestMemoryAssignerTest, Mock_ffts_reuse_two_functinon_op) {
  525. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  526. MakeFftsReuseGraph(graph, 0, 1);
  527. HybridMemAssigner hybridMemAssigner(graph);
  528. ge::Status ret = hybridMemAssigner.Assign();
  529. size_t offset = 0;
  530. auto it = hybridMemAssigner.GetMemOffsets().find(RT_MEMORY_HBM);
  531. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  532. offset = it->second;
  533. }
  534. EXPECT_EQ(offset, 6656);
  535. EXPECT_EQ(ret, SUCCESS);
  536. }
  537. TEST_F(UtestMemoryAssignerTest, Mock_ffts_reuse_one_functinon_op) {
  538. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  539. MakeFftsReuseGraph(graph, 0, kInvalidThreadScopeId);
  540. HybridMemAssigner hybridMemAssigner(graph);
  541. ge::Status ret = hybridMemAssigner.Assign();
  542. size_t offset = 0;
  543. auto it = hybridMemAssigner.GetMemOffsets().find(RT_MEMORY_HBM);
  544. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  545. offset = it->second;
  546. }
  547. EXPECT_EQ(offset, 5632);
  548. EXPECT_EQ(ret, SUCCESS);
  549. }
  550. TEST_F(UtestMemoryAssignerTest, one_session_scope_op) {
  551. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  552. MakeSessionScopeReuseGraph(graph);
  553. HybridMemAssigner hybridMemAssigner(graph);
  554. ge::Status ret = hybridMemAssigner.Assign();
  555. size_t offset = 0;
  556. auto it = hybridMemAssigner.GetMemOffsets().find(RT_MEMORY_HBM);
  557. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  558. offset = it->second;
  559. }
  560. auto mem_type_session_scope = (kSessionScopeMemory | RT_MEMORY_HBM);
  561. size_t session_scope_offset = 0;
  562. it = hybridMemAssigner.GetMemOffsets().find(mem_type_session_scope);
  563. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  564. session_scope_offset = it->second;
  565. }
  566. EXPECT_EQ(offset, 5120);
  567. EXPECT_EQ(session_scope_offset, 1536);
  568. EXPECT_EQ(ret, SUCCESS);
  569. }
  570. TEST_F(UtestMemoryAssignerTest, multi_batch_reuse) {
  571. ge::ComputeGraphPtr graph = make_shared<ge::ComputeGraph>("");
  572. MakeMultiBatchReuseGraph(graph);
  573. HybridMemAssigner hybridMemAssigner(graph);
  574. ge::Status ret = hybridMemAssigner.Assign();
  575. size_t offset = 0;
  576. auto it = hybridMemAssigner.GetMemOffsets().find(RT_MEMORY_HBM);
  577. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  578. offset = it->second;
  579. }
  580. auto mem_type_session_scope = (kSessionScopeMemory | RT_MEMORY_HBM);
  581. size_t session_scope_offset = 0;
  582. it = hybridMemAssigner.GetMemOffsets().find(mem_type_session_scope);
  583. if (it != hybridMemAssigner.GetMemOffsets().end()) {
  584. session_scope_offset = it->second;
  585. }
  586. EXPECT_EQ(offset, 6656);
  587. EXPECT_EQ(session_scope_offset, 1536);
  588. EXPECT_EQ(ret, SUCCESS);
  589. }

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示