You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

compute_graph.h 12 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef INC_GRAPH_COMPUTE_GRAPH_H_
  17. #define INC_GRAPH_COMPUTE_GRAPH_H_
  18. #include <map>
  19. #include <memory>
  20. #include <string>
  21. #include <utility>
  22. #include <vector>
  23. #include <deque>
  24. #include "detail/attributes_holder.h"
  25. #include "graph/anchor.h"
  26. #include "graph/node.h"
  27. #include "graph/op_desc.h"
  28. #include "graph/range_vistor.h"
  29. namespace ge {
  // Forward declarations of the graph types referenced by this header, each paired
  // with the shared-pointer alias used throughout the interface below.
  class Node;
  using NodePtr = std::shared_ptr<Node>;
  class Edge;
  using EdgePtr = std::shared_ptr<Edge>;
  class InDataAnchor;
  using InDataAnchorPtr = std::shared_ptr<InDataAnchor>;
  class OutDataAnchor;
  using OutDataAnchorPtr = std::shared_ptr<OutDataAnchor>;
  class ControlAnchor;
  using ControlAnchorPtr = std::shared_ptr<ControlAnchor>;
  class InControlAnchor;
  using InControlAnchorPtr = std::shared_ptr<InControlAnchor>;
  class OutControlAnchor;
  using OutControlAnchorPtr = std::shared_ptr<OutControlAnchor>;
  class GeAttrValue;
  using AttrValuePtr = std::shared_ptr<GeAttrValue>;
  // Declare ComputeGraph explicitly so the alias below does not depend on one of the
  // included headers having declared it first (redeclaring a class is harmless).
  class ComputeGraph;
  using ConstComputeGraph = const ComputeGraph;
  class OperatorImpl;
  using OperatorImplPtr = std::shared_ptr<OperatorImpl>;
  49. class ComputeGraph : public std::enable_shared_from_this<ComputeGraph>, public AttrHolder {
  50. friend class GraphUtils;
  51. public:
  52. template <class T>
  53. using Vistor = RangeVistor<T, std::shared_ptr<ConstComputeGraph>>;
  54. explicit ComputeGraph(const std::string &name);
  55. ~ComputeGraph() override;
  56. std::string GetName() const;
  57. void SetName(const std::string &name);
  58. using AttrHolder::DelAttr;
  59. using AttrHolder::GetAttr;
  60. using AttrHolder::HasAttr;
  61. using AttrHolder::SetAttr;
  62. size_t GetAllNodesSize() const;
  63. Vistor<NodePtr> GetAllNodes() const;
  64. // is_unknown_shape: false, same with GetAllNodes func
  65. // is_unknown_shape: true, same with GetDirectNodes func
  66. Vistor<NodePtr> GetNodes(bool is_unknown_shape) const;
  67. size_t GetDirectNodesSize() const;
  68. Vistor<NodePtr> GetDirectNode() const;
  69. Vistor<NodePtr> GetInputNodes() const;
  70. Vistor<NodePtr> GetOutputNodes() const;
  71. NodePtr FindNode(const std::string &name) const;
  72. NodePtr FindFirstNodeMatchType(const std::string &name) const;
  73. // AddNode with NodePtr
  74. NodePtr AddNode(NodePtr node);
  75. NodePtr AddNode(OpDescPtr op);
  76. NodePtr AddNode(OpDescPtr op, int64_t id); // for unserialize
  77. NodePtr AddNodeFront(NodePtr node);
  78. NodePtr AddNodeFront(const OpDescPtr &op);
  79. NodePtr AddInputNode(NodePtr node);
  80. NodePtr AddOutputNode(NodePtr node);
  81. // insert node with specific pre_node
  82. NodePtr AddNodeAfter(OpDescPtr &op, const NodePtr &pre_node);
  83. NodePtr AddNodeAfter(NodePtr node, const NodePtr &pre_node);
  84. graphStatus RemoveNode(const NodePtr &node);
  85. graphStatus RemoveInputNode(const NodePtr &node);
  86. graphStatus RemoveOutputNode(const NodePtr &node);
  87. graphStatus RemoveConstInput(const NodePtr &node);
  88. /// Add a subgraph to this graph. The subgraph must has a parent graph and parent node,
  89. /// which means the member functions `SetParentGraph` and `SetParentNode` of the subgraph
  90. /// must be called before add it to the root graph. and subgraph->GetParentNode()->GetOwnerGraph()
  91. /// must equal to subgraph->GetOwnerGraph().
  92. /// The subgraphs can only be added to a *root graph*. A root graph is a graph without any parent graph.
  93. /// The subgraph's name SHOULD(not must) be the same as the parameter `name`
  94. graphStatus AddSubgraph(const std::string &name, const std::shared_ptr<ComputeGraph> &subgraph);
  95. graphStatus AddSubgraph(const std::shared_ptr<ComputeGraph> &subgraph);
  96. void RemoveSubgraph(const std::string &name);
  97. void RemoveSubgraph(const std::shared_ptr<ComputeGraph> &subgraph);
  98. std::shared_ptr<ComputeGraph> GetSubgraph(const std::string &name) const;
  99. std::vector<std::shared_ptr<ComputeGraph>> GetAllSubgraphs() const;
  100. // obsolete
  101. std::shared_ptr<ComputeGraph> AddSubGraph(std::shared_ptr<ComputeGraph> sub_graph);
  102. // obsolete
  103. graphStatus RemoveSubGraph(const std::shared_ptr<ComputeGraph> &sub_graph);
  104. ///
  105. /// @brief Update input-mapping
  106. /// @param [in] input_mapping : index_of_cur_graph_node_input -> index_of_new_graph_node_input
  107. /// @return graphStatus
  108. ///
  109. graphStatus UpdateInputMapping(const std::map<uint32_t, uint32_t> &input_mapping);
  110. ///
  111. /// @brief Update output-mapping
  112. /// @param [in] output_mapping : index_of_cur_graph_node_output -> index_of_new_graph_node_output
  113. /// @return graphStatus
  114. ///
  115. graphStatus UpdateOutputMapping(const std::map<uint32_t, uint32_t> &output_mapping);
  116. graphStatus TopologicalSorting();
  117. bool IsValid() const;
  118. void Dump() const;
  119. graphStatus IsolateNode(const NodePtr &node);
  120. graphStatus Verify();
  121. graphStatus InferShape();
  122. graphStatus InferOriginFormat();
  123. graphStatus InferShapeInNeed();
  124. graphStatus InsertEventNodes();
  125. bool operator==(const ComputeGraph &r_compute_graph) const;
  126. const std::map<std::vector<std::string>, std::vector<std::string>> &GetShareParamLayer() const {
  127. return params_share_map_;
  128. }
  129. void SetShareParamLayer(const std::map<std::vector<std::string>, std::vector<std::string>> params_share_map) {
  130. params_share_map_ = params_share_map;
  131. }
  132. void SetInputsOrder(const std::vector<std::string> &inputs_order) { inputs_order_ = inputs_order; }
  133. void SetGraphOutNodes(std::map<std::string, std::vector<int32_t>> out_nodes_map) { out_nodes_map_ = out_nodes_map; }
  134. void AppendGraphOutNodes(std::map<std::string, std::vector<int32_t>> out_nodes_map) {
  135. for (auto &item : out_nodes_map) {
  136. (void)out_nodes_map_.emplace(item.first, item.second);
  137. }
  138. }
  139. shared_ptr<ComputeGraph> GetParentGraph();
  140. void SetParentGraph(const shared_ptr<ComputeGraph> &parent);
  141. shared_ptr<Node> GetParentNode();
  142. void SetParentNode(const shared_ptr<Node> &parent);
  143. const std::map<std::string, std::vector<int32_t>> &GetGraphOutNodes() const { return out_nodes_map_; }
  144. void SetOrigGraph(ComputeGraphPtr orig_graph) { origGraph_ = orig_graph; }
  145. ComputeGraphPtr GetOrigGraph(void) { return origGraph_; }
  146. void SetOutputSize(uint32_t size) { output_size_ = size; }
  147. uint32_t GetOutputSize() const { return output_size_; }
  148. void SetInputSize(uint32_t size) { input_size_ = size; }
  149. uint32_t GetInputSize() const { return input_size_; }
  150. // false: known shape true: unknow shape
  151. bool GetGraphUnknownFlag() const { return is_unknown_shape_graph_; }
  152. void SetGraphUnknownFlag(bool flag) { is_unknown_shape_graph_ = flag; }
  153. ///
  154. /// Set is need train iteration.
  155. /// If set true, it means this graph need to be run iteration some
  156. /// times(according variant "npu_runconfig/iterations_per_loop").
  157. /// @param need_iteration is need iteration
  158. ///
  159. void SetNeedIteration(bool need_iteration) { need_iteration_ = need_iteration; }
  160. void SetUserDefOutput(const std::string &output_name);
  161. const std::string GetOutput();
  162. ///
  163. /// Get is need train iteration.
  164. /// @return is need iteration
  165. ///
  166. bool GetNeedIteration() const { return need_iteration_; }
  167. void SetGraphOpName(const std::map<uint32_t, std::string> &op_name_map) { op_name_map_ = op_name_map; }
  168. const std::map<uint32_t, std::string> &GetGraphOpName() const { return op_name_map_; }
  169. const std::map<OperatorImplPtr, NodePtr> &GetAllNodesInfo() const;
  170. void SetAllNodesInfo(const std::map<OperatorImplPtr, NodePtr> &nodes) { all_nodes_infos_ = nodes; }
  171. void SetGraphOutNodesInfo(std::vector<std::pair<NodePtr, int32_t>> &out_nodes_info) {
  172. output_nodes_info_ = out_nodes_info;
  173. }
  174. void AppendGraphOutNodesInfo(std::vector<std::pair<NodePtr, int32_t>> &out_nodes_info) {
  175. output_nodes_info_.insert(output_nodes_info_.end(), out_nodes_info.begin(), out_nodes_info.end());
  176. }
  177. const std::vector<std::pair<NodePtr, int32_t>> &GetGraphOutNodesInfo() const { return output_nodes_info_; }
  178. void SetGraphTargetNodesInfo(const std::vector<NodePtr> &target_nodes_info) {
  179. target_nodes_info_ = target_nodes_info;
  180. }
  181. const std::vector<NodePtr> &GetGraphTargetNodesInfo() const { return target_nodes_info_; }
  182. void SetSessionID(uint64_t session_id) { session_id_ = session_id; }
  183. uint64_t GetSessionID() const { return session_id_; }
  184. void SetGraphID(uint32_t graph_id) { graph_id_ = graph_id; }
  185. uint32_t GetGraphID() const { return graph_id_; }
  186. void SaveDataFormat(ge::Format data_format) { data_format_ = data_format; }
  187. ge::Format GetDataFormat() const { return data_format_; }
  188. bool IsSummaryGraph() const { return is_summary_graph_; }
  189. void SetSummaryFlag(bool is_summary_graph) { is_summary_graph_ = is_summary_graph; }
  190. // Graph Before BFE
  191. ComputeGraphPtr origGraph_;
  192. protected:
  193. ProtoAttrMapHelper MutableAttrMap() override;
  194. ConstProtoAttrMapHelper GetAttrMap() const override;
  195. private:
  196. graphStatus DFSTopologicalSorting(std::vector<NodePtr> &node_vec, std::map<NodePtr, uint32_t> &map_in_edge_num,
  197. std::vector<NodePtr> &stack);
  198. graphStatus BFSTopologicalSorting(std::vector<NodePtr> &node_vec, std::map<NodePtr, uint32_t> &map_in_edge_num,
  199. std::deque<NodePtr> &stack);
  200. graphStatus CollectBreadthOutNode(const NodePtr &node, std::map<NodePtr, uint32_t> &map_in_edge_num,
  201. std::map<string, NodePtr> &breadth_node_map);
  202. graphStatus TopologicalSortingGraph();
  203. graphStatus SortNodes(std::vector<NodePtr> &stack, std::map<NodePtr, uint32_t> &mapInEdgeNum);
  204. Vistor<NodePtr> AllGraphNodes(std::vector<std::shared_ptr<ComputeGraph>> &subgraphs) const;
  205. size_t GetInEdgeSize(const NodePtr &node);
  206. size_t GetOutEdgeSize(const NodePtr &node);
  207. graphStatus RemoveExtraOutEdge(const NodePtr &node);
  208. bool GraphMembersAreEqual(const ComputeGraph &r_graph) const;
  209. bool GraphAttrsAreEqual(const ComputeGraph &r_graph) const;
  210. bool VectorInputNodePtrIsEqual(const std::vector<NodePtr> &r_node_ptr_vector,
  211. const std::vector<NodePtr> &l_node_ptr_vector) const;
  212. friend class ModelSerializeImp;
  213. friend class GraphDebugImp;
  214. friend class OnnxUtils;
  215. std::string name_;
  216. uint32_t graph_id_ = 0;
  217. ProtoAttrMapHelper attrs_;
  218. std::vector<NodePtr> nodes_;
  219. std::map<OperatorImplPtr, NodePtr> all_nodes_infos_;
  220. std::vector<NodePtr> target_nodes_info_;
  221. std::vector<NodePtr> input_nodes_;
  222. std::vector<std::string> inputs_order_;
  223. uint32_t input_size_ = 1;
  224. std::map<std::string, std::vector<int32_t>> out_nodes_map_;
  225. uint32_t output_size_ = 1;
  226. std::vector<std::pair<NodePtr, int32_t>> output_nodes_info_;
  227. std::vector<std::shared_ptr<ComputeGraph>> sub_graph_;
  228. std::map<std::string, std::shared_ptr<ComputeGraph>> names_to_subgraph_;
  229. std::weak_ptr<ComputeGraph> parent_graph_;
  230. std::weak_ptr<Node> parent_node_;
  231. // the members followed should not in the ComputeGraph class
  232. bool is_valid_flag_;
  233. bool is_summary_graph_ = false;
  234. // Indicates whether it is need iteration
  235. bool need_iteration_ = false;
  236. std::map<std::vector<std::string>, std::vector<std::string>> params_share_map_;
  237. // TaskIdx -> op_name Map
  238. std::map<uint32_t, std::string> op_name_map_;
  239. uint64_t session_id_ = 0;
  240. ge::Format data_format_ = ge::FORMAT_ND;
  241. // unknown graph indicator, default is false, mean known shape
  242. bool is_unknown_shape_graph_ = false;
  243. };
  244. } // namespace ge
  245. #endif // INC_GRAPH_COMPUTE_GRAPH_H_

图引擎模块（GE）是MindSpore的一个子模块，其代码由C++实现，位于前端模块ME和底层硬件之间，起到承接作用。图引擎模块以ME下发的图作为输入，然后进行一系列的深度图优化操作，最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点，做了特定的优化工作，以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时，GE会被自动调用，用户对此并无感知。GE主要由GE API和GE Core两部分组成，详细的架构图如下所示。