You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

compute_graph.h 11 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287
  1. /**
  2. * Copyright 2019-2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef INC_GRAPH_COMPUTE_GRAPH_H_
  17. #define INC_GRAPH_COMPUTE_GRAPH_H_
  18. #include <map>
  19. #include <memory>
  20. #include <string>
  21. #include <utility>
  22. #include <vector>
  23. #include <deque>
  24. #include "detail/attributes_holder.h"
  25. #include "graph/anchor.h"
  26. #include "graph/node.h"
  27. #include "graph/op_desc.h"
  28. #include "graph/range_vistor.h"
  29. namespace ge {
  // Forward declarations of the graph types referenced by this header, each
  // paired with the shared-pointer alias used in the declarations below.
  class Node;
  using NodePtr = std::shared_ptr<Node>;

  class Edge;
  using EdgePtr = std::shared_ptr<Edge>;

  class InDataAnchor;
  using InDataAnchorPtr = std::shared_ptr<InDataAnchor>;

  class OutDataAnchor;
  using OutDataAnchorPtr = std::shared_ptr<OutDataAnchor>;

  class ControlAnchor;
  using ControlAnchorPtr = std::shared_ptr<ControlAnchor>;

  class InControlAnchor;
  using InControlAnchorPtr = std::shared_ptr<InControlAnchor>;

  class OutControlAnchor;
  using OutControlAnchorPtr = std::shared_ptr<OutControlAnchor>;

  class GeAttrValue;
  using AttrValuePtr = std::shared_ptr<GeAttrValue>;

  // ComputeGraph is forward-declared here so that the alias below does not
  // depend on an earlier include having already declared the class.
  class ComputeGraph;
  using ConstComputeGraph = const ComputeGraph;

  class OperatorImpl;
  using OperatorImplPtr = std::shared_ptr<OperatorImpl>;
  49. class ComputeGraph : public std::enable_shared_from_this<ComputeGraph>, public AttrHolder {
  50. friend class GraphUtils;
  51. public:
  52. template <class T>
  53. using Vistor = RangeVistor<T, std::shared_ptr<ConstComputeGraph>>;
  54. explicit ComputeGraph(const std::string &name);
  55. ~ComputeGraph() override;
  56. std::string GetName() const;
  57. void SetName(const std::string &name);
  58. using AttrHolder::DelAttr;
  59. using AttrHolder::GetAttr;
  60. using AttrHolder::HasAttr;
  61. using AttrHolder::SetAttr;
  62. size_t GetAllNodesSize() const;
  63. Vistor<NodePtr> GetAllNodes() const;
  64. size_t GetDirectNodesSize() const;
  65. Vistor<NodePtr> GetDirectNode() const;
  66. Vistor<NodePtr> GetInputNodes() const;
  67. Vistor<NodePtr> GetOutputNodes() const;
  68. NodePtr FindNode(const std::string &name) const;
  69. // AddNode with NodePtr
  70. NodePtr AddNode(NodePtr node);
  71. NodePtr AddNode(OpDescPtr op);
  72. NodePtr AddNode(OpDescPtr op, int64_t id); // for unserialize.
  73. NodePtr AddNodeFront(NodePtr node);
  74. NodePtr AddNodeFront(const OpDescPtr &op);
  75. NodePtr AddInputNode(NodePtr node);
  76. NodePtr AddOutputNode(NodePtr node);
  77. graphStatus RemoveNode(const NodePtr &node);
  78. graphStatus RemoveInputNode(const NodePtr &node);
  79. graphStatus RemoveOutputNode(const NodePtr &node);
  80. graphStatus RemoveConstInput(const NodePtr &node);
  81. /// Add a subgraph to this graph. The subgraph must has a parent graph and parent node,
  82. /// which means the member functions `SetParentGraph` and `SetParentNode` of the subgraph
  83. /// must be called before add it to the root graph. and subgraph->GetParentNode()->GetOwnerGraph()
  84. /// must equal to subgraph->GetOwnerGraph().
  85. /// The subgraphs can only be added to a *root graph*. A root graph is a graph without any parent graph.
  86. /// The subgraph's name SHOULD(not must) be the same as the parameter `name`
  87. graphStatus AddSubgraph(const std::string &name, const std::shared_ptr<ComputeGraph> &subgraph);
  88. graphStatus AddSubgraph(const std::shared_ptr<ComputeGraph> &subgraph);
  89. void RemoveSubgraph(const std::string &name);
  90. void RemoveSubgraph(const std::shared_ptr<ComputeGraph> &subgraph);
  91. std::shared_ptr<ComputeGraph> GetSubgraph(const std::string &name) const;
  92. std::vector<std::shared_ptr<ComputeGraph>> GetAllSubgraphs() const;
  93. // obsolete
  94. std::shared_ptr<ComputeGraph> AddSubGraph(std::shared_ptr<ComputeGraph> sub_graph);
  95. // obsolete
  96. graphStatus RemoveSubGraph(const std::shared_ptr<ComputeGraph> &sub_graph);
  97. ///
  98. /// @brief Update input-mapping
  99. /// @param [in] input_mapping : index_of_cur_graph_node_input -> index_of_new_graph_node_input
  100. /// @return graphStatus
  101. ///
  102. graphStatus UpdateInputMapping(const std::map<uint32_t, uint32_t> &input_mapping);
  103. ///
  104. /// @brief Update output-mapping
  105. /// @param [in] output_mapping : index_of_cur_graph_node_output -> index_of_new_graph_node_output
  106. /// @return graphStatus
  107. ///
  108. graphStatus UpdateOutputMapping(const std::map<uint32_t, uint32_t> &output_mapping);
  109. graphStatus TopologicalSorting();
  110. bool IsValid() const;
  111. void Dump() const;
  112. graphStatus IsolateNode(const NodePtr &node);
  113. graphStatus Verify();
  114. graphStatus InferShape();
  115. graphStatus InferOriginFormat();
  116. graphStatus InferShapeInNeed();
  117. graphStatus InsertEventNodes();
  118. bool operator==(const ComputeGraph &r_compute_graph) const;
  119. const std::map<std::vector<std::string>, std::vector<std::string>> &GetShareParamLayer() const {
  120. return params_share_map_;
  121. }
  122. void SetShareParamLayer(const std::map<std::vector<std::string>, std::vector<std::string>> params_share_map) {
  123. params_share_map_ = params_share_map;
  124. }
  125. void SetInputsOrder(const std::vector<std::string> &inputs_order) { inputs_order_ = inputs_order; }
  126. void SetGraphOutNodes(std::map<std::string, std::vector<int32_t>> out_nodes_map) { out_nodes_map_ = out_nodes_map; }
  127. void AppendGraphOutNodes(std::map<std::string, std::vector<int32_t>> out_nodes_map) {
  128. for (auto &item : out_nodes_map) {
  129. (void)out_nodes_map_.emplace(item.first, item.second);
  130. }
  131. }
  132. shared_ptr<ComputeGraph> GetParentGraph();
  133. void SetParentGraph(const shared_ptr<ComputeGraph> &parent);
  134. shared_ptr<Node> GetParentNode();
  135. void SetParentNode(const shared_ptr<Node> &parent);
  136. const std::map<std::string, std::vector<int32_t>> &GetGraphOutNodes() const { return out_nodes_map_; }
  137. void SetOrigGraph(ComputeGraphPtr orig_graph) { origGraph_ = orig_graph; }
  138. ComputeGraphPtr GetOrigGraph(void) { return origGraph_; }
  139. void SetOutputSize(uint32_t size) { output_size_ = size; }
  140. uint32_t GetOutputSize() const { return output_size_; }
  141. void SetInputSize(uint32_t size) { input_size_ = size; }
  142. uint32_t GetInputSize() const { return input_size_; }
  143. ///
  144. /// Set is need train iteration.
  145. /// If set true, it means this graph need to be run iteration some
  146. /// times(according variant "npu_runconfig/iterations_per_loop").
  147. /// @param need_iteration is need iteration
  148. ///
  149. void SetNeedIteration(bool need_iteration) { need_iteration_ = need_iteration; }
  150. void SetUserDefOutput(const std::string &output_name);
  151. const std::string GetOutput();
  152. ///
  153. /// Get is need train iteration.
  154. /// @return is need iteration
  155. ///
  156. bool GetNeedIteration() const { return need_iteration_; }
  157. void SetGraphOpName(const std::map<uint32_t, std::string> &op_name_map) { op_name_map_ = op_name_map; }
  158. const std::map<uint32_t, std::string> &GetGraphOpName() const { return op_name_map_; }
  159. const std::map<OperatorImplPtr, NodePtr> &GetAllNodesInfo() const;
  160. void SetAllNodesInfo(const std::map<OperatorImplPtr, NodePtr> &nodes) { all_nodes_infos_ = nodes; }
  161. void SetGraphOutNodesInfo(std::vector<std::pair<NodePtr, int32_t>> &out_nodes_info) {
  162. output_nodes_info_ = out_nodes_info;
  163. }
  164. void AppendGraphOutNodesInfo(std::vector<std::pair<NodePtr, int32_t>> &out_nodes_info) {
  165. output_nodes_info_.insert(output_nodes_info_.end(), out_nodes_info.begin(), out_nodes_info.end());
  166. }
  167. const std::vector<std::pair<NodePtr, int32_t>> &GetGraphOutNodesInfo() const { return output_nodes_info_; }
  168. void SetGraphTargetNodesInfo(const std::vector<NodePtr> &target_nodes_info) {
  169. target_nodes_info_ = target_nodes_info;
  170. }
  171. const std::vector<NodePtr> &GetGraphTargetNodesInfo() const { return target_nodes_info_; }
  172. void SetSessionID(uint64_t session_id) { session_id_ = session_id; }
  173. uint64_t GetSessionID() const { return session_id_; }
  174. void SetGraphID(uint32_t graph_id) { graph_id_ = graph_id; }
  175. uint32_t GetGraphID() const { return graph_id_; }
  176. void SaveDataFormat(ge::Format data_format) { data_format_ = data_format; }
  177. ge::Format GetDataFormat() const { return data_format_; }
  178. bool IsSummaryGraph() const { return is_summary_graph_; }
  179. void SetSummaryFlag(bool is_summary_graph) { is_summary_graph_ = is_summary_graph; }
  180. // Graph Before BFE
  181. ComputeGraphPtr origGraph_;
  182. protected:
  183. ProtoAttrMapHelper MutableAttrMap() override;
  184. ConstProtoAttrMapHelper GetAttrMap() const override;
  185. private:
  186. graphStatus DFSTopologicalSorting(std::vector<NodePtr> &node_vec, std::map<NodePtr, uint32_t> &map_in_edge_num,
  187. std::vector<NodePtr> &stack);
  188. graphStatus BFSTopologicalSorting(std::vector<NodePtr> &node_vec, std::map<NodePtr, uint32_t> &map_in_edge_num,
  189. std::deque<NodePtr> &stack);
  190. graphStatus CollectBreadthOutNode(const NodePtr &node, std::map<NodePtr, uint32_t> &map_in_edge_num,
  191. std::map<string, NodePtr> &breadth_node_map);
  192. graphStatus TopologicalSortingGraph();
  193. graphStatus SortNodes(std::vector<NodePtr> &stack, std::map<NodePtr, uint32_t> &mapInEdgeNum);
  194. Vistor<NodePtr> AllGraphNodes(std::vector<std::shared_ptr<ComputeGraph>> &subgraphs) const;
  195. size_t GetInEdgeSize(const NodePtr &node);
  196. size_t GetOutEdgeSize(const NodePtr &node);
  197. graphStatus RemoveExtraOutEdge(const NodePtr &node);
  198. bool GraphMembersAreEqual(const ComputeGraph &r_graph) const;
  199. bool GraphAttrsAreEqual(const ComputeGraph &r_graph) const;
  200. bool VectorInputNodePtrIsEqual(const std::vector<NodePtr> &r_node_ptr_vector,
  201. const std::vector<NodePtr> &l_node_ptr_vector) const;
  202. friend class ModelSerializeImp;
  203. friend class GraphDebugImp;
  204. friend class OnnxUtils;
  205. std::string name_;
  206. uint32_t graph_id_ = 0;
  207. ProtoAttrMapHelper attrs_;
  208. std::vector<NodePtr> nodes_;
  209. std::map<OperatorImplPtr, NodePtr> all_nodes_infos_;
  210. std::vector<NodePtr> target_nodes_info_;
  211. std::vector<NodePtr> input_nodes_;
  212. std::vector<std::string> inputs_order_;
  213. uint32_t input_size_ = 1;
  214. std::map<std::string, std::vector<int32_t>> out_nodes_map_;
  215. uint32_t output_size_ = 1;
  216. std::vector<std::pair<NodePtr, int32_t>> output_nodes_info_;
  217. std::vector<std::shared_ptr<ComputeGraph>> sub_graph_;
  218. std::map<std::string, std::shared_ptr<ComputeGraph>> names_to_subgraph_;
  219. std::weak_ptr<ComputeGraph> parent_graph_;
  220. std::weak_ptr<Node> parent_node_;
  221. // the members followed should not in the ComputeGraph class
  222. bool is_valid_flag_;
  223. bool is_summary_graph_ = false;
  224. // Indicates whether it is need iteration
  225. bool need_iteration_ = false;
  226. std::map<std::vector<std::string>, std::vector<std::string>> params_share_map_;
  227. // TaskIdx -> op_name Map
  228. std::map<uint32_t, std::string> op_name_map_;
  229. uint64_t session_id_ = 0;
  230. ge::Format data_format_ = ge::FORMAT_ND;
  231. };
  232. } // namespace ge
  233. #endif // INC_GRAPH_COMPUTE_GRAPH_H_

图引擎模块(GE)是 MindSpore 的一个子模块,其代码由 C++ 实现,位于前端模块 ME 和底层硬件之间,起到承接作用。图引擎模块以 ME 下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE 针对昇腾 AI 处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾 AI 处理器的强大算力。在进行模型训练/推理时,GE 会被自动调用,用户对此并无感知。GE 主要由 GE API 和 GE Core 两部分组成,详细的架构图如下所示。