You can not select more than 25 topics Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.

data_dumper.h 6.5 kB

5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
5 years ago
4 years ago
5 years ago
4 years ago
5 years ago
4 years ago
4 years ago
4 years ago
5 years ago
5 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180
  1. /**
  2. * Copyright 2020 Huawei Technologies Co., Ltd
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef GE_GRAPH_LOAD_NEW_MODEL_MANAGER_DATA_DUMPER_H_
  17. #define GE_GRAPH_LOAD_NEW_MODEL_MANAGER_DATA_DUMPER_H_
  18. #include <map>
  19. #include <memory>
  20. #include <string>
  21. #include <vector>
  22. #include "framework/common/ge_inner_error_codes.h"
  23. #include "common/properties_manager.h"
  24. #include "graph/node.h"
  25. #include "graph/compute_graph.h"
  26. #include "proto/ge_ir.pb.h"
  27. #include "proto/op_mapping_info.pb.h"
  28. #include "runtime/mem.h"
  29. #include "task_info/task_info.h"
  30. #include "framework/common/ge_types.h"
  31. #include "runtime/base.h"
  32. namespace ge {
  33. class DataDumper {
  34. public:
  35. explicit DataDumper(const RuntimeParam &rsh)
  36. : model_name_(),
  37. model_id_(0),
  38. runtime_param_(rsh),
  39. dev_mem_load_(nullptr),
  40. dev_mem_unload_(nullptr),
  41. op_list_(),
  42. input_map_(),
  43. load_flag_(false),
  44. device_id_(0),
  45. global_step_(0),
  46. loop_per_iter_(0),
  47. loop_cond_(0),
  48. compute_graph_(nullptr),
  49. ref_info_() {}
  50. ~DataDumper();
  51. void SetModelName(const std::string &model_name) { model_name_ = model_name; }
  52. void SetModelId(uint32_t model_id) { model_id_ = model_id; }
  53. void SetDeviceId(uint32_t device_id) { device_id_ = device_id; }
  54. void SetComputeGraph(const ComputeGraphPtr &compute_graph) { compute_graph_ = compute_graph; };
  55. void SetRefInfo(const std::map<OpDescPtr, void *> &ref_info) { ref_info_ = ref_info; };
  56. void SetL1FusionAddr(void *addr) { l1_fusion_addr_ = addr; };
  57. void SetLoopAddr(void *global_step, void *loop_per_iter, void *loop_cond);
  58. void SaveDumpInput(const std::shared_ptr<Node> &node);
  59. void SaveDumpOpInfo(const RuntimeParam &model_param, const OpDescPtr &op, uint32_t task_id, uint32_t stream_id);
  60. // args is device memory stored first output addr
  61. void SaveDumpTask(uint32_t task_id, uint32_t stream_id, const std::shared_ptr<OpDesc> &op_desc, uintptr_t args);
  62. void SaveEndGraphId(uint32_t task_id, uint32_t stream_id);
  63. void SetOmName(const std::string &om_name) { om_name_ = om_name; }
  64. void SaveOpDebugId(uint32_t task_id, uint32_t stream_id, void *op_debug_addr, bool is_op_debug);
  65. Status LoadDumpInfo();
  66. Status UnloadDumpInfo();
  67. void SetDumpProperties(const DumpProperties &dump_properties) { dump_properties_ = dump_properties; }
  68. const DumpProperties &GetDumpProperties() const { return dump_properties_; }
  69. bool GetOpDescInfo(uint32_t stream_id, uint32_t task_id, OpDescInfo &op_desc_info) const;
  70. const std::vector<OpDescInfo> &GetAllOpDescInfo() const { return op_desc_info_; }
  71. // Dump exception info
  72. Status DumpExceptionInput(const OpDescInfo &op_desc_info, const string &dump_file);
  73. Status DumpExceptionOutput(const OpDescInfo &op_desc_info, const string &dump_file);
  74. Status DumpExceptionInfo(const std::vector<rtExceptionInfo> exception_infos);
  75. private:
  76. void ReleaseDevMem(void **ptr) noexcept;
  77. void PrintCheckLog(string &dump_list_key);
  78. std::string model_name_;
  79. // for inference data dump
  80. std::string om_name_;
  81. uint32_t model_id_;
  82. const RuntimeParam &runtime_param_;
  83. void *dev_mem_load_;
  84. void *dev_mem_unload_;
  85. struct InnerDumpInfo;
  86. struct InnerInputMapping;
  87. std::vector<OpDescInfo> op_desc_info_;
  88. std::vector<InnerDumpInfo> op_list_;
  89. uint32_t end_graph_task_id_ = 0;
  90. uint32_t end_graph_stream_id_ = 0;
  91. bool is_end_graph_ = false;
  92. std::multimap<std::string, InnerInputMapping> input_map_;
  93. bool load_flag_;
  94. uint32_t device_id_;
  95. uintptr_t global_step_;
  96. uintptr_t loop_per_iter_;
  97. uintptr_t loop_cond_;
  98. ComputeGraphPtr compute_graph_;
  99. std::map<OpDescPtr, void *> ref_info_;
  100. void *l1_fusion_addr_ = nullptr;
  101. uint32_t op_debug_task_id_ = 0;
  102. uint32_t op_debug_stream_id_ = 0;
  103. void *op_debug_addr_ = nullptr;
  104. bool is_op_debug_ = false;
  105. DumpProperties dump_properties_;
  106. // Build task info of op mapping info
  107. Status BuildTaskInfo(aicpu::dump::OpMappingInfo &op_mapping_info);
  108. Status DumpOutput(const InnerDumpInfo &inner_dump_info, aicpu::dump::Task &task);
  109. Status DumpRefOutput(const DataDumper::InnerDumpInfo &inner_dump_info, aicpu::dump::Output &output, size_t i,
  110. const std::string &node_name_index);
  111. Status DumpOutputWithTask(const InnerDumpInfo &inner_dump_info, aicpu::dump::Task &task);
  112. Status DumpInput(const InnerDumpInfo &inner_dump_info, aicpu::dump::Task &task);
  113. Status DumpRefInput(const DataDumper::InnerDumpInfo &inner_dump_info, aicpu::dump::Input &input, size_t i,
  114. const std::string &node_name_index);
  115. Status ExecuteLoadDumpInfo(aicpu::dump::OpMappingInfo &op_mapping_info);
  116. void SetEndGraphIdToAicpu(uint32_t task_id, uint32_t stream_id, aicpu::dump::OpMappingInfo &op_mapping_info);
  117. void SetOpDebugIdToAicpu(uint32_t task_id, uint32_t stream_id, void *op_debug_addr,
  118. aicpu::dump::OpMappingInfo &op_mapping_info);
  119. Status ExecuteUnLoadDumpInfo(aicpu::dump::OpMappingInfo &op_mapping_info);
  120. Status GenerateInput(aicpu::dump::Input &input,
  121. const OpDesc::Vistor<GeTensorDesc> &tensor_descs,
  122. const uintptr_t &addr,
  123. size_t index);
  124. Status GenerateOutput(aicpu::dump::Output &output,
  125. const OpDesc::Vistor<GeTensorDesc> &tensor_descs,
  126. const uintptr_t &addr,
  127. size_t index);
  128. void GenerateOpBuffer(const int64_t &size, aicpu::dump::Task &task);
  129. };
  130. struct DataDumper::InnerDumpInfo {
  131. uint32_t task_id;
  132. uint32_t stream_id;
  133. std::shared_ptr<OpDesc> op;
  134. uintptr_t args;
  135. bool is_task;
  136. int input_anchor_index;
  137. int output_anchor_index;
  138. std::vector<int64_t> dims;
  139. int64_t data_size;
  140. };
  141. struct DataDumper::InnerInputMapping {
  142. std::shared_ptr<OpDesc> data_op;
  143. int input_anchor_index;
  144. int output_anchor_index;
  145. };
  146. } // namespace ge
  147. #endif // GE_GRAPH_LOAD_NEW_MODEL_MANAGER_DATA_DUMPER_H_

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示