You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

tune_api.h 4.1 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157
  1. /**
  2. * @file tune_api.h
  3. *
  4. * Copyright (c) Huawei Technologies Co., Ltd. 2020-2021. All rights reserved.\n
  5. *
  6. * This program is distributed in the hope that it will be useful,
  7. * but WITHOUT ANY WARRANTY; without even the implied warranty of
  8. * MERCHANTABILITY or FITNESS FOR A PARTICULAR PURPOSE.\n
  9. * 描述:aoe调优接口头文件
  10. */
  11. /** @defgroup aoe aoe调优接口 */
  12. #ifndef TUNE_API_H
  13. #define TUNE_API_H
  14. #include <vector>
  15. #include <map>
  16. #include <string>
  17. #include "graph/graph.h"
  18. #include "ge/ge_api.h"
  19. #include "aoe_types.h"
  20. /**
  21. * @ingroup aoe
  22. *
  23. * aoe status
  24. */
  25. enum MsTuneStatus {
  26. MSTUNE_SUCCESS, /** tune success */
  27. MSTUNE_FAILED, /** tune failed */
  28. };
  29. // Option key: for train options sets
  30. const std::string MSTUNE_SELF_KEY = "mstune";
  31. const std::string MSTUNE_GEINIT_KEY = "initialize";
  32. const std::string MSTUNE_GESESS_KEY = "session";
  33. #ifdef __cplusplus
  34. extern "C" {
  35. #endif
  36. struct RunnerInitConfig {
  37. // onilne online
  38. std::string profPath;
  39. std::string parserPath;
  40. // ncs only
  41. std::vector<uint32_t> devList;
  42. };
  43. struct RunnerOpInfo {
  44. std::string opName;
  45. uint64_t opCostTime;
  46. uint64_t aicoreCostTime;
  47. // gradient_split only
  48. std::string modelName;
  49. std::string opType;
  50. std::vector<uint64_t> start;
  51. std::vector<uint64_t> end;
  52. };
  53. struct RunnerModelInfo {
  54. uint64_t totalCostTime;
  55. };
  56. struct RunnerRunResult {
  57. std::vector<RunnerModelInfo> modelInfo;
  58. std::vector<RunnerOpInfo> opInfo;
  59. };
  60. struct RunnerResult {
  61. uint64_t totalCostTime;
  62. std::map<std::string, uint64_t> opCostTime;
  63. std::map<std::string, uint64_t> aicoreCostTime;
  64. };
  65. struct RunnerDataBuf {
  66. void *ptr = nullptr;
  67. size_t size = 0;
  68. };
  69. struct AOEBufferData {
  70. std::shared_ptr<uint8_t> data = nullptr;
  71. uint64_t length;
  72. };
  73. struct RunnerConfig {
  74. bool isProf;
  75. uint32_t loop;
  76. // offline only
  77. std::vector<RunnerDataBuf> input;
  78. std::vector<RunnerDataBuf> output;
  79. std::string modelPath;
  80. RunnerDataBuf modelData;
  81. // online only
  82. uint32_t devId;
  83. std::vector<std::vector<ge::Tensor>> inputs;
  84. std::vector<ge::Graph> dependGraph; // run graph (for training)
  85. };
  86. #ifdef __cplusplus
  87. }
  88. #endif
  89. /**
  90. * @ingroup aoe
  91. * @par 描述: 命令行调优
  92. *
  93. * @attention 无
  94. * @param option [IN] 调优参数
  95. * @param msg [OUT] 调优异常下返回信息
  96. * @retval #MSTUNE_SUCCESS 执行成功
  97. * @retval #MSTUNE_FAILED 执行失败
  98. * @par 依赖:
  99. * @li tune_api.cpp:该接口所属的开发包。
  100. * @li tune_api.h:该接口声明所在的头文件。
  101. * @see 无
  102. * @since
  103. */
  104. AoeStatus AoeOfflineTuning(const std::map<std::string, std::string> &option, std::string &msg);
  105. /**
  106. * @ingroup aoe
  107. * @par 描述: 梯度调优
  108. *
  109. * @attention 无
  110. * @param tuningGraph [IN] 调优图
  111. * @param dependGraph [IN] 调优依赖图
  112. * @param session [IN] ge连接会话
  113. * @param option [IN] 参数集. 包含调优参数及ge参数
  114. * @retval #MSTUNE_SUCCESS 执行成功
  115. * @retval #MSTUNE_FAILED 执行失败
  116. * @par 依赖:
  117. * @li tune_api.cpp:该接口所属的开发包。
  118. * @li tune_api.h:该接口声明所在的头文件。
  119. * @see 无
  120. * @since
  121. */
  122. extern "C" MsTuneStatus MsTrainTuning(ge::Graph &tuningGraph, std::vector<ge::Graph> &dependGraph,
  123. ge::Session *session, const std::map<std::string, std::map<std::string, std::string>> &option);
  124. /**
  125. * @ingroup aoe
  126. * @par 描述: 梯度调优
  127. *
  128. * @attention 无
  129. * @param tuningGraph [IN] 调优图
  130. * @param dependGraph [IN] 调优依赖图
  131. * @param session [IN] ge连接会话
  132. * @param option [IN] 参数集. 包含调优参数及ge参数
  133. * @retval #AOE_SUCCESS 执行成功
  134. * @retval #AOE_FAILED 执行失败
  135. * @par 依赖:
  136. * @li tune_api.cpp:该接口所属的开发包。
  137. * @li tune_api.h:该接口声明所在的头文件。
  138. * @see 无
  139. * @since
  140. */
  141. extern "C" AoeStatus AoeOnlineTuning(ge::Graph &tuningGraph, std::vector<ge::Graph> &dependGraph,
  142. ge::Session *session, const std::map<std::string, std::map<std::string, std::string>> &option);
  143. #endif

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。