You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number; can include dashes ('-'); and can be up to 35 characters long.

memory_api.h 2.4 kB

4 years ago
4 years ago
4 years ago
123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172
  1. /**
  2. * Copyright (c) Huawei Technologies Co., Ltd. 2021. All rights reserved.
  3. *
  4. * Licensed under the Apache License, Version 2.0 (the "License");
  5. * you may not use this file except in compliance with the License.
  6. * You may obtain a copy of the License at
  7. *
  8. * http://www.apache.org/licenses/LICENSE-2.0
  9. *
  10. * Unless required by applicable law or agreed to in writing, software
  11. * distributed under the License is distributed on an "AS IS" BASIS,
  12. * WITHOUT WARRANTIES OR CONDITIONS OF ANY KIND, either express or implied.
  13. * See the License for the specific language governing permissions and
  14. * limitations under the License.
  15. */
  16. #ifndef INC_FRAMEWORK_MEMORY_MEMORY_API_H_
  17. #define INC_FRAMEWORK_MEMORY_MEMORY_API_H_
  18. #include <string>
  19. #include <vector>
  20. #include "external/ge/ge_api_error_codes.h"
  21. #include "graph/types.h"
  22. #include "runtime/mem.h"
  23. namespace ge {
  24. enum MemStorageType {  // Memory storage types; enumerators are numbered consecutively starting at 0.
  25. HBM = 0,  // explicit value 0 (presumably device high-bandwidth memory -- TODO confirm)
  26. RDMA_HBM,  // implicit value 1 (presumably HBM accessed through RDMA -- TODO confirm)
  27. HOST_DDR,  // implicit value 2 (presumably host-side DDR memory -- TODO confirm)
  28. };
  29. struct HostVarInfo {  // Address information of one host variable; RdmaRemoteRegister takes a vector of these.
  30. uint64_t base_addr;  // base address of the variable; has no default member initializer
  31. uint64_t var_size;  // size of the variable (presumably in bytes -- TODO confirm); has no default member initializer
  32. };
  33. struct TensorInfo {  // Describes a tensor; passed as input to MallocSharedMemory.
  34. std::string var_name;  // variable name associated with the tensor
  35. std::vector<int64_t> dims;  // dimension sizes (presumably the tensor shape -- TODO confirm)
  36. DataType data_type;  // element data type; DataType is not declared in this file (presumably from graph/types.h)
  37. };
  38. /// Initializes the RDMA memory pool.
  39. /// \param size [in] RDMA pool memory size to be allocated (unit not stated here; presumably bytes).
  40. /// \param mem_type [in] memory type for the RDMA pool; defaults to RT_MEMORY_HBM.
  41. /// \return Status result of the function.
  42. GE_FUNC_VISIBILITY Status InitRdmaPool(size_t size, rtMemType_t mem_type = RT_MEMORY_HBM);
  43. /// Registers host variable address ranges for RDMA (behavior inferred from the name -- confirm in the implementation).
  44. /// \param var_info [in] host variable address infos (base address and size of each variable).
  45. /// \param mem_type [in] memory type for the RDMA pool; defaults to RT_MEMORY_HBM.
  46. /// \return Status result of the function.
  47. GE_FUNC_VISIBILITY Status RdmaRemoteRegister(const std::vector<HostVarInfo> &var_info,
  48. rtMemType_t mem_type = RT_MEMORY_HBM);
  49. /// Allocates shared memory for a tensor.
  50. /// \param tensor_info [in] description of the tensor to be stored in shared memory.
  51. /// \param dev_addr [out] address of the allocated shared memory.
  52. /// \param memory_size [out] size of the allocated shared memory.
  53. /// \return Status result of the function.
  54. GE_FUNC_VISIBILITY Status MallocSharedMemory(const TensorInfo &tensor_info, uint64_t &dev_addr, uint64_t &memory_size);
  55. /// Retrieves the base address and size of a host variable identified by name.
  56. /// \param var_name [in] name of the host variable.
  57. /// \param base_addr [out] base address of the host variable.
  58. /// \param var_size [out] memory size of the host variable.
  59. /// \return Status result of the function.
  60. GE_FUNC_VISIBILITY Status GetVarBaseAddrAndSize(const std::string &var_name, uint64_t &base_addr, uint64_t &var_size);
  61. } // namespace ge
  62. #endif // INC_FRAMEWORK_MEMORY_MEMORY_API_H_

图引擎模块(GE)是MindSpore的一个子模块,其代码由C++实现,位于前端模块ME和底层硬件之间,起到承接作用。图引擎模块以ME下发的图作为输入,然后进行一系列的深度图优化操作,最后输出一张可以在底层硬件上高效运行的图。GE针对昇腾AI处理器的硬件结构特点,做了特定的优化工作,以此来充分发挥出昇腾AI处理器的强大算力。在进行模型训练/推理时,GE会被自动调用而用户并不感知。GE主要由GE API和GE Core两部分组成,详细的架构图如下所示。