You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

CMakeLists.txt 18 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312313314315316317318319320321322323324325326327328329330331332333334335336337338339340341342343344345346347348349350351352353354355356357358359360361362363364365366367368369370371372373374375376377378379380381382383384385386387388389390391392393394395396397398399400401402403404405406407408409410411412413414415416417418419420421422423424425426427428429430431432433434435436437438439440441442443444445446447448449450451452453454455456457458459460461462463464465466467468469470471472473474475476477478479480481482483
  # Minimum supported CMake release and the project declaration.
  cmake_minimum_required(VERSION 3.9.0)
  project(MegEngine)

  # Project-wide C++ defaults: C++14 is mandatory, compiler-specific language
  # extensions are disabled, and position-independent code is generated.
  set(CMAKE_CXX_STANDARD 14)
  set(CMAKE_CXX_STANDARD_REQUIRED ON)
  set(CMAKE_CXX_EXTENSIONS OFF)
  set(CMAKE_POSITION_INDEPENDENT_CODE ON)

  # Additional CMake modules shipped inside the source tree.
  set(CMAKE_MODULE_PATH ${PROJECT_SOURCE_DIR}/cmake/Modules)

  # Everywhere except MSVC and Apple toolchains, override the static-archive
  # rules so that ar receives the "D" modifier and ranlib receives "-D".
  # NOTE(review): "D" is the deterministic mode of GNU ar/ranlib -- confirm the
  # toolchains in use accept it.
  if(NOT (MSVC OR APPLE))
    set(CMAKE_CXX_ARCHIVE_CREATE "<CMAKE_AR> Dqc <TARGET> <LINK_FLAGS> <OBJECTS>")
    set(CMAKE_CXX_ARCHIVE_APPEND "<CMAKE_AR> Dq <TARGET> <LINK_FLAGS> <OBJECTS>")
    set(CMAKE_CXX_ARCHIVE_FINISH "<CMAKE_RANLIB> -D <TARGET>")
  endif()
  # Compiler capability probe: CXX_SUPPORT_WCLASS_MEMACCESS records whether the
  # C++ compiler accepts -Wclass-memaccess.
  include(CheckCXXCompilerFlag)
  check_cxx_compiler_flag(-Wclass-memaccess CXX_SUPPORT_WCLASS_MEMACCESS)

  # Target architecture selector, exposed as a drop-down in CMake GUIs.
  set(MGE_ARCH AUTO CACHE STRING "Architecture on which MegEngine to be built.")
  set_property(
    CACHE MGE_ARCH
    PROPERTY STRINGS
      AUTO
      x86_64
      i386
      naive
      fallback
  )

  # User-facing feature switches (cached booleans).
  option(MGE_WITH_JIT         "Build MegEngine with JIT." ON)
  option(MGE_WITH_HALIDE      "Build MegEngine with Halide JIT" ON)
  option(MGE_DISABLE_FLOAT16  "Disable MegEngine float16 support." OFF)
  option(MGE_WITH_CUDA        "Enable MegEngine CUDA support." ON)
  option(MGE_CUDA_USE_STATIC  "Enable MegEngine CUDA static linking." ON)
  option(MGE_WITH_TRT         "Build MegEngine with TensorRT." ON)
  option(MGE_USE_SYSTEM_LIB   "Build MegEngine with system libraries." OFF)
  option(MGB_WITH_FLATBUFFERS "Build MegBrain with FlatBuffers serialization support." ON)
  # Resolve MGE_ARCH=AUTO from the processor name CMake reports for the target
  # system. The operands are quoted so that an empty CMAKE_SYSTEM_PROCESSOR
  # yields a clean "unknown architecture" error instead of an if() syntax error.
  if("${MGE_ARCH}" STREQUAL "AUTO")
    if("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "x86_64"
       OR "${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "AMD64")
      # "AMD64" is the name Windows hosts report for the same 64-bit x86 ISA.
      set(MGE_ARCH "x86_64")
    elseif("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "i386"
           OR "${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "i686")
      set(MGE_ARCH "i386")
    else()
      # FATAL_ERROR (not "FATAL") is the message mode that aborts configuration;
      # an unrecognized mode word is merely printed as part of the text.
      message(FATAL_ERROR "Unknown machine architecture for MegEngine.")
    endif()
  endif()
  # Prefer the GNU gold linker when the compiler accepts -fuse-ld=gold, except
  # on Android and Apple platforms.
  check_cxx_compiler_flag(-fuse-ld=gold CXX_SUPPORT_GOLD)
  if(CXX_SUPPORT_GOLD AND NOT (ANDROID OR APPLE))
    message("-- Using GNU gold linker.")
    string(APPEND CMAKE_C_FLAGS " -fuse-ld=gold")
    string(APPEND CMAKE_CXX_FLAGS " -fuse-ld=gold")
  endif()
  # Halide is a JIT backend: when JIT is disabled, Halide is switched off too
  # and the user is warned about the override.
  if(MGE_WITH_HALIDE AND NOT MGE_WITH_JIT)
    message(WARNING "MGE_WITH_HALIDE is set to OFF with MGE_WITH_JIT disabled")
    set(MGE_WITH_HALIDE OFF)
  endif()
  # Enable the CUDA language when CUDA support is requested. Configuration is
  # aborted if no CUDA compiler can be located; CUDA sources are then built as
  # C++14 with the standard being mandatory.
  if(MGE_WITH_CUDA)
    include(CheckLanguage)
    check_language(CUDA)
    if(NOT CMAKE_CUDA_COMPILER)
      message(FATAL_ERROR "CUDA compiler not found in PATH")
    endif()

    enable_language(CUDA)

    set(CMAKE_CUDA_STANDARD 14)
    set(CMAKE_CUDA_STANDARD_REQUIRED ON)
  endif()
  # Without CUDA, the JIT (including Halide) and TensorRT features are forced
  # off for the rest of the configuration.
  if(NOT MGE_WITH_CUDA)
    message("-- Disable JIT support, as CUDA is not enabled.")
    set(MGE_WITH_JIT OFF)
    set(MGE_WITH_HALIDE OFF)

    message("-- Disable TensorRT support, as CUDA is not enabled.")
    set(MGE_WITH_TRT OFF)
  endif()
  # A Python 3 interpreter is mandatory.
  find_package(PythonInterp 3 REQUIRED)

  # Locate the threading library, preferring the -pthread flag form.
  set(THREADS_PREFER_PTHREAD_FLAG ON)
  find_package(Threads)

  # When threading is provided through "-pthread" and CUDA is enabled, replace
  # the compile options of Threads::Threads: CUDA sources get the flag
  # forwarded to the host compiler via -Xcompiler, all other languages get
  # -pthread directly.
  if(NOT "${CMAKE_THREAD_LIBS_INIT}" STREQUAL "")
    if(MGE_WITH_CUDA AND ${CMAKE_THREAD_LIBS_INIT} STREQUAL "-pthread")
      set_property(
        TARGET Threads::Threads
        PROPERTY INTERFACE_COMPILE_OPTIONS
          "$<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-pthread>"
          "$<$<NOT:$<COMPILE_LANGUAGE:CUDA>>:-pthread>"
      )
    endif()
  endif()
  # BLAS backend selector (MKL or OpenBLAS), exposed as a drop-down in GUIs.
  set(MGE_BLAS MKL CACHE STRING "BLAS implementaion used by MegEngine.")
  set_property(CACHE MGE_BLAS PROPERTY STRINGS MKL OpenBLAS)

  # Optional user override for the nvcc -gencode options; empty means
  # "use the defaults chosen by this file".
  set(MGE_CUDA_GENCODE "" CACHE STRING "Overwrite -gencode specifications for CUDA")

  # Default the CUDA host compiler to the C++ compiler when none was given.
  # CMake variable expansion is ${...}; the Make-style $(...) form would be
  # stored literally as the string "$(CMAKE_CXX_COMPILER)".
  if(NOT CMAKE_CUDA_HOST_COMPILER)
    set(CMAKE_CUDA_HOST_COMPILER ${CMAKE_CXX_COMPILER})
  endif()
  # Diagnostics-related switches.
  option(MGE_ENABLE_RTTI    "Build with RTTI" ON)
  option(MGE_ENABLE_LOGGING "Build with logging" ON)
  option(MGE_DEBUG_UTIL     "Enable debug utility" ON)

  # Fall back to RelWithDebInfo when neither a multi-config generator nor an
  # explicit CMAKE_BUILD_TYPE is in use.
  if(NOT (CMAKE_CONFIGURATION_TYPES OR CMAKE_BUILD_TYPE))
    message(STATUS "Setting build type to 'RelWithDebInfo' as none was specified.")
    set(CMAKE_BUILD_TYPE RelWithDebInfo)
  endif()
  # Turn off C++ RTTI in host code when requested.
  if(NOT MGE_ENABLE_RTTI)
    string(APPEND CMAKE_CXX_FLAGS " -fno-rtti")
  endif()

  # Turn off C++ exceptions in host code when requested.
  option(MGE_ENABLE_EXCEPTIONS "Build with exceptions" ON)
  if(NOT MGE_ENABLE_EXCEPTIONS)
    # The GCC/Clang switch is spelled -fno-exceptions (plural); the singular
    # spelling is rejected by the compiler as an unknown option.
    string(APPEND CMAKE_CXX_FLAGS " -fno-exceptions")
  endif()
  # Build-shape switches: tests, distributed training, inference-only library
  # and the Python module.
  option(MGE_WITH_TEST          "Enable test for MegEngine." OFF)
  option(MGE_WITH_DISTRIBUTED   "Build with distributed support" ON)
  option(MGE_INFERENCE_ONLY     "Build inference only library." OFF)
  option(MGE_WITH_PYTHON_MODULE "Build MegEngine Python Module." ON)

  # Pull in the gtest module as soon as tests are requested.
  if(MGE_WITH_TEST)
    include(cmake/gtest.cmake)
  endif()

  # Distributed support is switched off when CUDA is not enabled.
  if(NOT MGE_WITH_CUDA)
    message("-- Disable distributed support, as CUDA is not enabled.")
    set(MGE_WITH_DISTRIBUTED OFF)
  endif()

  # An inference-only build drops distributed support, the Python module and
  # the tests.
  if(MGE_INFERENCE_ONLY)
    message("-- Disable distributed support for inference only build.")
    set(MGE_WITH_DISTRIBUTED OFF)

    message("-- Disable python module for inference only build.")
    set(MGE_WITH_PYTHON_MODULE OFF)

    message("-- Disable tests for inference only build.")
    set(MGE_WITH_TEST OFF)
  endif()
  # Distributed builds include the protobuf and ZeroMQ modules, in that order.
  if(MGE_WITH_DISTRIBUTED)
    foreach(_mge_dist_module protobuf zmq)
      include(cmake/${_mge_dist_module}.cmake)
    endforeach()
  endif()

  # FlatBuffers serialization support is optional.
  if(MGB_WITH_FLATBUFFERS)
    include(cmake/flatbuffers.cmake)
  endif()
  # Host compiler settings.
  #  * MSVC: define NOMINMAX, _USE_MATH_DEFINES and WIN32 for every target.
  #  * Others: enable -Wall -Wextra and set the Debug/Release flag sets
  #    (Android release builds use -Ofast instead of -O3).
  if(MSVC)
    # add_definitions() is used instead of add_compile_definitions() because
    # the latter only exists since CMake 3.12, while this project declares
    # 3.9 as its minimum version. Both populate COMPILE_DEFINITIONS.
    add_definitions(-DNOMINMAX=1 -D_USE_MATH_DEFINES=1 -DWIN32=1)
  else()
    string(APPEND CMAKE_CXX_FLAGS " -Wall -Wextra")
    set(CMAKE_CXX_FLAGS_DEBUG "-O0 -g")
    if(ANDROID)
      set(CMAKE_CXX_FLAGS_RELEASE "-Ofast -DNDEBUG")
    else()
      set(CMAKE_CXX_FLAGS_RELEASE "-O3 -DNDEBUG")
    endif()
  endif()
  # CUDA build configuration. Everything in this block applies only when
  # MGE_WITH_CUDA is on: include/link directories, nvcc flags, the default
  # -gencode list, the cuDNN/TensorRT modules and the MGE_CUDA_LIBS link list.
  if(MGE_WITH_CUDA)
    include_directories(${CMAKE_CUDA_TOOLKIT_INCLUDE_DIRECTORIES})

    # Use the CUDA host implicit link directories, skipping every directory
    # whose last path component is "stubs".
    foreach(path ${CMAKE_CUDA_HOST_IMPLICIT_LINK_DIRECTORIES})
      get_filename_component(_NAME ${path} NAME)
      if(NOT "${_NAME}" STREQUAL "stubs")
        list(APPEND CUDA_LINK_DIRECTORIES ${path})
      endif()
    endforeach()
    link_directories(${CUDA_LINK_DIRECTORIES})

    # nvcc flags per build configuration.
    set(CMAKE_CUDA_FLAGS_DEBUG "-O0 -g")
    set(CMAKE_CUDA_FLAGS_RELEASE "-O3")
    set(CMAKE_CUDA_FLAGS_RELWITHDEBINFO "-O3 -g")
    set(CMAKE_CUDA_FLAGS_MINSIZEREL "-Os")

    # Common nvcc flags; host-compiler options are forwarded with -Xcompiler.
    set(CMAKE_CUDA_FLAGS "-Xcompiler -Wall,-Wextra -Xfatbin -compress-all")
    if(NOT MGE_ENABLE_RTTI)
      string(APPEND CMAKE_CUDA_FLAGS " -Xcompiler -fno-rtti")
    endif()
    if(NOT MGE_ENABLE_EXCEPTIONS)
      # The host-compiler switch is spelled -fno-exceptions (plural).
      string(APPEND CMAKE_CUDA_FLAGS " -Xcompiler -fno-exceptions")
    endif()

    # Choose default -gencode options unless the user supplied MGE_CUDA_GENCODE.
    if(NOT MGE_CUDA_GENCODE)
      if(NOT ("${MGE_ARCH}" STREQUAL "x86_64" OR "${MGE_ARCH}" STREQUAL "i386"))
        message(FATAL_ERROR "Unsupported CUDA host arch.")
      endif()
      set(MEGDNN_THREADS_512 0)

      # SM architectures compiled by default, keyed on the nvcc version.
      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.0.0")
        set(_mge_default_sms 52 60 61 70 75)
      elseif(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "9.0.0")
        set(_mge_default_sms 52 60 61 70)
      else()
        set(_mge_default_sms 35 52 60 61)
      endif()

      # One code=sm_XX entry per architecture, followed by a single
      # code=compute_XX entry for the newest architecture in the list.
      foreach(_mge_sm IN LISTS _mge_default_sms)
        string(APPEND MGE_CUDA_GENCODE
               " -gencode arch=compute_${_mge_sm},code=sm_${_mge_sm}")
      endforeach()
      list(GET _mge_default_sms -1 _mge_newest_sm)
      string(APPEND MGE_CUDA_GENCODE
             " -gencode arch=compute_${_mge_newest_sm},code=compute_${_mge_newest_sm}")
      unset(_mge_default_sms)
      unset(_mge_newest_sm)
    else()
      set(MEGDNN_THREADS_512 1)
    endif()
    set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} ${MGE_CUDA_GENCODE}")

    include(cmake/cudnn.cmake)
    if(MGE_WITH_TRT)
      include(cmake/tensorrt.cmake)
    endif()

    if(MGE_CUDA_USE_STATIC)
      # cuDNN (and TensorRT when enabled) are linked as whole archives.
      list(APPEND MGE_CUDA_LIBS -Wl,--whole-archive)
      if(MGE_WITH_TRT)
        list(APPEND MGE_CUDA_LIBS libnvinfer)
      endif()
      list(APPEND MGE_CUDA_LIBS libcudnn -Wl,--no-whole-archive)

      list(APPEND MGE_CUDA_LIBS
           cusolver_static cublas_static curand_static culibos cudart_static cusparse_static)
      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.1.0")
        list(APPEND MGE_CUDA_LIBS cublasLt_static)
      endif()

      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.0.0")
        # mark all symbols from liblapack_static.a as weak to avoid
        # duplicated definition with mkl
        find_library(
          LAPACK_STATIC_PATH lapack_static
          HINTS ${CMAKE_CUDA_HOST_IMPLICIT_LINK_DIRECTORIES})
        if(NOT LAPACK_STATIC_PATH)
          message(FATAL_ERROR "liblapack_static.a not found")
        endif()
        set(LAPACK_STATIC_COPY_PATH ${CMAKE_CURRENT_BINARY_DIR}/liblapack_static_copy.a)

        # Build rule that runs objcopy to produce the weakened copy.
        add_custom_command(
          OUTPUT ${LAPACK_STATIC_COPY_PATH}
          COMMAND ${CMAKE_OBJCOPY} -w -W* ${LAPACK_STATIC_PATH} ${LAPACK_STATIC_COPY_PATH}
          VERBATIM)
        add_custom_target(lapack_static_weak_target DEPENDS ${LAPACK_STATIC_COPY_PATH})

        # Imported library "lapack_static_weak" pointing at the weakened copy.
        add_library(lapack_static_weak STATIC IMPORTED GLOBAL)
        add_dependencies(lapack_static_weak lapack_static_weak_target)
        set_target_properties(
          lapack_static_weak PROPERTIES
          IMPORTED_LOCATION ${LAPACK_STATIC_COPY_PATH})
        list(APPEND MGE_CUDA_LIBS lapack_static_weak ${LAPACK_STATIC_COPY_PATH})
      endif()
    else()
      if(MGE_WITH_TRT)
        list(APPEND MGE_CUDA_LIBS libnvinfer)
      endif()
      list(APPEND MGE_CUDA_LIBS libcudnn)
      # NOTE(review): the shared cuBLAS/cuSOLVER/cuRAND libraries are only
      # added for CUDA >= 10.1 here -- confirm older toolkits get them elsewhere.
      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.1.0")
        list(APPEND MGE_CUDA_LIBS cublasLt cusolver cublas curand)
      endif()
    endif()

    add_subdirectory(dnn/cuda-stub)
    list(APPEND MGE_CUDA_LIBS nvrtc cuda-stub nvToolsExt)
    set(MGE_CUDA_LIBS "${MGE_CUDA_LIBS}")
  endif()
  # Route compilations through ccache when it is installed. The CUDA launcher
  # is only set for CMake 3.10.0 and newer.
  find_program(CCACHE_BIN ccache)
  if(CCACHE_BIN)
    set(CMAKE_CXX_COMPILER_LAUNCHER ${CCACHE_BIN})
    if(MGE_WITH_CUDA AND CMAKE_VERSION VERSION_GREATER_EQUAL "3.10.0")
      message("-- Using ccache as CMAKE_CUDA_COMPILER_LAUNCHER")
      set(CMAKE_CUDA_COMPILER_LAUNCHER ${CCACHE_BIN})
    endif()
  endif()
  # On x86 targets, include the module for the selected BLAS backend and record
  # the library name to link in MGE_BLAS_LIBS. Any value other than MKL or
  # OpenBLAS aborts configuration.
  if(MGE_ARCH STREQUAL "x86_64" OR MGE_ARCH STREQUAL "i386")
    if(MGE_BLAS STREQUAL "MKL")
      include(cmake/mkl.cmake)
      set(MGE_BLAS_LIBS libmkl)
    elseif(MGE_BLAS STREQUAL "OpenBLAS")
      include(cmake/OpenBLAS.cmake)
      set(MGE_BLAS_LIBS libopenblas)
    else()
      message(FATAL_ERROR "Unknown BLAS implementation ${MGE_BLAS}")
    endif()
  endif()
  # Intel MKL-DNN support: only wired in for x86_64 targets, where it also sets
  # MEGDNN_X86_WITH_MKL_DNN.
  option(MGE_WITH_MKLDNN "Enable Intel MKL_DNN support," ON)
  if(MGE_WITH_MKLDNN AND MGE_ARCH STREQUAL "x86_64")
    include(cmake/MKL_DNN.cmake)
    set(MEGDNN_X86_WITH_MKL_DNN 1)
  endif()
  # RTTI: name mangling is enabled exactly when RTTI is disabled.
  set(MEGDNN_ENABLE_MANGLING 1)
  set(MEGDNN_ENABLE_RTTI 0)
  if(MGE_ENABLE_RTTI)
    set(MEGDNN_ENABLE_MANGLING 0)
    set(MEGDNN_ENABLE_RTTI 1)
  endif()
  set(MGB_VERBOSE_TYPEINFO_NAME ${MGE_ENABLE_RTTI})

  # Logging: the logging switch also drives the JSON setting.
  set(MGB_ENABLE_LOGGING ${MGE_ENABLE_LOGGING})
  set(MEGDNN_ENABLE_LOGGING ${MGE_ENABLE_LOGGING})
  set(MGB_ENABLE_JSON ${MGE_ENABLE_LOGGING})

  # Exceptions: mirror the user switch and tell the user what happens when
  # exceptions are turned off.
  set(MGB_ENABLE_EXCEPTION ${MGE_ENABLE_EXCEPTIONS})
  set(MEGDNN_ENABLE_EXCEPTIONS ${MGE_ENABLE_EXCEPTIONS})
  if(NOT MGE_ENABLE_EXCEPTIONS)
    message(STATUS "Exceptions disabled; MegEngine would kill itself when it is supposed to throw an exception.")
  endif()
  # JIT: Halide is pulled in (as a non-shared library) only when both JIT and
  # Halide are enabled.
  if(MGE_WITH_JIT AND MGE_WITH_HALIDE)
    set(HALIDE_SHARED_LIBRARY OFF CACHE BOOL "Build as a shared library")
    include(cmake/Halide.cmake)
  endif()
  set(MGB_JIT ${MGE_WITH_JIT})
  set(MGB_JIT_HALIDE ${MGE_WITH_HALIDE})

  # Threads: flagged as available when a thread library flag was reported.
  if(CMAKE_THREAD_LIBS_INIT)
    set(MGB_HAVE_THREAD 1)
  endif()

  # Test builds use intra-op multi-threading.
  if(MGE_WITH_TEST)
    set(MEGDNN_ENABLE_MULTI_THREADS 1)
  endif()

  # CUDA: both configuration values follow the user switch.
  set(MGB_CUDA ${MGE_WITH_CUDA})
  set(MEGDNN_WITH_CUDA ${MGE_WITH_CUDA})
  # Debug info: assertion locations and the debug utilities are enabled for the
  # Debug and RelWithDebInfo build types and disabled otherwise.
  # CMAKE_BUILD_TYPE is quoted because it is empty under multi-config
  # generators, and an unquoted empty expansion makes if() a syntax error.
  # NOTE(review): the MGE_DEBUG_UTIL option declared in this file is not
  # consulted here -- confirm whether it should gate MGB_ENABLE_DEBUG_UTIL.
  if("${CMAKE_BUILD_TYPE}" STREQUAL "Debug" OR "${CMAKE_BUILD_TYPE}" STREQUAL "RelWithDebInfo")
    set(MGB_ASSERT_LOC 1)
    set(MGB_ENABLE_DEBUG_UTIL 1)
  else()
    set(MGB_ASSERT_LOC 0)
    set(MGB_ENABLE_DEBUG_UTIL 0)
  endif()
  # TensorRT follows the user switch.
  set(MGB_ENABLE_TENSOR_RT ${MGE_WITH_TRT})

  # Inference-only builds drop gradient support and enable slim serving; the
  # defaults below describe a full build.
  set(MGB_ENABLE_GRAD 1)
  set(MGB_BUILD_SLIM_SERVING 0)
  if(MGE_INFERENCE_ONLY)
    set(MGB_ENABLE_GRAD 0)
    set(MGB_BUILD_SLIM_SERVING 1)
  endif()

  # Distributed communication follows the distributed switch.
  set(MGB_ENABLE_OPR_MM ${MGE_WITH_DISTRIBUTED})
  # MGE_ARCH related configuration values and compiler flags.
  if(MGE_ARCH STREQUAL "x86_64" OR MGE_ARCH STREQUAL "i386")
    # Record which BLAS backend the x86 kernels are built against.
    if(MGE_BLAS STREQUAL "MKL")
      set(MEGDNN_X86_WITH_MKL 1)
    elseif(MGE_BLAS STREQUAL "OpenBLAS")
      set(MEGDNN_X86_WITH_OPENBLAS 1)
    endif()

    set(MEGDNN_X86 1)
    if(MGE_ARCH STREQUAL "x86_64")
      set(MEGDNN_X86_64 1)
      set(MEGDNN_64_BIT 1)
      set(_mge_word_size_flag "-m64")
    else()
      set(MEGDNN_X86_32 1)
      set(_mge_word_size_flag "-m32")
    endif()

    # Word-size and SSE flags are only passed to non-MSVC compilers.
    if(NOT MSVC)
      string(APPEND CMAKE_CXX_FLAGS " ${_mge_word_size_flag} -msse4.2 -mfpmath=sse")
    endif()
    unset(_mge_word_size_flag)
  endif()

  # The naive architecture is supported, with a warning about performance.
  if(MGE_ARCH STREQUAL "naive")
    set(MEGDNN_NAIVE 1)
    message(WARNING "MEGDNN_NAIVE is enabled; MegDNN performance is degraded.")
  endif()

  # Append whatever MARCH holds to the C++ flags.
  # NOTE(review): MARCH is not set anywhere in the visible file -- presumably
  # it is supplied on the command line or by an included module; confirm.
  string(APPEND CMAKE_CXX_FLAGS " ${MARCH}")
  # Generate megbrain_build_config.h from its template into the build tree and
  # install it. The header defines macros needed by both megbrain and dnn.
  set(_mge_build_config_header ${CMAKE_CURRENT_BINARY_DIR}/genfiles/megbrain_build_config.h)
  configure_file(src/megbrain_build_config.h.in ${_mge_build_config_header})
  install(FILES ${_mge_build_config_header} DESTINATION include)
  unset(_mge_build_config_header)

  add_subdirectory(dnn)
  # Generation of megbrain/opr/param_defs.h: a Python script turns the operator
  # parameter definitions into a header inside the build tree, which is then
  # installed and exposed through the INTERFACE library mgb_opr_param_defs.
  list(APPEND MGB_OPR_PARAM_DEFS_SRCS
       ${CMAKE_CURRENT_SOURCE_DIR}/tools/param_defs/mgb_opr_param_defs.py)
  set(MGB_OPR_PARAM_DEFS_SCRIPT ${CMAKE_CURRENT_SOURCE_DIR}/dnn/scripts/gen_param_defs.py)
  set(MGB_OPR_PARAM_DEFS_OUT_DIR ${CMAKE_CURRENT_BINARY_DIR}/src/opr/include/)
  file(MAKE_DIRECTORY ${MGB_OPR_PARAM_DEFS_OUT_DIR}/megbrain/opr)

  # Build rule: rerun the generator whenever the definitions or the script change.
  set(_mge_param_defs_header ${MGB_OPR_PARAM_DEFS_OUT_DIR}/megbrain/opr/param_defs.h)
  add_custom_command(
    OUTPUT ${_mge_param_defs_header}
    COMMAND
      ${PYTHON_EXECUTABLE} ${MGB_OPR_PARAM_DEFS_SCRIPT} ${MGB_OPR_PARAM_DEFS_SRCS}
      ${_mge_param_defs_header}
    DEPENDS ${MGB_OPR_PARAM_DEFS_SRCS} ${MGB_OPR_PARAM_DEFS_SCRIPT}
    VERBATIM
  )
  list(APPEND MGB_OPR_PARAM_DEFS_OUTS ${_mge_param_defs_header})
  unset(_mge_param_defs_header)

  install(FILES ${MGB_OPR_PARAM_DEFS_OUTS} DESTINATION include/megbrain/opr/)

  # Consumers link mgb_opr_param_defs to get the include path; the dependency
  # on _mgb_opr_param_defs orders the header generation before them.
  list(APPEND MGB_OPR_PARAM_DEFS_INC ${MGB_OPR_PARAM_DEFS_OUT_DIR})
  add_custom_target(_mgb_opr_param_defs DEPENDS ${MGB_OPR_PARAM_DEFS_OUTS})
  add_library(mgb_opr_param_defs INTERFACE)
  target_include_directories(mgb_opr_param_defs INTERFACE ${MGB_OPR_PARAM_DEFS_INC})
  add_dependencies(mgb_opr_param_defs _mgb_opr_param_defs)
  # Sub-projects, in build order. MegRay is only added for distributed builds,
  # the Python module only when requested, and the tests only when both tests
  # and RTTI are enabled.
  if(MGE_WITH_DISTRIBUTED)
    add_subdirectory(${PROJECT_SOURCE_DIR}/third_party/MegRay)
  endif()

  add_subdirectory(src)
  add_subdirectory(sdk/load-and-run)

  if(MGE_WITH_PYTHON_MODULE)
    add_subdirectory(python_module)
  endif()

  if(MGE_WITH_TEST AND MGE_ENABLE_RTTI)
    add_subdirectory(test)
  endif()
  # "develop" target: once _mgb is built, symlink the generated Python module
  # artifacts from the build tree into the source tree's
  # python_module/megengine/_internal directory.
  if(TARGET _mgb)
    set(_mge_internal_subdir python_module/megengine/_internal)

    # One create_symlink command per artifact, in the listed order.
    set(_mge_develop_commands)
    foreach(_mge_artifact
            $<TARGET_FILE_NAME:_mgb>
            mgb.py
            opr.py
            opr_param_defs.py
            include)
      list(APPEND _mge_develop_commands
           COMMAND ${CMAKE_COMMAND} -E create_symlink
           ${CMAKE_CURRENT_BINARY_DIR}/${_mge_internal_subdir}/${_mge_artifact}
           ${CMAKE_CURRENT_SOURCE_DIR}/${_mge_internal_subdir}/${_mge_artifact})
    endforeach()

    add_custom_target(
      develop
      ${_mge_develop_commands}
      DEPENDS _mgb
      VERBATIM
    )

    unset(_mge_develop_commands)
    unset(_mge_internal_subdir)
  endif()
  # On Apple platforms, set the thread-detection result variables by hand:
  # pthreads via -lpthread, no Win32 threads.
  if(APPLE)
    set(CMAKE_THREAD_LIBS_INIT "-lpthread")
    set(CMAKE_HAVE_THREADS_LIBRARY 1)
    set(CMAKE_USE_WIN32_THREADS_INIT 0)
    set(CMAKE_USE_PTHREADS_INIT 1)
    set(THREADS_PREFER_PTHREAD_FLAG ON)
  endif()

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境，不用区分 CPU 和 GPU 版。如果想要运行 GPU 程序，请确保机器本身配有 GPU 硬件设备并安装好驱动。如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉，欢迎访问 MegStudio 平台。