You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

CMakeLists.txt 31 kB

12345678910111213141516171819202122232425262728293031323334353637383940414243444546474849505152535455565758596061626364656667686970717273747576777879808182838485868788899091929394959697989910010110210310410510610710810911011111211311411511611711811912012112212312412512612712812913013113213313413513613713813914014114214314414514614714814915015115215315415515615715815916016116216316416516616716816917017117217317417517617717817918018118218318418518618718818919019119219319419519619719819920020120220320420520620720820921021121221321421521621721821922022122222322422522622722822923023123223323423523623723823924024124224324424524624724824925025125225325425525625725825926026126226326426526626726826927027127227327427527627727827928028128228328428528628728828929029129229329429529629729829930030130230330430530630730830931031131231331431531631731831932032132232332432532632732832933033133233333433533633733833934034134234334434534634734834935035135235335435535635735835936036136236336436536636736836937037137237337437537637737837938038138238338438538638738838939039139239339439539639739839940040140240340440540640740840941041141241341441541641741841942042142242342442542642742842943043143243343443543643743843944044144244344444544644744844945045145245345445545645745845946046146246346446546646746846947047147247347447547647747847948048148248348448548648748848949049149249349449549649749849950050150250350450550650750850951051151251351451551651751851952052152252352452552652752852953053153253353453553653753853954054154254354454554654754854955055155255355455555655755855956056156256356456556656756856957057157257357457557657757857958058158258358458558658758858959059159259359459559659759859960060160260360460560660760860961061161261361461561661761861962062162262362462562662762862963063163263363463563663763863964064164264364464564664764864965065165265365465565665765865966066166266366466566666766866967067167267367467567667767867968068168268368468568668768868969069169269369469569669769869970070170270
3704705706707708709710711712713714715716717718719720721722723724725726727728729730731732733734735736737738739740741742743744745746747748749750751752753754755756757758759760761762763764765766767768769770771772773774775776777778779780781782783784785786787788789790791792793794795796797798799800801802
  # Top-level build script for MegEngine: project declaration and
  # toolchain-wide defaults.
  cmake_minimum_required(VERSION 3.14.4)

  # Included before project() because project() consumes MGB_VER_STRING
  # (presumably defined by this module -- confirm in the module itself).
  include(cmake/FetchMegBrainVersion.cmake)
  project(MegEngine LANGUAGES C CXX VERSION ${MGB_VER_STRING})

  # C++14, strictly required, without compiler-specific extensions.
  set(CMAKE_CXX_STANDARD 14)
  set(CMAKE_CXX_STANDARD_REQUIRED ON)
  set(CMAKE_CXX_EXTENSIONS OFF)

  # Build everything as position-independent code.
  set(CMAKE_POSITION_INDEPENDENT_CODE ON)

  set(CMAKE_MODULE_PATH ${PROJECT_SOURCE_DIR}/cmake/Modules)
  set(CMAKE_POLICY_DEFAULT_CMP0048 NEW)

  # Override the C++ static-archive rules so that ar/ranlib are invoked with the
  # "D" modifier; skipped for MSVC, Apple and Windows toolchains.
  if(NOT (MSVC OR APPLE OR WIN32))
    set(CMAKE_CXX_ARCHIVE_CREATE "<CMAKE_AR> Dqc <TARGET> <LINK_FLAGS> <OBJECTS>")
    set(CMAKE_CXX_ARCHIVE_APPEND "<CMAKE_AR> Dq <TARGET> <LINK_FLAGS> <OBJECTS>")
    set(CMAKE_CXX_ARCHIVE_FINISH "<CMAKE_RANLIB> -D <TARGET>")
  endif()

  include(GNUInstallDirs)
  include(CheckCXXCompilerFlag)

  # Records in CXX_SUPPORT_WCLASS_MEMACCESS whether the compiler accepts
  # -Wclass-memaccess.
  check_cxx_compiler_flag(-Wclass-memaccess CXX_SUPPORT_WCLASS_MEMACCESS)
  # ---------------------------------------------------------------------------
  # User-facing cache variables and options.
  # ---------------------------------------------------------------------------

  # Target architecture. "AUTO" is replaced by a concrete value later in this
  # file, either from the cross-compiling toolchain or from
  # CMAKE_SYSTEM_PROCESSOR.
  set(MGE_ARCH AUTO CACHE STRING "Architecture on which MegEngine to be built.")
  set_property(CACHE MGE_ARCH PROPERTY STRINGS
    AUTO
    x86_64 i386
    armv7 aarch64
    naive fallback
  )

  # Export-set name used by the install(TARGETS ... EXPORT ...) calls.
  set(MGE_EXPORT_TARGETS MegEngine-targets)

  # JIT back ends.
  option(MGE_WITH_JIT "Build MegEngine with JIT." ON)
  option(MGE_WITH_HALIDE "Build MegEngine with Halide JIT" ON)

  # ARM feature switches and float16 support.
  option(MGE_ARMV8_2_FEATURE_FP16 "Enable armv8.2-a+fp16 support" OFF)
  option(MGE_ARMV8_2_FEATURE_DOTPROD "enable armv8.2-a+dotprod support" OFF)
  option(MGE_DISABLE_FLOAT16 "Disable MegEngine float16 support." OFF)

  # CUDA / TensorRT.
  option(MGE_WITH_CUDA "Enable MegEngine CUDA support." ON)
  option(MGE_CUDA_USE_STATIC "Enable MegEngine CUDA static linking." ON)
  option(MGE_WITH_TRT "Build MegEngine with TensorRT." ON)

  # Third-party library and serialization choices.
  option(MGE_USE_SYSTEM_LIB "Build MegEngine with system libraries." OFF)
  option(MGB_WITH_FLATBUFFERS "Build MegBrain with FlatBuffers serialization support." ON)

  # Other accelerators and library type.
  option(MGE_WITH_CAMBRICON "Build MegEngine with Cambricon support" OFF)
  option(BUILD_SHARED_LIBS "Build shared libraries" ON)
  option(MGE_WITH_ATLAS "Build MegEngine with Atlas support" OFF)

  # Language/runtime feature toggles.
  option(MGE_ENABLE_RTTI "Build with RTTI" ON)
  option(MGE_ENABLE_LOGGING "Build with logging" ON)
  option(MGE_DEBUG_UTIL "Enable debug utility" ON)
  option(MGE_ENABLE_EXCEPTIONS "Build with exceptions" ON)

  # What gets built.
  option(MGE_WITH_TEST "Enable test for MegEngine." OFF)
  option(MGE_WITH_DISTRIBUTED "Build with distributed support" ON)
  option(MGE_BUILD_IMPERATIVE_RT "Build _imperative_rt.so instead of _mgb.so " OFF)
  option(MGE_BUILD_SDK "Build load_and_run" ON)
  option(MGE_INFERENCE_ONLY "Build inference only library." OFF)
  option(MGE_WITH_PYTHON_MODULE "Build MegEngine Python Module." ON)

  # Additional compute back ends.
  option(MGE_WITH_MKLDNN "Enable Intel MKL_DNN support," ON)
  option(MGE_WITH_ROCM "Enable ROCM support" OFF)
  # Adjust options that depend on the platform or on other options.

  # Apple builds are always static (see the message text for the rationale).
  if(APPLE)
    set(BUILD_SHARED_LIBS OFF)
    message("build static for xcode framework require")
  endif()

  # Using system libraries turns off static CUDA linking.
  if(MGE_USE_SYSTEM_LIB)
    set(MGE_CUDA_USE_STATIC OFF)
  endif()

  # FlatBuffers support switches on the FBS serialization setting.
  if(MGB_WITH_FLATBUFFERS)
    set(MGB_ENABLE_FBS_SERIALIZATION ON)
  endif()
  # Cross compilation. The presence of a toolchain file is treated as "we are
  # cross compiling"; MGE_ARCH is then derived from the toolchain's variables
  # (Android, iOS, or an explicit ARM_CROSS_BUILD_ARCH).
  if(CMAKE_TOOLCHAIN_FILE)
    message("We are cross compiling.")
    # Point FlatBuffers at the flatc binary under build_dir/host_flatc.
    message("config FLATBUFFERS_FLATC_EXECUTABLE to: ${PROJECT_SOURCE_DIR}/build_dir/host_flatc/install/bin/flatc")
    set(FLATBUFFERS_FLATC_EXECUTABLE "${PROJECT_SOURCE_DIR}/build_dir/host_flatc/install/bin/flatc")

    if(ANDROID_TOOLCHAIN_ROOT)
      # ANDROID_ARCH_NAME, when provided, overrides ANDROID_ARCH.
      if(NOT "${ANDROID_ARCH_NAME}" STREQUAL "")
        set(ANDROID_ARCH ${ANDROID_ARCH_NAME})
      endif()
      # The expansions are quoted so that an empty/unset ANDROID_ARCH reaches the
      # FATAL_ERROR below instead of producing a malformed if() expression.
      if("${ANDROID_ARCH}" STREQUAL "arm")
        set(MGE_ARCH "armv7")
      elseif("${ANDROID_ARCH}" STREQUAL "arm64")
        set(MGE_ARCH "aarch64")
      else()
        message(FATAL_ERROR "DO NOT SUPPORT ANDROID ARCH NOW")
      endif()
    elseif(IOS_TOOLCHAIN_ROOT)
      # All 32-bit iOS variants map to armv7, all 64-bit variants to aarch64.
      if("${IOS_ARCH}" STREQUAL "armv7"
         OR "${IOS_ARCH}" STREQUAL "armv7k"
         OR "${IOS_ARCH}" STREQUAL "armv7s")
        set(MGE_ARCH "armv7")
      elseif("${IOS_ARCH}" STREQUAL "arm64" OR "${IOS_ARCH}" STREQUAL "arm64e")
        set(MGE_ARCH "aarch64")
      else()
        message(FATAL_ERROR "Unsupported IOS_ARCH.")
      endif()
    elseif(NOT "${ARM_CROSS_BUILD_ARCH}" STREQUAL "")
      set(MGE_ARCH ${ARM_CROSS_BUILD_ARCH})
    else()
      message(FATAL_ERROR "Unknown cross-compiling settings.")
    endif()

    message("CONFIG MGE_ARCH TO ${MGE_ARCH}")
  endif()
  # Resolve MGE_ARCH=AUTO from the processor CMake reports for the target system.
  # Expansions are quoted so an empty CMAKE_SYSTEM_PROCESSOR falls through to the
  # error branch rather than breaking the if() syntax.
  if("${MGE_ARCH}" STREQUAL "AUTO")
    if("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "x86_64" OR "${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "AMD64")
      set(MGE_ARCH "x86_64")
    elseif("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "i386" OR "${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "i686")
      set(MGE_ARCH "i386")
    elseif("${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "aarch64" OR "${CMAKE_SYSTEM_PROCESSOR}" STREQUAL "arm64")
      set(MGE_ARCH "aarch64")
    elseif("${CMAKE_SYSTEM_PROCESSOR}" MATCHES "^arm")
      set(MGE_ARCH "armv7")
    else()
      # FATAL_ERROR (not "FATAL", which message() would print as plain text)
      # so that configuration actually stops here.
      message(FATAL_ERROR "Unknown machine architecture for MegEngine.")
    endif()
  endif()
  # cpuinfo is only offered on the x86 and ARM architectures; the option itself
  # is declared here, so it does not exist for other MGE_ARCH values.
  if(${MGE_ARCH} STREQUAL "x86_64"
     OR ${MGE_ARCH} STREQUAL "i386"
     OR ${MGE_ARCH} STREQUAL "armv7"
     OR ${MGE_ARCH} STREQUAL "aarch64")
    option(MGE_ENABLE_CPUINFO "Build cpuinfo library for check runtime." ON)
    if(MGE_ENABLE_CPUINFO)
      message("-- Enable cpuinfo runtime check and little kernel optimize.")
      add_definitions(-DMGB_ENABLE_CPUINFO_CHECK)
      include(cmake/cpuinfo.cmake)
    endif()
  endif()
  # Platform-specific compiler flags.
  if(MSVC OR WIN32)
    add_compile_definitions(NOMINMAX=1 _USE_MATH_DEFINES=1 WIN32=1)
    message("-- into windows build...")
    message("-- CMAKE_C_COMPILER_ID: ${CMAKE_C_COMPILER_ID}")
    # Only clang-cl is supported on Windows. CMake reports clang-cl with the
    # compiler id "Clang" (there is no "Clang-cl" id), so reject everything else.
    if(NOT "${CMAKE_C_COMPILER_ID}" STREQUAL "Clang")
      message(FATAL_ERROR "only support clang-cl for windows build, pls check detail: scripts/cmake-build/BUILD_README.md")
    endif()

    # add flags for enable sse instruction optimize for X86, enable avx header to compile avx code
    set(WIN_FLAGS "-msse4.2 -O2 -D_AVX_ -D_AVX2_ -D__AVX__ -D__AVX2__ -D__FMA__")
    # if your CPU is in the cascadelake series, you can enable these for performance
    # set(WIN_FLAGS "${WIN_FLAGS} -march=cascadelake -mtune=cascadelake")
    # set(WIN_FLAGS "${WIN_FLAGS} -mavx512cd -mavx512vl -mavx512dq -mavx512bw -mavx512vbmi -mavx512vnni")

    # for windows build: demote selected clang diagnostics from errors
    set(WIN_FLAGS "${WIN_FLAGS} -Wno-error=implicit-int-conversion -Wno-error=double-promotion")
    set(WIN_FLAGS "${WIN_FLAGS} -Wno-error=zero-as-null-pointer-constant")
    set(WIN_FLAGS "${WIN_FLAGS} -Wno-error=float-conversion -Wno-error=shadow-field -Wno-error=covered-switch-default")
    set(WIN_FLAGS "${WIN_FLAGS} -Wno-error=deprecated -Wno-error=documentation -Wno-error=unreachable-code-break")
    # MSVC-style definitions and warning suppressions
    set(WIN_FLAGS "${WIN_FLAGS} /DWIN32 -Wno-macro-redefined /D_WIN32_WINNT=0x0601 /wd4819")
    set(WIN_FLAGS "${WIN_FLAGS} /D_CRT_SECURE_NO_DEPRECATE /D_CRT_SECURE_NO_WARNINGS /DNOGDI /D_USE_MATH_DEFINES /bigobj")
    set(WIN_FLAGS "${WIN_FLAGS} /Zm500 /EHs /wd4351 /wd4291 /wd4250 /wd4996 -Wno-inconsistent-dllimport")

    set(CMAKE_C_FLAGS "${CMAKE_C_FLAGS} ${WIN_FLAGS}")
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${WIN_FLAGS}")

    #FIXME: fix halide JIT on windows
    message("-- disable jit and halide on windows host build...")
    set(MGE_WITH_HALIDE OFF)
    set(MGE_WITH_JIT OFF)

    #FIXME: fix MegRay on windows
    message("-- Disable distributed build on windows host build...")
    set(MGE_WITH_DISTRIBUTED OFF)
  else()
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -Wall -Wextra")
    set(CMAKE_CXX_FLAGS_DEBUG "-O0 -g")
    # Android optimized builds use -Ofast; every other platform uses -O3.
    if(ANDROID)
      set(CMAKE_CXX_FLAGS_RELEASE "-Ofast -DNDEBUG")
      set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "-Ofast -DNDEBUG -g")
    else()
      set(CMAKE_CXX_FLAGS_RELEASE "-O3 -DNDEBUG")
      set(CMAKE_CXX_FLAGS_RELWITHDEBINFO "-O3 -DNDEBUG -g")
    endif()
  endif()
  # Use the GNU gold linker when the compiler accepts -fuse-ld=gold, except on
  # Android, Apple and Windows/MSVC builds.
  check_cxx_compiler_flag(-fuse-ld=gold CXX_SUPPORT_GOLD)
  if(CXX_SUPPORT_GOLD AND NOT (ANDROID OR APPLE OR MSVC OR WIN32))
    message("-- Using GNU gold linker.")
    set(MGE_COMMON_LINKER_FLAGS "-fuse-ld=gold")
    # Apply the flag to shared libraries, modules and executables alike.
    foreach(_mge_link_kind SHARED MODULE EXE)
      set(CMAKE_${_mge_link_kind}_LINKER_FLAGS
          "${CMAKE_${_mge_link_kind}_LINKER_FLAGS} ${MGE_COMMON_LINKER_FLAGS}")
    endforeach()
  endif()

  # Halide is a JIT back end, so it cannot stay enabled without JIT.
  if(MGE_WITH_HALIDE AND NOT MGE_WITH_JIT)
    message(WARNING "MGE_WITH_HALIDE is set to OFF with MGE_WITH_JIT disabled")
    set(MGE_WITH_HALIDE OFF)
  endif()
  # Either enable the CUDA language, or switch off every feature that needs it.
  if(MGE_WITH_CUDA)
    include(CheckLanguage)
    check_language(CUDA)
    if(NOT CMAKE_CUDA_COMPILER)
      message(FATAL_ERROR "CUDA compiler not found in PATH")
    endif()
    enable_language(CUDA)
    # CUDA sources use the same language level as the C++ sources.
    set(CMAKE_CUDA_STANDARD 14)
    set(CMAKE_CUDA_STANDARD_REQUIRED ON)
  else()
    message("-- Disable JIT support, as CUDA is not enabled.")
    set(MGE_WITH_JIT OFF)
    set(MGE_WITH_HALIDE OFF)
    message("-- Disable TensorRT support, as CUDA is not enabled.")
    set(MGE_WITH_TRT OFF)
  endif()
  # A Python 3 interpreter is mandatory.
  find_package(PythonInterp 3 REQUIRED)

  # Prefer the -pthread flag over linking the pthread library explicitly.
  set(THREADS_PREFER_PTHREAD_FLAG ON)
  find_package(Threads)

  # When Threads resolved to the bare "-pthread" flag and CUDA is enabled,
  # replace the compile option on Threads::Threads with a language-aware one:
  # CUDA sources receive it via -Xcompiler, all other languages directly.
  if(MGE_WITH_CUDA AND "${CMAKE_THREAD_LIBS_INIT}" STREQUAL "-pthread")
    set_property(
      TARGET Threads::Threads
      PROPERTY INTERFACE_COMPILE_OPTIONS
        "$<$<COMPILE_LANGUAGE:CUDA>:-Xcompiler=-pthread>"
        "$<$<NOT:$<COMPILE_LANGUAGE:CUDA>>:-pthread>")
  endif()
  # BLAS implementation selector (consumed by the x86 BLAS section of this file).
  set(MGE_BLAS MKL CACHE STRING "BLAS implementaion used by MegEngine.")
  set_property(CACHE MGE_BLAS PROPERTY STRINGS MKL OpenBLAS)

  # Optional user override for the nvcc -gencode list; when empty, a default
  # list is chosen from the CUDA compiler version in the CUDA section.
  set(MGE_CUDA_GENCODE "" CACHE STRING "Overwrite -gencode specifications for CUDA")

  # Default the CUDA host compiler to the C++ compiler. This must be a CMake
  # variable reference (${...}); the make-style $(...) form would store the
  # literal text "$(CMAKE_CXX_COMPILER)" instead of the compiler path.
  if(NOT CMAKE_CUDA_HOST_COMPILER)
    set(CMAKE_CUDA_HOST_COMPILER ${CMAKE_CXX_COMPILER})
  endif()

  # Single-config generators only: fall back to RelWithDebInfo when the user
  # did not choose a build type.
  if(NOT CMAKE_CONFIGURATION_TYPES AND NOT CMAKE_BUILD_TYPE)
    message(STATUS "Setting build type to 'RelWithDebInfo' as none was specified.")
    set(CMAKE_BUILD_TYPE RelWithDebInfo)
  endif()
  # Translate the RTTI / exception options into C++ compiler flags.
  if(NOT MGE_ENABLE_RTTI)
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fno-rtti")
  endif()
  if(NOT MGE_ENABLE_EXCEPTIONS)
    # The flag is spelled -fno-exceptions (plural); "-fno-exception" is not a
    # recognized option.
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -fno-exceptions")
  endif()
  # Unit tests need googletest.
  if(MGE_WITH_TEST)
    include(cmake/gtest.cmake)
  endif()

  # The imperative runtime is compiled as C++17 and advertises itself through a
  # compile definition.
  if(MGE_BUILD_IMPERATIVE_RT)
    add_compile_definitions(MGB_ENABLE_IMPERATIVE_RUNTIME)
    set(CMAKE_CXX_STANDARD 17)
  endif()

  # Distributed support requires CUDA ...
  if(NOT MGE_WITH_CUDA)
    message("-- Disable distributed support, as CUDA is not enabled.")
    set(MGE_WITH_DISTRIBUTED OFF)
  endif()

  # ... and neither it nor the Python module is built for inference-only builds.
  if(MGE_INFERENCE_ONLY)
    message("-- Disable distributed support for inference only build.")
    set(MGE_WITH_DISTRIBUTED OFF)
    message("-- Disable python module for inference only build.")
    set(MGE_WITH_PYTHON_MODULE OFF)
  endif()

  # Third-party dependencies of the features that are still enabled.
  if(MGE_WITH_DISTRIBUTED)
    include(cmake/protobuf.cmake)
    include(cmake/zmq.cmake)
  endif()

  if(MGB_WITH_FLATBUFFERS)
    include(cmake/flatbuffers.cmake)
  endif()
  # CUDA configuration: include/link directories, nvcc flags, the -gencode list,
  # cuDNN/TensorRT, and the list of CUDA libraries to link (MGE_CUDA_LIBS).
  if(MGE_WITH_CUDA)
    include_directories(${CMAKE_CUDA_TOOLKIT_INCLUDE_DIRECTORIES})

    # Use every implicit CUDA link directory except those named "stubs".
    foreach(path ${CMAKE_CUDA_HOST_IMPLICIT_LINK_DIRECTORIES})
      get_filename_component(_NAME ${path} NAME)
      if(NOT "${_NAME}" STREQUAL "stubs")
        list(APPEND CUDA_LINK_DIRECTORIES ${path})
      endif()
    endforeach()
    link_directories(${CUDA_LINK_DIRECTORIES})

    # Per-configuration nvcc flags.
    set(CMAKE_CUDA_FLAGS_DEBUG "-O0 -g")
    set(CMAKE_CUDA_FLAGS_RELEASE "-O3")
    set(CMAKE_CUDA_FLAGS_RELWITHDEBINFO "-O3 -g")
    set(CMAKE_CUDA_FLAGS_MINSIZEREL "-Os")

    if(MSVC OR WIN32)
      set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Xfatbin -compress-all")
      # Host-compiler options forwarded through nvcc's --compiler-options.
      set(CCBIN_FLAG "${CCBIN_FLAG} /wd4819 /wd4334 /wd4267 /wd4002 /wd4244 /wd4068")
      # Quoted: CMAKE_BUILD_TYPE is empty with multi-config generators, and an
      # unquoted empty expansion would make this if() malformed.
      if("${CMAKE_BUILD_TYPE}" STREQUAL "Debug")
        set(CCBIN_FLAG "${CCBIN_FLAG} -D_ITERATOR_DEBUG_LEVEL=2 -MTd")
      endif()
      set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --compiler-options \" ${CCBIN_FLAG} \" ")
    else()
      # Note: this replaces (does not extend) any pre-existing CMAKE_CUDA_FLAGS.
      set(CMAKE_CUDA_FLAGS "-Xcompiler -Wall,-Wextra -Xfatbin -compress-all")
    endif()

    if(NOT MGE_ENABLE_RTTI)
      set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Xcompiler -fno-rtti")
    endif()
    if(NOT MGE_ENABLE_EXCEPTIONS)
      # Host flag is spelled -fno-exceptions (plural).
      set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Xcompiler -fno-exceptions")
    endif()

    # Default -gencode list, chosen by CUDA version, unless the user supplied
    # MGE_CUDA_GENCODE. MEGDNN_THREADS_512 is 0 for the defaults and 1 for a
    # user-provided list.
    if(NOT MGE_CUDA_GENCODE)
      if("${MGE_ARCH}" STREQUAL "x86_64" OR "${MGE_ARCH}" STREQUAL "i386")
        set(MEGDNN_THREADS_512 0)
        if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.0.0")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_52,code=sm_52")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_60,code=sm_60")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_61,code=sm_61")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_70,code=sm_70")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_75,code=sm_75")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_75,code=compute_75")
        elseif(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "9.0.0")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_52,code=sm_52")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_60,code=sm_60")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_61,code=sm_61")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_70,code=sm_70")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_70,code=compute_70")
        else()
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_35,code=sm_35")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_52,code=sm_52")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_60,code=sm_60")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_61,code=sm_61")
          set(MGE_CUDA_GENCODE "${MGE_CUDA_GENCODE} -gencode arch=compute_61,code=compute_61")
        endif()
      else()
        message(FATAL_ERROR "Unsupported CUDA host arch.")
      endif()
    else()
      set(MEGDNN_THREADS_512 1)
    endif()
    set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} ${MGE_CUDA_GENCODE}")

    include(cmake/cudnn.cmake)
    if(MGE_WITH_TRT)
      include(cmake/tensorrt.cmake)
    endif()

    if(MGE_CUDA_USE_STATIC)
      # Static linking: cuDNN (and TensorRT) are wrapped in --whole-archive.
      if(MGE_WITH_TRT)
        if(MSVC OR WIN32)
          list(APPEND MGE_CUDA_LIBS ${TRT_LIBRARY} ${CUDNN_LIBRARY})
          message("-- windows TRT_LIBRARY: ${TRT_LIBRARY}")
          message("-- windows CUDNN_LIBRARY: ${CUDNN_LIBRARY}")
        else()
          list(APPEND MGE_CUDA_LIBS -Wl,--whole-archive libnvinfer libcudnn -Wl,--no-whole-archive)
        endif()
      else()
        list(APPEND MGE_CUDA_LIBS -Wl,--whole-archive libcudnn -Wl,--no-whole-archive)
      endif()

      if(MSVC OR WIN32)
        list(APPEND MGE_CUDA_LIBS cusolver.lib cublas.lib curand.lib cudart_static.lib cusparse.lib)
      else()
        list(APPEND MGE_CUDA_LIBS cusolver_static cublas_static curand_static culibos cudart_static cusparse_static)
      endif()

      # cublasLt is added from CUDA 10.1 onwards.
      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.1.0")
        if(MSVC OR WIN32)
          list(APPEND MGE_CUDA_LIBS cublasLt.lib)
        else()
          list(APPEND MGE_CUDA_LIBS cublasLt_static)
        endif()
      endif()

      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.0.0" AND NOT MSVC AND NOT WIN32)
        # mark all symbols from liblapack_static.a as weak to avoid
        # duplicated definition with mkl
        find_library(
          LAPACK_STATIC_PATH lapack_static
          HINTS ${CMAKE_CUDA_HOST_IMPLICIT_LINK_DIRECTORIES})
        if(NOT LAPACK_STATIC_PATH)
          message(FATAL_ERROR "liblapack_static.a not found")
        endif()
        set(LAPACK_STATIC_COPY_PATH ${CMAKE_CURRENT_BINARY_DIR}/liblapack_static_copy.a)

        # add a target that run objcopy
        add_custom_command(
          OUTPUT ${LAPACK_STATIC_COPY_PATH}
          COMMAND ${CMAKE_OBJCOPY} -w -W* ${LAPACK_STATIC_PATH} ${LAPACK_STATIC_COPY_PATH}
          VERBATIM)
        add_custom_target(lapack_static_weak_target DEPENDS ${LAPACK_STATIC_COPY_PATH})

        # create a library named "lapack_static_weak"
        add_library(lapack_static_weak STATIC IMPORTED GLOBAL)
        add_dependencies(lapack_static_weak lapack_static_weak_target)
        set_target_properties(
          lapack_static_weak PROPERTIES
          IMPORTED_LOCATION ${LAPACK_STATIC_COPY_PATH})
        list(APPEND MGE_CUDA_LIBS lapack_static_weak ${LAPACK_STATIC_COPY_PATH})
      endif()
    else()
      # Dynamic linking against the shared CUDA libraries.
      if(MGE_WITH_TRT)
        list(APPEND MGE_CUDA_LIBS libnvinfer)
      endif()
      list(APPEND MGE_CUDA_LIBS libcudnn)
      if(CMAKE_CUDA_COMPILER_VERSION VERSION_GREATER_EQUAL "10.1.0")
        list(APPEND MGE_CUDA_LIBS cublasLt cusolver cublas curand)
      endif()
    endif()

    # cuda-stub is a target built from dnn/cuda-stub.
    add_subdirectory(dnn/cuda-stub)
    if(MSVC OR WIN32)
      list(APPEND MGE_CUDA_LIBS nvrtc.lib cuda-stub)
    else()
      list(APPEND MGE_CUDA_LIBS nvrtc cuda-stub nvToolsExt)
    endif()
    set(MGE_CUDA_LIBS "${MGE_CUDA_LIBS}")
  endif()
  # Cambricon (MLU) support: headers and libraries come from $NEUWARE_HOME, and
  # the BANG architecture number is derived from MGE_MLU_ARCH.
  if(MGE_WITH_CAMBRICON)
    include_directories("$ENV{NEUWARE_HOME}/include")
    link_directories("$ENV{NEUWARE_HOME}/lib64")
    include(cmake/FindBANG/FindBANG.cmake)

    # Quoted so that an unset MGE_MLU_ARCH reports "Unsupported MLU arch."
    # instead of failing with a malformed if() expression.
    if("${MGE_MLU_ARCH}" STREQUAL "MLU100")
      set(BANG_ARCH "100")
    elseif("${MGE_MLU_ARCH}" STREQUAL "MLU1h8")
      set(BANG_ARCH "110")
    elseif("${MGE_MLU_ARCH}" STREQUAL "MLU220")
      set(BANG_ARCH "220")
    elseif("${MGE_MLU_ARCH}" STREQUAL "MLU270")
      set(BANG_ARCH "270")
    elseif("${MGE_MLU_ARCH}" STREQUAL "MLU290")
      set(BANG_ARCH "290")
    elseif("${MGE_MLU_ARCH}" STREQUAL "MLU200")
      set(BANG_ARCH "200")
    else()
      message (FATAL_ERROR "Unsupported MLU arch.")
    endif()

    set(BANG_CNCC_FLAGS "${BANG_CNCC_FLAGS} --bang-mlu-arch=${MGE_MLU_ARCH}")
    set(BANG_CNCC_FLAGS "${BANG_CNCC_FLAGS} -std=c++11 -Werror")
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -D__BANG_ARCH__=${BANG_ARCH}")

    # Optimization level for cncc follows the build type. Quoted because
    # CMAKE_BUILD_TYPE is empty with multi-config generators; in that case no
    # optimization flag is added.
    if("${CMAKE_BUILD_TYPE}" STREQUAL "Debug")
      set(BANG_CNCC_FLAGS "${BANG_CNCC_FLAGS} -g -O0")
    elseif("${CMAKE_BUILD_TYPE}" STREQUAL "Release")
      set(BANG_CNCC_FLAGS "${BANG_CNCC_FLAGS} -O3")
    elseif("${CMAKE_BUILD_TYPE}" STREQUAL "RelWithDebInfo")
      set(BANG_CNCC_FLAGS "${BANG_CNCC_FLAGS} -g -O3")
    elseif("${CMAKE_BUILD_TYPE}" STREQUAL "MinSizeRel")
      set(BANG_CNCC_FLAGS "${BANG_CNCC_FLAGS} -Os")
    endif()

    include(cmake/cnrt.cmake)
    include(cmake/cndev.cmake)
    include(cmake/cnml.cmake)
    list(APPEND MGE_CAMBRICON_LIBS libcnrt libcndev libcnml)
    set(MGE_CAMBRICON_LIBS "${MGE_CAMBRICON_LIBS}")
  endif()
  # ROCm back end.
  if(MGE_WITH_ROCM)
    include(cmake/rocm.cmake)
  endif()

  # Atlas back end: links libascendcl and mirrors the option into MGB_ATLAS.
  if(MGE_WITH_ATLAS)
    include(cmake/aclrt.cmake)
    list(APPEND MGE_ATLAS_LIBS libascendcl)
    set(MGE_ATLAS_LIBS "${MGE_ATLAS_LIBS}")
    set(MGB_ATLAS ${MGE_WITH_ATLAS})
  endif()
  # Route compilations through ccache whenever it is found.
  find_program(CCACHE_BIN ccache)
  if(CCACHE_BIN)
    set(CMAKE_CXX_COMPILER_LAUNCHER ${CCACHE_BIN})
    # The CUDA launcher is only set for CMake 3.10 or newer.
    if(MGE_WITH_CUDA AND ${CMAKE_VERSION} VERSION_GREATER_EQUAL "3.10.0")
      message("-- Using ccache as CMAKE_CUDA_COMPILER_LAUNCHER")
      set(CMAKE_CUDA_COMPILER_LAUNCHER ${CCACHE_BIN})
    endif()
  endif()
  # BLAS back end: only x86 targets pull in MKL or OpenBLAS.
  if(${MGE_ARCH} STREQUAL "x86_64" OR ${MGE_ARCH} STREQUAL "i386")
    if(${MGE_BLAS} STREQUAL "MKL")
      include(cmake/mkl.cmake)
      set(MGE_BLAS_LIBS libmkl)
    elseif(${MGE_BLAS} STREQUAL "OpenBLAS")
      include(cmake/OpenBLAS.cmake)
      set(MGE_BLAS_LIBS libopenblas)
    else()
      message(FATAL_ERROR "Unknown BLAS implementation ${MGE_BLAS}")
    endif()
  endif()

  # MKL-DNN is only built for x86_64.
  if(MGE_WITH_MKLDNN AND ${MGE_ARCH} STREQUAL "x86_64")
    include(cmake/MKL_DNN.cmake)
    set(MEGDNN_X86_WITH_MKL_DNN 1)
  endif()
  # The variables below mirror the MGE_* options under other names; presumably
  # they are substituted into megbrain_build_config.h by the configure_file()
  # call later in this file -- confirm against the .h.in template.

  # RTTI: symbol mangling is enabled exactly when RTTI is disabled.
  if(MGE_ENABLE_RTTI)
    set(MEGDNN_ENABLE_MANGLING 0)
    set(MEGDNN_ENABLE_RTTI 1)
  else()
    set(MEGDNN_ENABLE_MANGLING 1)
    set(MEGDNN_ENABLE_RTTI 0)
  endif()
  set(MGB_VERBOSE_TYPEINFO_NAME ${MGE_ENABLE_RTTI})

  # Logging (JSON support follows the logging switch).
  set(MGB_ENABLE_LOGGING ${MGE_ENABLE_LOGGING})
  set(MEGDNN_ENABLE_LOGGING ${MGE_ENABLE_LOGGING})
  set(MGB_ENABLE_JSON ${MGE_ENABLE_LOGGING})

  # Exceptions.
  if(NOT MGE_ENABLE_EXCEPTIONS)
    message(STATUS "Exceptions disabled; MegEngine would kill itself when it is supposed to throw an exception.")
  endif()
  set(MGB_ENABLE_EXCEPTION ${MGE_ENABLE_EXCEPTIONS})
  set(MEGDNN_ENABLE_EXCEPTIONS ${MGE_ENABLE_EXCEPTIONS})

  # JIT: Halide is pulled in as a static library when both switches are on.
  if(MGE_WITH_JIT AND MGE_WITH_HALIDE)
    set(HALIDE_SHARED_LIBRARY OFF CACHE BOOL "Build as a shared library")
    include(cmake/Halide.cmake)
  endif()
  set(MGB_JIT ${MGE_WITH_JIT})
  set(MGB_JIT_HALIDE ${MGE_WITH_HALIDE})
  # Thread support. On Apple and Windows the thread-related variables are set
  # by hand here.
  if(APPLE)
    set(CMAKE_THREAD_LIBS_INIT "-lpthread")
    set(CMAKE_HAVE_THREADS_LIBRARY 1)
    set(CMAKE_USE_WIN32_THREADS_INIT 0)
    set(CMAKE_USE_PTHREADS_INIT 1)
    set(THREADS_PREFER_PTHREAD_FLAG ON)
  endif()

  if(MSVC OR WIN32)
    set(CMAKE_HAVE_THREADS_LIBRARY 1)
    set(CMAKE_USE_WIN32_THREADS_INIT 1)
    set(CMAKE_USE_PTHREADS_INIT 1)
    set(THREADS_PREFER_PTHREAD_FLAG ON)
  endif()

  # Threads are considered available when either a thread library or Win32
  # threads were detected.
  if(CMAKE_THREAD_LIBS_INIT OR CMAKE_USE_WIN32_THREADS_INIT)
    set(MGB_HAVE_THREAD 1)
  endif()

  if(MGE_WITH_TEST)
    # use intra-op multi threads
    set(MEGDNN_ENABLE_MULTI_THREADS 1)
  endif()
  # Mirror the back-end options into the MGB_* / MEGDNN_* variables.

  # CUDA
  set(MGB_CUDA ${MGE_WITH_CUDA})
  set(MEGDNN_WITH_CUDA ${MGE_WITH_CUDA})

  # ROCM
  set(MGB_ROCM ${MGE_WITH_ROCM})
  set(MEGDNN_WITH_ROCM ${MGE_WITH_ROCM})

  # CAMBRICON
  set(MGB_CAMBRICON ${MGE_WITH_CAMBRICON})
  set(MEGDNN_WITH_CAMBRICON ${MGE_WITH_CAMBRICON})

  # Debug info: assertion locations and debug utilities are enabled for Debug
  # and RelWithDebInfo. The expansions are quoted because CMAKE_BUILD_TYPE is
  # empty with multi-config generators, which would otherwise make this if()
  # malformed; an empty build type selects the "off" branch.
  if("${CMAKE_BUILD_TYPE}" STREQUAL "Debug" OR "${CMAKE_BUILD_TYPE}" STREQUAL "RelWithDebInfo")
    set(MGB_ASSERT_LOC 1)
    set(MGB_ENABLE_DEBUG_UTIL 1)
  else()
    set(MGB_ASSERT_LOC 0)
    set(MGB_ENABLE_DEBUG_UTIL 0)
  endif()

  # TensorRT
  set(MGB_ENABLE_TENSOR_RT ${MGE_WITH_TRT})

  # Inference only: gradients are dropped and slim serving is enabled, unless
  # tests are being built.
  if(MGE_INFERENCE_ONLY AND NOT MGE_WITH_TEST)
    set(MGB_ENABLE_GRAD 0)
    set(MGB_BUILD_SLIM_SERVING 1)
  else()
    set(MGB_ENABLE_GRAD 1)
    set(MGB_BUILD_SLIM_SERVING 0)
  endif()

  # Distributed communication
  set(MGB_ENABLE_OPR_MM ${MGE_WITH_DISTRIBUTED})
  # MGE_ARCH related flags

  # x86 BLAS selection.
  if(MGE_ARCH STREQUAL "x86_64" OR MGE_ARCH STREQUAL "i386")
    if(MGE_BLAS STREQUAL "MKL")
      set(MEGDNN_X86_WITH_MKL 1)
    elseif(MGE_BLAS STREQUAL "OpenBLAS")
      set(MEGDNN_X86_WITH_OPENBLAS 1)
    endif()
  endif()

  # Enable Naive
  if(MGE_ARCH STREQUAL "naive")
    set(MEGDNN_NAIVE 1)
    message(WARNING "MEGDNN_NAIVE is enabled; MegDNN performance is degraded.")
  endif()

  # x86: pick the word size, then (for non-MSVC compilers) add the matching
  # -m32/-m64 switch followed by the SSE flags.
  if(MGE_ARCH STREQUAL "x86_64" OR MGE_ARCH STREQUAL "i386")
    set(MEGDNN_X86 1)
    if(MGE_ARCH STREQUAL "x86_64")
      set(MEGDNN_X86_64 1)
      set(MEGDNN_64_BIT 1)
      set(_mge_x86_word_flag "-m64")
    else()
      set(MEGDNN_X86_32 1)
      set(_mge_x86_word_flag "-m32")
    endif()
    if(NOT MSVC)
      set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${_mge_x86_word_flag} -msse4.2 -mfpmath=sse")
    endif()
  endif()

  # armv7
  if(MGE_ARCH STREQUAL "armv7")
    # -funsafe-math-optimizations enables NEON auto-vectorization; because NEON
    # is not fully IEEE 754 compatible, GCC does not turn it on by default.
    if(ANDROID)
      set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -mfloat-abi=softfp -mfpu=neon")
    endif()
    set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} -funsafe-math-optimizations")
    set(MARCH "-march=armv7-a")
    set(MEGDNN_ARMV7 1)
  endif()

  # aarch64: start from armv8-a and upgrade to armv8.2-a with the requested
  # feature suffixes.
  if(MGE_ARCH STREQUAL "aarch64")
    set(MEGDNN_AARCH64 1)
    set(MEGDNN_64_BIT 1)
    set(MARCH "-march=armv8-a")

    if(MGE_ARMV8_2_FEATURE_FP16)
      message("Enable fp16 feature support in armv8.2")
      if(NOT ${MGE_DISABLE_FLOAT16})
        set(MEGDNN_ENABLE_FP16_NEON 1)
      endif()
      set(MARCH "-march=armv8.2-a+fp16")
    endif()

    if(MGE_ARMV8_2_FEATURE_DOTPROD)
      message("Enable dotprod feature support in armv8.2")
      if(MGE_ARMV8_2_FEATURE_FP16)
        # MARCH already names armv8.2-a+fp16 here; extend it.
        set(MARCH "${MARCH}+dotprod")
      else()
        set(MARCH "-march=armv8.2-a+dotprod")
      endif()
    endif()
  endif()

  # MARCH is only set for the ARM architectures above; elsewhere this appends
  # just a space.
  set(CMAKE_CXX_FLAGS "${CMAKE_CXX_FLAGS} ${MARCH}")

  set(MGB_ENABLE_IMPERATIVE ${MGE_BUILD_IMPERATIVE_RT})
  # Write out megbrain_build_config.h
  # It defines macros needed by both megbrain and dnn
  configure_file(
    src/megbrain_build_config.h.in
    ${CMAKE_CURRENT_BINARY_DIR}/genfiles/megbrain_build_config.h)
  install(
    FILES ${CMAKE_CURRENT_BINARY_DIR}/genfiles/megbrain_build_config.h
    DESTINATION ${CMAKE_INSTALL_INCLUDEDIR})

  add_subdirectory(dnn)

  # Generate megbrain/opr/param_defs.h from the Python parameter definitions.
  list(APPEND MGB_OPR_PARAM_DEFS_SRCS
    ${CMAKE_CURRENT_SOURCE_DIR}/tools/param_defs/mgb_opr_param_defs.py)
  set(MGB_OPR_PARAM_DEFS_SCRIPT ${CMAKE_CURRENT_SOURCE_DIR}/dnn/scripts/gen_param_defs.py)
  set(MGB_OPR_PARAM_DEFS_OUT_DIR ${CMAKE_CURRENT_BINARY_DIR}/src/opr/include/)
  file(MAKE_DIRECTORY ${MGB_OPR_PARAM_DEFS_OUT_DIR}/megbrain/opr)

  # Full path of the generated header, shared by the rule and the lists below.
  set(_mgb_param_defs_header ${MGB_OPR_PARAM_DEFS_OUT_DIR}/megbrain/opr/param_defs.h)

  add_custom_command(
    OUTPUT ${_mgb_param_defs_header}
    COMMAND
      ${PYTHON_EXECUTABLE} ${MGB_OPR_PARAM_DEFS_SCRIPT} ${MGB_OPR_PARAM_DEFS_SRCS}
      ${_mgb_param_defs_header}
    DEPENDS ${MGB_OPR_PARAM_DEFS_SRCS} ${MGB_OPR_PARAM_DEFS_SCRIPT}
    VERBATIM
  )

  list(APPEND MGB_OPR_PARAM_DEFS_OUTS ${_mgb_param_defs_header})
  install(
    FILES ${MGB_OPR_PARAM_DEFS_OUTS}
    DESTINATION ${CMAKE_INSTALL_INCLUDEDIR}/megbrain/opr/)

  list(APPEND MGB_OPR_PARAM_DEFS_INC ${MGB_OPR_PARAM_DEFS_OUT_DIR})

  # _mgb_opr_param_defs drives the generation; the mgb_opr_param_defs interface
  # library carries the include path and depends on that custom target.
  add_custom_target(_mgb_opr_param_defs DEPENDS ${MGB_OPR_PARAM_DEFS_OUTS})
  add_library(mgb_opr_param_defs INTERFACE)
  target_include_directories(
    mgb_opr_param_defs
    INTERFACE
      $<INSTALL_INTERFACE:${CMAKE_INSTALL_INCLUDEDIR}>
      $<BUILD_INTERFACE:${MGB_OPR_PARAM_DEFS_INC}>
  )
  add_dependencies(mgb_opr_param_defs _mgb_opr_param_defs)
  install(TARGETS mgb_opr_param_defs EXPORT ${MGE_EXPORT_TARGETS})
  # Sub-projects, added in dependency order.

  # MegRay is only needed for distributed builds.
  if(MGE_WITH_DISTRIBUTED)
    add_subdirectory(${PROJECT_SOURCE_DIR}/third_party/MegRay)
  endif()

  add_subdirectory(src)

  if(MGE_BUILD_SDK)
    add_subdirectory(sdk/load-and-run)
  endif()

  # Exactly one Python wrapper is built: imperative or legacy.
  if(MGE_WITH_PYTHON_MODULE)
    if(NOT MGE_BUILD_IMPERATIVE_RT)
      add_subdirectory(python_module)
      message("-- Enable legacy python wrapper runtime")
    else()
      add_subdirectory(imperative)
      message("-- Enable imperative python wrapper runtime")
    endif()
  endif()

  # Tests are only added when RTTI is enabled as well.
  if(MGE_WITH_TEST AND MGE_ENABLE_RTTI)
    add_subdirectory(test)
  endif()
  # "develop" target: symlinks build products from the binary tree into the
  # source tree's Python package. Which package is served depends on which
  # Python wrapper target exists.
  if(TARGET mgb)
    set(_mge_dev_dir python_module/megengine/_internal)
    set(_mge_dev_links)
    foreach(_mge_dev_item
            $<TARGET_FILE_NAME:mgb>
            mgb.py
            opr.py
            opr_param_defs.py
            include)
      list(APPEND _mge_dev_links
        COMMAND ${CMAKE_COMMAND} -E create_symlink
          ${CMAKE_CURRENT_BINARY_DIR}/${_mge_dev_dir}/${_mge_dev_item}
          ${CMAKE_CURRENT_SOURCE_DIR}/${_mge_dev_dir}/${_mge_dev_item})
    endforeach()
    add_custom_target(
      develop
      ${_mge_dev_links}
      DEPENDS mgb
      VERBATIM
    )
  elseif(TARGET _imperative_rt)
    # NOTE(review): PACKAGE_NAME and MODULE_NAME are not set in this file;
    # presumably the imperative subdirectory provides them -- confirm.
    set(_mge_dev_dir imperative/python/${PACKAGE_NAME}/core)
    set(_mge_dev_links)
    foreach(_mge_dev_item
            $<TARGET_FILE_NAME:${MODULE_NAME}>
            ops/_internal/generated_ops.py
            ops/_internal/param_defs.py)
      list(APPEND _mge_dev_links
        COMMAND ${CMAKE_COMMAND} -E create_symlink
          ${CMAKE_CURRENT_BINARY_DIR}/${_mge_dev_dir}/${_mge_dev_item}
          ${CMAKE_CURRENT_SOURCE_DIR}/${_mge_dev_dir}/${_mge_dev_item})
    endforeach()
    add_custom_target(
      develop
      ${_mge_dev_links}
      DEPENDS _imperative_rt
      VERBATIM
    )
  endif()
  # Configure and install pkg-config.
  # Note that unlike the Config.cmake modules, this is not relocatable (and not
  # really portable) because we have two dependencies without pkg-config
  # descriptions: FlatBuffers and MKL-DNN
  if(MGE_USE_SYSTEM_MKLDNN)
    set(MGE_PKGCONFIG_LIBS_PRIVATE "-ldnnl")
  endif()
  if(MGE_USE_SYSTEM_OPENBLAS)
    set(MGE_PKGCONFIG_LIBS_PRIVATE "${MGE_PKGCONFIG_LIBS_PRIVATE} -lopenblas")
  endif()

  configure_file(
    cmake/megengine.pc.in
    ${CMAKE_CURRENT_BINARY_DIR}/megengine.pc
    @ONLY)
  install(
    FILES ${CMAKE_CURRENT_BINARY_DIR}/megengine.pc
    DESTINATION ${CMAKE_INSTALL_LIBDIR}/pkgconfig)

  # Do not export targets if MGE_WITH_DISTRIBUTED is on. MegRay is not ready.
  if(NOT MGE_WITH_DISTRIBUTED)
    include(CMakePackageConfigHelpers)
    set(MGE_INSTALL_CMAKEDIR ${CMAKE_INSTALL_LIBDIR}/cmake/MegEngine)

    # Generate MegEngineConfig.cmake and its version companion ...
    configure_package_config_file(
      cmake/MegEngineConfig.cmake.in
      ${CMAKE_CURRENT_BINARY_DIR}/MegEngineConfig.cmake
      INSTALL_DESTINATION ${MGE_INSTALL_CMAKEDIR}
    )
    write_basic_package_version_file(
      ${CMAKE_CURRENT_BINARY_DIR}/MegEngineConfigVersion.cmake
      VERSION ${MGB_VER_MAJOR}.${MGB_VER_MINOR}.${MGB_VER_PATCH}
      COMPATIBILITY SameMajorVersion)

    # ... and install them next to the exported target set.
    install(EXPORT ${MGE_EXPORT_TARGETS} DESTINATION ${MGE_INSTALL_CMAKEDIR})
    install(
      FILES
        ${CMAKE_CURRENT_BINARY_DIR}/MegEngineConfig.cmake
        ${CMAKE_CURRENT_BINARY_DIR}/MegEngineConfigVersion.cmake
      DESTINATION ${MGE_INSTALL_CMAKEDIR})
  endif()
  # Windows: select the static C runtime (/MT, /MTd) and rewrite any /MD found
  # in the standard flag variables to /MT.
  if(MSVC OR WIN32)
    add_compile_options(
      $<$<CONFIG:>:/MT>
      $<$<CONFIG:Debug>:/MTd>
      $<$<CONFIG:Release>:/MT>
    )

    foreach(_mge_flag_var
            CMAKE_C_FLAGS
            CMAKE_C_FLAGS_DEBUG
            CMAKE_C_FLAGS_RELEASE
            CMAKE_C_FLAGS_MINSIZEREL
            CMAKE_C_FLAGS_RELWITHDEBINFO
            CMAKE_CXX_FLAGS
            CMAKE_CXX_FLAGS_DEBUG
            CMAKE_CXX_FLAGS_RELEASE
            CMAKE_CXX_FLAGS_MINSIZEREL
            CMAKE_CXX_FLAGS_RELWITHDEBINFO)
      # ${_mge_flag_var} expands to the variable's *name*, which if() then
      # dereferences to test the flag string itself.
      if(${_mge_flag_var} MATCHES "/MD")
        string(REPLACE "/MD" "/MT" ${_mge_flag_var} "${${_mge_flag_var}}")
        # Written back to the cache (FORCE), overriding the stored value.
        set(${_mge_flag_var} "${${_mge_flag_var}}" CACHE STRING "msvc compiler flags" FORCE)
        message("MSVC flags: ${_mge_flag_var}:${${_mge_flag_var}}")
      endif()
    endforeach()
  endif()

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。 如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。 如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台