You cannot select more than 25 topics. Topics must start with a Chinese character, a letter, or a number, can include dashes ('-'), and can be up to 35 characters long.

build_wheel_common.sh 11 kB

123456789101112131415161718192021222324252627282930313233343536373839404142434445464748495051525354555657585960616263646566676869707172737475767778798081828384858687888990919293949596979899100101102103104105106107108109110111112113114115116117118119120121122123124125126127128129130131132133134135136137138139140141142143144145146147148149150151152153154155156157158159160161162163164165166167168169170171172173174175176177178179180181182183184185186187188189190191192193194195196197198199200201202203204205206207208209210211212213214215216217218219220221222223224225226227228229230231232233234235236237238239240241242243244245246247248249250251252253254255256257258259260261262263264265266267268269270271272273274275276277278279280281282283284285286287288289290291292293294295296297298299300301302303304305306307308309310311312
  #!/bin/bash
  # Common driver that validates the requested SDK and then launches the wheel
  # build inside the env_manylinux2014 docker image.
  #
  # Usage: <this script> -sdk <sdk_version>
  # Optional environment: IN_CI ("true" enables the CI-specific settings used
  # further down; defaults to "false").
  #
  # -e is enabled with `set` rather than on the shebang line so that it still
  # applies when the script is started as `bash <script>`; -x traces commands.
  set -ex

  # Directory containing this script (may be relative to the caller's cwd).
  CWD=$(dirname "$0")
  # Three levels above the script directory; bind-mounted at /home/code later.
  BASEDIR=$(readlink -f "${CWD}/../../..")
  # Host directory bind-mounted at /home/output later.
  OUTPUTDIR=$(readlink -f "${CWD}/output")
  # Numeric id of the invoking user, forwarded to the container as UID.
  USERID=$(id -u)
  # Extra `docker run` arguments; expanded unquoted on purpose where it is used.
  TMPFS_ARGS="--tmpfs /tmp:exec"
  # NOTE(review): not referenced anywhere else in the visible script - confirm
  # whether anything still depends on it before removing.
  local_path=$(dirname "$(readlink -f "$0")")
  # Library directories used to build CUDA_COPY_LIB_LIST. They match the
  # container-side mount points /opt/cudnn and /usr/local/cuda.
  CUDNN_LIB_DIR="/opt/cudnn/lib64/"
  CUDA_LIB_DIR="/usr/local/cuda/lib64/"
  # Placeholder until -sdk is parsed; it is not a valid SDK name.
  SDK_NAME="unknown"
  # Space-separated SDK names accepted per machine architecture.
  x86_64_support_version="cu101 cu111 cu112 cpu"
  aarch64_support_version="cu111 cpu"
  # Default IN_CI to "false" when it is unset or empty.
  IN_CI=${IN_CI:-false}
  #######################################
  # Print how to select an SDK and which SDK names each architecture accepts.
  # Globals:   x86_64_support_version (read), aarch64_support_version (read)
  # Arguments: none
  # Outputs:   three lines on stdout
  #######################################
  usage() {
    printf '%s\n' \
      "use -sdk sdk_version to specify sdk toolkit config!" \
      "now x86_64 sdk_version support ${x86_64_support_version}" \
      "now aarch64 sdk_version support ${aarch64_support_version}"
  }
  #######################################
  # Parse the command line. The only accepted option is `-sdk <name>`.
  # Parsing stops at the first empty argument (or when none are left).
  # Globals:   SDK_NAME (written)
  # Arguments: the script's positional parameters
  # Outputs:   usage text on stdout for an unknown option or a missing value
  # Returns:   exits the script with status 1 on a parse error
  #######################################
  parse_args() {
    while [[ "${1-}" != "" ]]; do
      case "$1" in
        -sdk)
          # Without this guard a trailing "-sdk" makes the second shift fail,
          # which aborts silently under `set -e` with no hint for the user.
          if [[ $# -lt 2 ]]; then
            echo "option -sdk requires a value"
            usage
            exit 1
          fi
          SDK_NAME=$2
          shift 2
          ;;
        *)
          usage
          exit 1
          ;;
      esac
    done
  }
  parse_args "$@"
  # Check that SDK_NAME is one of the SDKs supported on this architecture.
  # Reads SDK_NAME and the *_support_version lists; sets machine, all_sdk and
  # is_valid_sdk. Exits with status 1 on an unsupported architecture or SDK.
  is_valid_sdk="false"
  all_sdk=""
  machine=$(uname -m)
  case "${machine}" in
    x86_64) all_sdk=${x86_64_support_version} ;;
    aarch64) all_sdk=${aarch64_support_version} ;;
    *)
      echo "nonsupport env!!!"
      exit 1
      ;;
  esac

  # all_sdk is a space-separated list, so the unquoted expansion is intended.
  for i_sdk in ${all_sdk}; do
    # Quoted operands: an empty SDK_NAME must compare unequal, not break the test.
    if [[ "${i_sdk}" == "${SDK_NAME}" ]]; then
      is_valid_sdk="true"
      break
    fi
  done

  if [[ "${is_valid_sdk}" == "false" ]]; then
    echo "invalid sdk: ${SDK_NAME}"
    usage
    exit 1
  fi
  echo "Build with ${SDK_NAME}"
  # Translate SDK_NAME (and, for cu111, the machine architecture) into:
  #   CUDA_COPY_LIB_LIST   colon-separated shared libraries, forwarded to the container
  #   EXTRA_CMAKE_FLAG     extra cmake arguments, forwarded to the container
  #   REQUIR_*_VERSION     versions the host SDK headers are checked against
  #   BUILD_GCC8           "ON" for cu101
  #   BUILD_WHL_CPU_ONLY   "ON" for the cpu SDK, otherwise defaulted to "OFF"
  # Reads SDK_NAME, machine, IN_CI, CUDA_LIB_DIR and CUDNN_LIB_DIR.
  # Exits with status 1 for an unknown SDK or architecture.

  # cuBLAS 11 / cuDNN 8 libraries shared by cu111 and cu112; only the nvrtc
  # entry in front of them differs between the two.
  cuda11_shared_libs="${CUDA_LIB_DIR}/libcublasLt.so.11:${CUDA_LIB_DIR}/libcublas.so.11"
  for cudnn_part in adv_infer adv_train cnn_infer cnn_train ops_infer ops_train; do
    cuda11_shared_libs+=":${CUDNN_LIB_DIR}/libcudnn_${cudnn_part}.so.8"
  done
  cuda11_shared_libs+=":${CUDNN_LIB_DIR}/libcudnn.so.8"

  # cmake flags shared by cu111 and cu112. The leading and trailing blanks are
  # part of the original values and are kept.
  shared_sdk_flags=" -DMGE_WITH_CUDNN_SHARED=ON -DMGE_WITH_CUBLAS_SHARED=ON"
  all_arch_gencode="-gencode arch=compute_61,code=sm_61"
  for sm_arch in 70 75 80 86; do
    all_arch_gencode+=" -gencode arch=compute_${sm_arch},code=sm_${sm_arch}"
  done
  all_arch_gencode+=" -gencode arch=compute_86,code=compute_86"
  all_arch_cmake_flag="${shared_sdk_flags} -DMGE_CUDA_GENCODE=\"${all_arch_gencode}\" "

  case "${SDK_NAME}" in
    cu101)
      CUDA_COPY_LIB_LIST="${CUDA_LIB_DIR}/libnvrtc.so.10.1"
      EXTRA_CMAKE_FLAG=" -DMGE_WITH_CUDNN_SHARED=OFF -DMGE_WITH_CUBLAS_SHARED=OFF"
      BUILD_GCC8="ON"
      REQUIR_CUDA_VERSION="10010"
      REQUIR_CUDNN_VERSION="7.6.3"
      REQUIR_TENSORRT_VERSION="6.0.1.5"
      REQUIR_CUBLAS_VERSION="10.2.1.243"
      ;;
    cu111)
      # The required library versions differ per architecture.
      case "${machine}" in
        aarch64)
          REQUIR_CUDA_VERSION="11010"
          REQUIR_CUDNN_VERSION="8.0.5"
          REQUIR_TENSORRT_VERSION="7.2.1.6"
          REQUIR_CUBLAS_VERSION="11.3.0.106"
          ;;
        x86_64)
          REQUIR_CUDA_VERSION="11010"
          REQUIR_CUDNN_VERSION="8.0.4"
          REQUIR_TENSORRT_VERSION="7.2.2.3"
          REQUIR_CUBLAS_VERSION="11.2.1.74"
          ;;
        *)
          echo "no support machine: ${machine}"
          exit 1
          ;;
      esac
      CUDA_COPY_LIB_LIST="${CUDA_LIB_DIR}/libnvrtc.so.11.1:${cuda11_shared_libs}"
      # CI builds on aarch64 compile for sm_75 only; everything else gets the
      # full architecture list.
      if [[ "${IN_CI}" == "true" && "${machine}" == "aarch64" ]]; then
        EXTRA_CMAKE_FLAG="${shared_sdk_flags} -DMGE_CUDA_GENCODE=\"-gencode arch=compute_75,code=sm_75\" "
      else
        EXTRA_CMAKE_FLAG="${all_arch_cmake_flag}"
      fi
      ;;
    cu112)
      CUDA_COPY_LIB_LIST="${CUDA_LIB_DIR}/libnvrtc.so.11.2:${cuda11_shared_libs}"
      EXTRA_CMAKE_FLAG="${all_arch_cmake_flag}"
      REQUIR_CUDA_VERSION="11020"
      REQUIR_CUDNN_VERSION="8.0.4"
      REQUIR_TENSORRT_VERSION="7.2.2.3"
      REQUIR_CUBLAS_VERSION="11.3.1.68"
      ;;
    cpu)
      echo "use $SDK_NAME without cuda support"
      BUILD_WHL_CPU_ONLY="ON"
      ;;
    *)
      echo "no support sdk ${SDK_NAME}"
      usage
      exit 1
      ;;
  esac

  # Anything that is not the cpu SDK builds with CUDA support.
  BUILD_WHL_CPU_ONLY=${BUILD_WHL_CPU_ONLY:-OFF}
  # Run third_party/prepare.sh from inside its own directory, then switch to
  # the script directory and make sure the output directory exists.
  # Paths are quoted so a checkout located under a path with spaces still works.
  echo "${BASEDIR}"
  pushd "${BASEDIR}/third_party" >/dev/null
  ./prepare.sh
  popd >/dev/null
  cd "${CWD}"
  mkdir -p "${OUTPUTDIR}"
  #######################################
  # Read text on stdin and print the number that follows the LAST occurrence
  # of "<marker><whitespace><digits>". Prints an empty line when nothing
  # matches, so the caller can report a version mismatch instead of dying
  # silently under `set -e`.
  # The last match is used on purpose: a header may contain more than one
  # define of the same macro (e.g. inside #if/#else), and the previous
  # "take the trailing characters" logic effectively selected the last one.
  # Arguments: $1 - extended-regex fragment that precedes the number
  # Outputs:   the number (all of its digits) on stdout
  #######################################
  extract_version_number() {
    local marker=$1
    local matched
    matched=$(grep -Eo "${marker}[[:space:]]+[0-9]+" | tail -n 1) || true
    # Drop everything up to and including the last blank; digits remain.
    printf '%s\n' "${matched##*[[:space:]]}"
  }

  # For CUDA builds, make sure the host SDK roots are configured and that the
  # versions recorded in their headers equal the REQUIR_*_VERSION values.
  # Reads CUDA_ROOT_DIR, CUDNN_ROOT_DIR, TENSORRT_ROOT_DIR (or TRT_ROOT_DIR as a
  # fallback) and exits with status 1 on the first problem found.
  if [[ "${BUILD_WHL_CPU_ONLY}" == "OFF" ]]; then
    if [[ -z "${CUDA_ROOT_DIR}" ]]; then
      echo "Environment variable CUDA_ROOT_DIR not set."
      exit 1
    fi
    if [[ -z "${CUDNN_ROOT_DIR}" ]]; then
      echo "Environment variable CUDNN_ROOT_DIR not set."
      exit 1
    fi
    if [[ -z "${TENSORRT_ROOT_DIR}" ]]; then
      echo "Environment variable TENSORRT_ROOT_DIR not set."
      if [[ -z "${TRT_ROOT_DIR}" ]]; then
        echo "Environment variable TRT_ROOT_DIR not set."
        exit 1
      fi
      echo "put ${TRT_ROOT_DIR} to TENSORRT_ROOT_DIR env"
      TENSORRT_ROOT_DIR=${TRT_ROOT_DIR}
    fi

    ## YOU SHOULD MODIFY CUDA VERSION AS BELOW WHEN UPGRADE
    # Strip one trailing slash so the joined paths stay tidy.
    CUDA_ROOT_DIR_=${CUDA_ROOT_DIR%/}
    CUDNN_ROOT_DIR_=${CUDNN_ROOT_DIR%/}
    TENSORRT_ROOT_DIR_=${TENSORRT_ROOT_DIR%/}

    CUBLAS_VERSION_PATH=${CUDA_ROOT_DIR_}/include/cublas_api.h
    CUDA_VERSION_PATH=${CUDA_ROOT_DIR_}/include/cuda.h
    # For CUDA >= 11 the cuDNN version is read from cudnn_version.h and the
    # CUDA version from the CUDA_VERSION macro; older SDKs use cudnn.h and
    # __CUDA_API_VERSION.
    if [[ "${REQUIR_CUDA_VERSION}" -ge 11000 ]]; then
      CUDNN_VERSION_PATH=${CUDNN_ROOT_DIR_}/include/cudnn_version.h
      cuda_version_macro="define CUDA_VERSION"
    else
      CUDNN_VERSION_PATH=${CUDNN_ROOT_DIR_}/include/cudnn.h
      cuda_version_macro="define __CUDA_API_VERSION"
    fi
    TENSORRT_VERSION_PATH=${TENSORRT_ROOT_DIR_}/include/NvInferVersion.h

    if [[ ! -e "${CUDA_VERSION_PATH}" ]]; then
      echo "file ${CUDA_VERSION_PATH} is not exist"
      echo "please check the Environment must use CUDA-${REQUIR_CUDA_VERSION}"
      exit 1
    fi
    if [[ ! -e "${CUDNN_VERSION_PATH}" ]]; then
      echo "file ${CUDNN_VERSION_PATH} is not exist"
      echo "please check the Environment must use CUDNN-V${REQUIR_CUDNN_VERSION}"
      exit 1
    fi
    if [[ ! -e "${TENSORRT_VERSION_PATH}" ]]; then
      echo "file ${TENSORRT_VERSION_PATH} is not exist"
      echo "please check the Environment must use TensorRT-${REQUIR_TENSORRT_VERSION}"
      exit 1
    fi
    if [[ ! -e "${CUBLAS_VERSION_PATH}" ]]; then
      echo "file ${CUBLAS_VERSION_PATH} is not exist"
      exit 1
    fi

    # Only a fixed window of each header is scanned: the first 300 lines of
    # cuda.h, the first 62 of the cuDNN header, the last 12 of NvInferVersion.h
    # and the first 150 of cublas_api.h. The headers are streamed straight into
    # the extractor so that comment markers such as "/*" are never subject to
    # pathname expansion.
    CUDA_VERSION=$(head -n 300 "${CUDA_VERSION_PATH}" \
      | extract_version_number "${cuda_version_macro}")
    echo "CUDA_VERSION:${CUDA_VERSION}"

    CUDNN_VERSION_MAJOR=$(head -n 62 "${CUDNN_VERSION_PATH}" \
      | extract_version_number "define CUDNN_MAJOR")
    CUDNN_VERSION_MINOR=$(head -n 62 "${CUDNN_VERSION_PATH}" \
      | extract_version_number "define CUDNN_MINOR")
    CUDNN_VERSION_PATCH=$(head -n 62 "${CUDNN_VERSION_PATH}" \
      | extract_version_number "define CUDNN_PATCHLEVEL")
    CUDNN_VERSION="${CUDNN_VERSION_MAJOR}.${CUDNN_VERSION_MINOR}.${CUDNN_VERSION_PATCH}"
    echo "CUDNN_VERSION:${CUDNN_VERSION}"

    TENSORRT_VERSION_MAJOR=$(tail -n 12 "${TENSORRT_VERSION_PATH}" \
      | extract_version_number "NV_TENSORRT_MAJOR")
    TENSORRT_VERSION_MINOR=$(tail -n 12 "${TENSORRT_VERSION_PATH}" \
      | extract_version_number "NV_TENSORRT_MINOR")
    TENSORRT_VERSION_PATCH=$(tail -n 12 "${TENSORRT_VERSION_PATH}" \
      | extract_version_number "NV_TENSORRT_PATCH")
    TENSORRT_VERSION_BUILD=$(tail -n 12 "${TENSORRT_VERSION_PATH}" \
      | extract_version_number "NV_TENSORRT_BUILD")
    TENSORRT_VERSION="${TENSORRT_VERSION_MAJOR}.${TENSORRT_VERSION_MINOR}.${TENSORRT_VERSION_PATCH}.${TENSORRT_VERSION_BUILD}"
    echo "TENSORRT_VERSION:${TENSORRT_VERSION}"

    CUBLAS_VERSION_MAJOR=$(head -n 150 "${CUBLAS_VERSION_PATH}" \
      | extract_version_number "define CUBLAS_VER_MAJOR")
    CUBLAS_VERSION_MINOR=$(head -n 150 "${CUBLAS_VERSION_PATH}" \
      | extract_version_number "define CUBLAS_VER_MINOR")
    CUBLAS_VERSION_PATCH=$(head -n 150 "${CUBLAS_VERSION_PATH}" \
      | extract_version_number "define CUBLAS_VER_PATCH")
    CUBLAS_VERSION_BUILD=$(head -n 150 "${CUBLAS_VERSION_PATH}" \
      | extract_version_number "define CUBLAS_VER_BUILD")
    CUBLAS_VERSION="${CUBLAS_VERSION_MAJOR}.${CUBLAS_VERSION_MINOR}.${CUBLAS_VERSION_PATCH}.${CUBLAS_VERSION_BUILD}"
    echo "CUBLAS_VERSION:${CUBLAS_VERSION}"

    # Quoted comparisons: an empty (undetected) version is reported as a
    # mismatch rather than producing a test syntax error.
    if [[ "${CUDA_VERSION}" != "${REQUIR_CUDA_VERSION}" ]]; then
      echo "please check the Environment must use CUDA NO.${REQUIR_CUDA_VERSION}"
      exit 1
    fi
    if [[ "${CUDNN_VERSION}" != "${REQUIR_CUDNN_VERSION}" ]]; then
      echo "please check the Environment must use CUDNN-V${REQUIR_CUDNN_VERSION}"
      exit 1
    fi
    if [[ "${TENSORRT_VERSION}" != "${REQUIR_TENSORRT_VERSION}" ]]; then
      echo "please check the Environment must use TENSORRT-${REQUIR_TENSORRT_VERSION}"
      exit 1
    fi
    if [[ "${CUBLAS_VERSION}" != "${REQUIR_CUBLAS_VERSION}" ]]; then
      echo "please check the Environment must use CUBLAS-${REQUIR_CUBLAS_VERSION}"
      exit 1
    fi
  fi
  # Choose the command executed inside the container: the build script is
  # wrapped in `scl enable devtoolset-8` when gcc8 is requested or forced.
  # Reads BUILD_GCC8 and machine; sets BUILD_GCC8 and run_cmd.
  BUILD_GCC8=${BUILD_GCC8:-OFF}

  if [[ "${machine}" == "aarch64" ]]; then
    # manylinux on aarch64 gcc9 is: (GCC) 9.3.1 20200408 (Red Hat 9.3.1-2)
    # which version has issue: 'as' take a long long long time for some dnn kernel!
    # infact ubuntu gcc version: gcc (Ubuntu 9.3.0-17ubuntu1~20.04) 9.3.0 is OK
    echo "force use gcc8 on aarch64 linux"
    BUILD_GCC8="ON"
  fi

  # Container-side path of the build script (BASEDIR is mounted at /home/code).
  build_script="/home/code/scripts/whl/manylinux2014/do_build_common.sh"
  if [[ "${BUILD_GCC8}" == "ON" ]]; then
    run_cmd="scl enable devtoolset-8 ${build_script}"
  else
    run_cmd="${build_script}"
  fi
  # Launch the build inside the env_manylinux2014 container.
  # Reads the configuration computed above (EXTRA_CMAKE_FLAG,
  # CUDA_COPY_LIB_LIST, SDK_NAME, BUILD_WHL_CPU_ONLY, run_cmd, ...) plus the
  # optional environment variables PUBLIC_VERSION_POSTFIX, LOCAL_VERSION,
  # STRIP_SDK_INFO, ALL_PYTHON and CI_SERVER_NAME.

  # Command tracing is switched off from here on.
  set +x

  # Interactive with a TTY by default; under GitLab only stdin is kept open
  # (presumably because those jobs run without a TTY - confirm).
  docker_args="-it"
  CI_SERVER_NAME=${CI_SERVER_NAME:-null}
  if [[ "${CI_SERVER_NAME}" == "GitLab" ]]; then
    docker_args="-i"
  fi

  # CI builds additionally enable the test targets.
  if [[ "${IN_CI}" == "true" ]]; then
    EXTRA_CMAKE_FLAG=" ${EXTRA_CMAKE_FLAG} -DMGE_WITH_TEST=ON"
  fi

  # The command line is assembled as an array so that every value reaches
  # docker as exactly one argument, even when it is empty or contains blanks.
  docker_cmd=(docker run --rm "${docker_args}")
  # TMPFS_ARGS holds several space-separated arguments; splitting is intended.
  # shellcheck disable=SC2206
  docker_cmd+=(${TMPFS_ARGS})
  docker_cmd+=(
    -e "UID=${USERID}"
    -e "PUBLIC_VERSION_POSTFIX=${PUBLIC_VERSION_POSTFIX}"
    -e "LOCAL_VERSION=${LOCAL_VERSION}"
    -e "STRIP_SDK_INFO=${STRIP_SDK_INFO}"
    -e "BUILD_WHL_CPU_ONLY=${BUILD_WHL_CPU_ONLY}"
    -e "ALL_PYTHON=${ALL_PYTHON}"
    -e "EXTRA_CMAKE_FLAG=${EXTRA_CMAKE_FLAG}"
    -e "CUDA_COPY_LIB_LIST=${CUDA_COPY_LIB_LIST}"
    -e "SDK_NAME=${SDK_NAME}"
    -e "CUDA_ROOT_DIR=/usr/local/cuda"
    -e "CUDNN_ROOT_DIR=/opt/cudnn"
    -e "TRT_ROOT_DIR=/opt/tensorrt"
  )

  # Mount the host SDK roots at the fixed container locations. A root that is
  # unset (for example in a cpu-only build) is skipped, because a volume spec
  # with an empty host path such as ":/usr/local/cuda" is not valid.
  for mount_spec in \
    "${CUDA_ROOT_DIR}:/usr/local/cuda" \
    "${CUDNN_ROOT_DIR}:/opt/cudnn" \
    "${TENSORRT_ROOT_DIR}:/opt/tensorrt"; do
    if [[ "${mount_spec}" != :* ]]; then
      docker_cmd+=(-v "${mount_spec}")
    fi
  done

  docker_cmd+=(
    -v "${BASEDIR}:/home/code"
    -v "${OUTPUTDIR}:/home/output:rw"
  )

  "${docker_cmd[@]}" env_manylinux2014:latest /bin/bash -c "$run_cmd"

MegEngine 安装包中集成了使用 GPU 运行代码所需的 CUDA 环境,不用区分 CPU 和 GPU 版。如果想要运行 GPU 程序,请确保机器本身配有 GPU 硬件设备并安装好驱动。如果你想体验在云端 GPU 算力平台进行深度学习开发的感觉,欢迎访问 MegStudio 平台。