GitOrigin-RevId: 9e7d7d4167
tags/v1.0.0-rc1
@@ -297,7 +297,7 @@ if(MGE_WITH_CUDA) | |||||
if(MSVC OR WIN32) | if(MSVC OR WIN32) | ||||
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Xfatbin -compress-all") | set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Xfatbin -compress-all") | ||||
set(CCBIN_FLAG "${CCBIN_FLAG} /wd4819 /wd4334 /wd4267 /wd4002 /wd4244 /wd4068") | set(CCBIN_FLAG "${CCBIN_FLAG} /wd4819 /wd4334 /wd4267 /wd4002 /wd4244 /wd4068") | ||||
if(${CMAKE_BUILD_TYPE} STREQUAL "Debug" OR ${CMAKE_BUILD_TYPE} STREQUAL "RelWithDebInfo") | |||||
if(${CMAKE_BUILD_TYPE} STREQUAL "Debug") | |||||
set(CCBIN_FLAG "${CCBIN_FLAG} -D_ITERATOR_DEBUG_LEVEL=2 -MTd") | set(CCBIN_FLAG "${CCBIN_FLAG} -D_ITERATOR_DEBUG_LEVEL=2 -MTd") | ||||
endif() | endif() | ||||
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --compiler-options \" ${CCBIN_FLAG} \" ") | set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --compiler-options \" ${CCBIN_FLAG} \" ") | ||||
@@ -680,6 +680,7 @@ if(TARGET mgb) | |||||
COMMAND ${CMAKE_COMMAND} -E create_symlink | COMMAND ${CMAKE_COMMAND} -E create_symlink | ||||
${CMAKE_CURRENT_BINARY_DIR}/python_module/megengine/_internal/include | ${CMAKE_CURRENT_BINARY_DIR}/python_module/megengine/_internal/include | ||||
${CMAKE_CURRENT_SOURCE_DIR}/python_module/megengine/_internal/include | ${CMAKE_CURRENT_SOURCE_DIR}/python_module/megengine/_internal/include | ||||
DEPENDS mgb | DEPENDS mgb | ||||
VERBATIM | VERBATIM | ||||
) | ) | ||||
@@ -17,6 +17,68 @@ import collections | |||||
import json | import json | ||||
import os | import os | ||||
import sys | import sys | ||||
import platform | |||||
import ctypes | |||||
if sys.platform == "win32": | |||||
lib_path = os.path.join(os.path.dirname(__file__), "lib") | |||||
Lib_path = os.path.join(os.path.dirname(__file__), "Lib") | |||||
dll_paths = list(filter(os.path.exists, [lib_path, Lib_path])) | |||||
assert len(dll_paths) > 0 | |||||
kernel32 = ctypes.WinDLL("kernel32.dll", use_last_error=True) | |||||
has_load_library_attr = hasattr(kernel32, "AddDllDirectory") | |||||
old_error_mode = kernel32.SetErrorMode(0x0001) | |||||
kernel32.LoadLibraryW.restype = ctypes.c_void_p | |||||
if has_load_library_attr: | |||||
kernel32.AddDllDirectory.restype = ctypes.c_void_p | |||||
kernel32.LoadLibraryExW.restype = ctypes.c_void_p | |||||
for dll_path in dll_paths: | |||||
if sys.version_info >= (3, 8): | |||||
os.add_dll_directory(dll_path) | |||||
elif has_load_library_attr: | |||||
res = kernel32.AddDllDirectory(dll_path) | |||||
if res is None: | |||||
err = ctypes.WinError(ctypes.get_last_error()) | |||||
err.strerror += ' Error adding "{}" to the DLL search PATH.'.format( | |||||
dll_path | |||||
) | |||||
raise err | |||||
else: | |||||
print("WARN: python or OS env have some issue, may load DLL failed!!!") | |||||
import glob | |||||
dlls = glob.glob(os.path.join(lib_path, "*.dll")) | |||||
path_patched = False | |||||
for dll in dlls: | |||||
is_loaded = False | |||||
if has_load_library_attr: | |||||
res = kernel32.LoadLibraryExW(dll, None, 0x00001100) | |||||
last_error = ctypes.get_last_error() | |||||
if res is None and last_error != 126: | |||||
err = ctypes.WinError(last_error) | |||||
err.strerror += ' Error loading "{}" or one of its dependencies.'.format( | |||||
dll | |||||
) | |||||
raise err | |||||
elif res is not None: | |||||
is_loaded = True | |||||
if not is_loaded: | |||||
if not path_patched: | |||||
os.environ["PATH"] = ";".join(dll_paths + [os.environ["PATH"]]) | |||||
path_patched = True | |||||
res = kernel32.LoadLibraryW(dll) | |||||
if res is None: | |||||
err = ctypes.WinError(ctypes.get_last_error()) | |||||
err.strerror += ' Error loading "{}" or one of its dependencies.'.format( | |||||
dll | |||||
) | |||||
raise err | |||||
kernel32.SetErrorMode(old_error_mode) | |||||
import numpy as np | import numpy as np | ||||
@@ -99,3 +99,8 @@ | |||||
``` | ``` | ||||
ALL_PYTHON=3.5.4 ./scripts/whl/windows/windows_build_whl.sh | ALL_PYTHON=3.5.4 ./scripts/whl/windows/windows_build_whl.sh | ||||
``` | ``` | ||||
If you want to build windows whl with cuda, also a specific Python verison. eg: | |||||
``` | |||||
WINDOWS_WHL_WITH_CUDA="true" ALL_PYTHON=3.5.4 ./scripts/whl/windows/windows_build_whl.sh | |||||
``` |
@@ -60,6 +60,40 @@ function config_python_env() { | |||||
PYTHON_INCLUDE_DIR=${PYTHON_DIR}/include | PYTHON_INCLUDE_DIR=${PYTHON_DIR}/include | ||||
} | } | ||||
if [[ -z ${WINDOWS_WHL_WITH_CUDA} ]] | |||||
then | |||||
WINDOWS_WHL_WITH_CUDA="false" | |||||
fi | |||||
# config NVIDIA libs | |||||
TRT_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/TensorRT-6.0.1.5/lib/nvinfer.dll" | |||||
CUDNN_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/cudnn-10.1-windows10-x64-v7.6.5.32/cuda/bin/cudnn64_7.dll" | |||||
CUSOLVER_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cusolver64_10.dll" | |||||
CUBLAS_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cublas64_10.dll" | |||||
CURAND_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/curand64_10.dll" | |||||
CUBLASLT_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cublasLt64_10.dll" | |||||
CUDART_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cudart64_101.dll" | |||||
function copy_more_dll() { | |||||
# for python whl real use | |||||
CP_DST=${BUILD_DIR}/staging/megengine/_internal/lib | |||||
rm -rf ${CP_DST} | |||||
mkdir ${CP_DST} | |||||
if [ ${WINDOWS_WHL_WITH_CUDA} = "true" ]; then | |||||
echo "copy nvidia lib to whl use...." | |||||
cp "${TRT_LIB}" ${CP_DST} | |||||
cp "${CUDNN_LIB}" ${CP_DST} | |||||
cp "${CUSOLVER_LIB}" ${CP_DST} | |||||
cp "${CUBLAS_LIB}" ${CP_DST} | |||||
cp "${CURAND_LIB}" ${CP_DST} | |||||
cp "${CUBLASLT_LIB}" ${CP_DST} | |||||
cp "${CUDART_LIB}" ${CP_DST} | |||||
fi | |||||
} | |||||
function do_build() { | function do_build() { | ||||
for ver in ${ALL_PYTHON} | for ver in ${ALL_PYTHON} | ||||
do | do | ||||
@@ -91,7 +125,13 @@ function do_build() { | |||||
#change PYTHON_LIBRARY and PYTHON_INCLUDE_DIR, so add | #change PYTHON_LIBRARY and PYTHON_INCLUDE_DIR, so add | ||||
#-r to remove build cache after a new ver build, which | #-r to remove build cache after a new ver build, which | ||||
#will be more slow build than without -r | #will be more slow build than without -r | ||||
${SRC_DIR}/scripts/cmake-build/host_build.sh -t -r | |||||
if [ ${WINDOWS_WHL_WITH_CUDA} = "true" ]; then | |||||
echo "build windows whl with cuda" | |||||
${SRC_DIR}/scripts/cmake-build/host_build.sh -t -r -c | |||||
else | |||||
echo "build windows whl with cpu only" | |||||
${SRC_DIR}/scripts/cmake-build/host_build.sh -t -r | |||||
fi | |||||
#call setup.py | #call setup.py | ||||
BUILD_DIR=${SRC_DIR}/build_dir/host/build/ | BUILD_DIR=${SRC_DIR}/build_dir/host/build/ | ||||
@@ -107,6 +147,7 @@ function do_build() { | |||||
cp -a python_module/{megengine,setup.py,requires.txt,requires-style.txt,requires-test.txt} staging/ | cp -a python_module/{megengine,setup.py,requires.txt,requires-style.txt,requires-test.txt} staging/ | ||||
cd ${BUILD_DIR}/staging/megengine/_internal | cd ${BUILD_DIR}/staging/megengine/_internal | ||||
llvm-strip -s _mgb.pyd | llvm-strip -s _mgb.pyd | ||||
copy_more_dll | |||||
cd ${BUILD_DIR}/staging | cd ${BUILD_DIR}/staging | ||||
${PYTHON_DIR}/python3 setup.py bdist_wheel | ${PYTHON_DIR}/python3 setup.py bdist_wheel | ||||
cp ${BUILD_DIR}/staging/dist/Meg*.whl ${WINDOWS_WHL_HOME}/ | cp ${BUILD_DIR}/staging/dist/Meg*.whl ${WINDOWS_WHL_HOME}/ | ||||