GitOrigin-RevId: 9e7d7d4167
tags/v1.0.0-rc1
@@ -297,7 +297,7 @@ if(MGE_WITH_CUDA) | |||
if(MSVC OR WIN32) | |||
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} -Xfatbin -compress-all") | |||
set(CCBIN_FLAG "${CCBIN_FLAG} /wd4819 /wd4334 /wd4267 /wd4002 /wd4244 /wd4068") | |||
if(${CMAKE_BUILD_TYPE} STREQUAL "Debug" OR ${CMAKE_BUILD_TYPE} STREQUAL "RelWithDebInfo") | |||
if(${CMAKE_BUILD_TYPE} STREQUAL "Debug") | |||
set(CCBIN_FLAG "${CCBIN_FLAG} -D_ITERATOR_DEBUG_LEVEL=2 -MTd") | |||
endif() | |||
set(CMAKE_CUDA_FLAGS "${CMAKE_CUDA_FLAGS} --compiler-options \" ${CCBIN_FLAG} \" ") | |||
@@ -680,6 +680,7 @@ if(TARGET mgb) | |||
COMMAND ${CMAKE_COMMAND} -E create_symlink | |||
${CMAKE_CURRENT_BINARY_DIR}/python_module/megengine/_internal/include | |||
${CMAKE_CURRENT_SOURCE_DIR}/python_module/megengine/_internal/include | |||
DEPENDS mgb | |||
VERBATIM | |||
) | |||
@@ -17,6 +17,68 @@ import collections | |||
import json | |||
import os | |||
import sys | |||
import platform | |||
import ctypes | |||
if sys.platform == "win32": | |||
lib_path = os.path.join(os.path.dirname(__file__), "lib") | |||
Lib_path = os.path.join(os.path.dirname(__file__), "Lib") | |||
dll_paths = list(filter(os.path.exists, [lib_path, Lib_path])) | |||
assert len(dll_paths) > 0 | |||
kernel32 = ctypes.WinDLL("kernel32.dll", use_last_error=True) | |||
has_load_library_attr = hasattr(kernel32, "AddDllDirectory") | |||
old_error_mode = kernel32.SetErrorMode(0x0001) | |||
kernel32.LoadLibraryW.restype = ctypes.c_void_p | |||
if has_load_library_attr: | |||
kernel32.AddDllDirectory.restype = ctypes.c_void_p | |||
kernel32.LoadLibraryExW.restype = ctypes.c_void_p | |||
for dll_path in dll_paths: | |||
if sys.version_info >= (3, 8): | |||
os.add_dll_directory(dll_path) | |||
elif has_load_library_attr: | |||
res = kernel32.AddDllDirectory(dll_path) | |||
if res is None: | |||
err = ctypes.WinError(ctypes.get_last_error()) | |||
err.strerror += ' Error adding "{}" to the DLL search PATH.'.format( | |||
dll_path | |||
) | |||
raise err | |||
else: | |||
print("WARN: python or OS env have some issue, may load DLL failed!!!") | |||
import glob | |||
dlls = glob.glob(os.path.join(lib_path, "*.dll")) | |||
path_patched = False | |||
for dll in dlls: | |||
is_loaded = False | |||
if has_load_library_attr: | |||
res = kernel32.LoadLibraryExW(dll, None, 0x00001100) | |||
last_error = ctypes.get_last_error() | |||
if res is None and last_error != 126: | |||
err = ctypes.WinError(last_error) | |||
err.strerror += ' Error loading "{}" or one of its dependencies.'.format( | |||
dll | |||
) | |||
raise err | |||
elif res is not None: | |||
is_loaded = True | |||
if not is_loaded: | |||
if not path_patched: | |||
os.environ["PATH"] = ";".join(dll_paths + [os.environ["PATH"]]) | |||
path_patched = True | |||
res = kernel32.LoadLibraryW(dll) | |||
if res is None: | |||
err = ctypes.WinError(ctypes.get_last_error()) | |||
err.strerror += ' Error loading "{}" or one of its dependencies.'.format( | |||
dll | |||
) | |||
raise err | |||
kernel32.SetErrorMode(old_error_mode) | |||
import numpy as np | |||
@@ -99,3 +99,8 @@ | |||
``` | |||
ALL_PYTHON=3.5.4 ./scripts/whl/windows/windows_build_whl.sh | |||
``` | |||
If you want to build windows whl with cuda, also a specific Python verison. eg: | |||
``` | |||
WINDOWS_WHL_WITH_CUDA="true" ALL_PYTHON=3.5.4 ./scripts/whl/windows/windows_build_whl.sh | |||
``` |
@@ -60,6 +60,40 @@ function config_python_env() { | |||
PYTHON_INCLUDE_DIR=${PYTHON_DIR}/include | |||
} | |||
if [[ -z ${WINDOWS_WHL_WITH_CUDA} ]] | |||
then | |||
WINDOWS_WHL_WITH_CUDA="false" | |||
fi | |||
# config NVIDIA libs | |||
TRT_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/TensorRT-6.0.1.5/lib/nvinfer.dll" | |||
CUDNN_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/cudnn-10.1-windows10-x64-v7.6.5.32/cuda/bin/cudnn64_7.dll" | |||
CUSOLVER_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cusolver64_10.dll" | |||
CUBLAS_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cublas64_10.dll" | |||
CURAND_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/curand64_10.dll" | |||
CUBLASLT_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cublasLt64_10.dll" | |||
CUDART_LIB="/c/Program Files/NVIDIA GPU Computing Toolkit/CUDA/v10.1/bin/cudart64_101.dll" | |||
function copy_more_dll() { | |||
# for python whl real use | |||
CP_DST=${BUILD_DIR}/staging/megengine/_internal/lib | |||
rm -rf ${CP_DST} | |||
mkdir ${CP_DST} | |||
if [ ${WINDOWS_WHL_WITH_CUDA} = "true" ]; then | |||
echo "copy nvidia lib to whl use...." | |||
cp "${TRT_LIB}" ${CP_DST} | |||
cp "${CUDNN_LIB}" ${CP_DST} | |||
cp "${CUSOLVER_LIB}" ${CP_DST} | |||
cp "${CUBLAS_LIB}" ${CP_DST} | |||
cp "${CURAND_LIB}" ${CP_DST} | |||
cp "${CUBLASLT_LIB}" ${CP_DST} | |||
cp "${CUDART_LIB}" ${CP_DST} | |||
fi | |||
} | |||
function do_build() { | |||
for ver in ${ALL_PYTHON} | |||
do | |||
@@ -91,7 +125,13 @@ function do_build() { | |||
#change PYTHON_LIBRARY and PYTHON_INCLUDE_DIR, so add | |||
#-r to remove build cache after a new ver build, which | |||
#will be more slow build than without -r | |||
${SRC_DIR}/scripts/cmake-build/host_build.sh -t -r | |||
if [ ${WINDOWS_WHL_WITH_CUDA} = "true" ]; then | |||
echo "build windows whl with cuda" | |||
${SRC_DIR}/scripts/cmake-build/host_build.sh -t -r -c | |||
else | |||
echo "build windows whl with cpu only" | |||
${SRC_DIR}/scripts/cmake-build/host_build.sh -t -r | |||
fi | |||
#call setup.py | |||
BUILD_DIR=${SRC_DIR}/build_dir/host/build/ | |||
@@ -107,6 +147,7 @@ function do_build() { | |||
cp -a python_module/{megengine,setup.py,requires.txt,requires-style.txt,requires-test.txt} staging/ | |||
cd ${BUILD_DIR}/staging/megengine/_internal | |||
llvm-strip -s _mgb.pyd | |||
copy_more_dll | |||
cd ${BUILD_DIR}/staging | |||
${PYTHON_DIR}/python3 setup.py bdist_wheel | |||
cp ${BUILD_DIR}/staging/dist/Meg*.whl ${WINDOWS_WHL_HOME}/ | |||