diff --git a/ci/run_cpp_test.sh b/ci/run_cpp_test.sh index 1e0e16eb..6dd6fda0 100755 --- a/ci/run_cpp_test.sh +++ b/ci/run_cpp_test.sh @@ -20,4 +20,4 @@ if [[ "$1" == "cpu" || "$1" == "cuda" ]] ; then else echo "Argument must cpu or cuda" exit 1 -fi \ No newline at end of file +fi diff --git a/dnn/test/cuda/convolution.cpp b/dnn/test/cuda/convolution.cpp index b95cfda4..4a69c8f4 100644 --- a/dnn/test/cuda/convolution.cpp +++ b/dnn/test/cuda/convolution.cpp @@ -17,6 +17,7 @@ #include "test/common/convolution.h" #include "test/common/rng.h" #include "test/cuda/benchmark.h" +#include "test/cuda/utils.h" #include "src/cuda/utils.h" @@ -203,18 +204,20 @@ TEST_F(CUDA, CONVOLUTION_BACKWARD_DATA) .set_epsilon(1e-3) .set_param(arg.param) .exec(TensorLayoutArray{filter, dst, src}); - src.dtype = dst.dtype = filter.dtype = dtype::Float16(); - checker.set_rng(0, &rng) - .set_rng(1, &rng) - .set_epsilon(1e-1) - .set_param(arg.param) - .exec(TensorLayoutArray{filter, dst, src}); - arg.param.compute_mode = param::Convolution::ComputeMode::FLOAT32; - checker.set_rng(0, &rng) - .set_rng(1, &rng) - .set_epsilon(1e-1) - .set_param(arg.param) - .exec(TensorLayoutArray{filter, dst, src}); + if (!megdnn::test::check_compute_capability(6, 0)) { + src.dtype = dst.dtype = filter.dtype = dtype::Float16(); + checker.set_rng(0, &rng) + .set_rng(1, &rng) + .set_epsilon(1e-1) + .set_param(arg.param) + .exec(TensorLayoutArray{filter, dst, src}); + arg.param.compute_mode = param::Convolution::ComputeMode::FLOAT32; + checker.set_rng(0, &rng) + .set_rng(1, &rng) + .set_epsilon(1e-1) + .set_param(arg.param) + .exec(TensorLayoutArray{filter, dst, src}); + } } } diff --git a/src/jit/impl/halide/compiler_cuda.cpp b/src/jit/impl/halide/compiler_cuda.cpp index 75347122..3c109e2f 100644 --- a/src/jit/impl/halide/compiler_cuda.cpp +++ b/src/jit/impl/halide/compiler_cuda.cpp @@ -49,7 +49,7 @@ HalideCudaTargetTrait::FeatureSet HalideCudaTargetTrait::features( set.set(Target::CUDACapability32); } else if (in(35, 40)) { set.set(Target::CUDACapability35); - } else if (in(50, 60)) { + } else if (in(50, 61)) { set.set(Target::CUDACapability50); } else if (in(61, 70)) { set.set(Target::CUDACapability61);