GitOrigin-RevId: 11d78ab227
release-1.5
@@ -37,21 +37,21 @@ all: ${PARAM_DEFS} ${ELEMWISE_IMPL} ${CUDA_CONV_IMPL} $(CUDA_MATMUL_IMPL) | |||||
../src/cuda/elemwise_multi_type/kimpl: gen_elemwise_multi_type_kern_impls.py | ../src/cuda/elemwise_multi_type/kimpl: gen_elemwise_multi_type_kern_impls.py | ||||
./$^ --type cuda $@ | ./$^ --type cuda $@ | ||||
../src/cuda/conv_bias/int8/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator | |||||
../src/cuda/conv_bias/int8/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator/generator.py | |||||
./gen_cuda_conv_bias_kern_impls.py --type dp4a $@ | ./gen_cuda_conv_bias_kern_impls.py --type dp4a $@ | ||||
python3 ./cutlass_generator/generator.py --operations all --type simt $@ | |||||
python3 ./cutlass_generator/generator.py --operations conv2d --type simt $@ | |||||
../src/cuda/conv_bias/int8_imma/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator | |||||
../src/cuda/conv_bias/int8_imma/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator/generator.py | |||||
./gen_cuda_conv_bias_kern_impls.py --type imma $@ | ./gen_cuda_conv_bias_kern_impls.py --type imma $@ | ||||
python3 ./cutlass_generator/generator.py --operations conv2d --type tensorop8816 $@ | python3 ./cutlass_generator/generator.py --operations conv2d --type tensorop8816 $@ | ||||
../src/cuda/batch_conv_bias/int8/kimpl: gen_cuda_batch_conv_bias_kern_impls.py | ../src/cuda/batch_conv_bias/int8/kimpl: gen_cuda_batch_conv_bias_kern_impls.py | ||||
./$^ --type dp4a $@ | ./$^ --type dp4a $@ | ||||
../src/cuda/matrix_mul/fp32_simt/kimpl: gen_cutlass_matmul_kern_impls.py | |||||
./$^ $@ | |||||
../src/cuda/matrix_mul/fp32_simt/kimpl: cutlass_generator/generator.py | |||||
python3 ./cutlass_generator/generator.py --operations gemm --type simt $@ | |||||
../src/cuda/matrix_mul/fp32_simt_gemv/kimpl: gen_cutlass_gemv_batched_strided_kern_impls.py | |||||
./$^ $@ | |||||
../src/cuda/matrix_mul/fp32_simt_gemv/kimpl: cutlass_generator | |||||
python3 ./cutlass_generator/generator.py --operations gemv --type simt $@ | |||||
.PHONY: all | .PHONY: all |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |
@@ -40,16 +40,19 @@ using Convolution = | |||||
cutlass::arch::OpMultiplyAdd>; | cutlass::arch::OpMultiplyAdd>; | ||||
template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | template void megdnn::cuda::cutlass_wrapper::cutlass_convolution_wrapper<Convolution>( | ||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
const typename Convolution::ElementSrc* d_src, | |||||
const typename Convolution::ElementFilter* d_filter, | |||||
const typename Convolution::ElementBias* d_bias, | |||||
const typename Convolution::ElementDst* d_z, | |||||
typename Convolution::ElementDst* d_dst, | |||||
int* workspace, | |||||
typename Convolution::ConvolutionParameter const& conv_param, | |||||
typename Convolution::EpilogueOutputOp::Params const& epilogue, | |||||
cudaStream_t stream, | |||||
typename Convolution::ExtraParam extra_param); | |||||
#pragma GCC diagnostic pop | #pragma GCC diagnostic pop | ||||
#endif | #endif |