Browse Source

fix(dnn/cuda): fix algo matmul for conv bwd filter

Fix the fastrun "workspace size not available" exception and the device OOM error, both caused by an incorrect workspace size calculation in the matmul algorithm of the convolution backward filter.

GitOrigin-RevId: de96b4fe11
release-1.6
Megvii Engine Team 3 years ago
parent
commit
a0231a7920
1 changed file with 2 additions and 2 deletions
  1. +2
    -2
      dnn/src/cuda/convolution/backward_filter/matmul.cpp

+ 2
- 2
dnn/src/cuda/convolution/backward_filter/matmul.cpp View File

@@ -21,11 +21,11 @@ using namespace cuda;

namespace {
std::pair<TensorLayoutArray, MatrixMulForward::Param> sub_opr_config(
const ConvolutionBackwardDataImpl::CanonizedFilterMeta& fm,
const ConvolutionBackwardFilterImpl::CanonizedFilterMeta& fm,
const TensorLayout& src_layout, const TensorLayout& diff_layout,
const TensorLayout& grad_layout,
const ConvolutionBackwardFilterImpl* opr) {
size_t N = grad_layout.shape[0], IC = fm.icpg,
size_t N = src_layout.shape[0], IC = fm.icpg,
OC = fm.ocpg, OH = diff_layout.shape[2],
OW = diff_layout.shape[3], FH = fm.spatial[0],
FW = fm.spatial[1];


Loading…
Cancel
Save