Browse Source

refactor(dnn/cuda): refactor reorder filter and bias kernel to support conv imma with data type s4

GitOrigin-RevId: 6827b73770
release-1.5
Megvii Engine Team 4 years ago
parent
commit
52b55564d7
1 changed file with 2 additions and 0 deletions
  1. +2
    -0
      dnn/src/cuda/conv_bias/algo.h

+ 2
- 0
dnn/src/cuda/conv_bias/algo.h View File

@@ -66,6 +66,7 @@ public:
CUDA_IMPLICIT_GEMM_1X1_SASS_NCHW4_DOTPROD_INT8,
CUDA_IMPLICIT_GEMM_SASS_NCHW32_IMMA_INT8,
CUDA_IMPLICIT_GEMM_1X1_SASS_NCHW32_IMMA_INT8,
CUDA_IMPLICIT_GEMM_SASS_NCHW64_IMMA_INT4,
};
using Mapper = std::unordered_map<AlgorithmDesc, AlgoBase*>;

@@ -806,6 +807,7 @@ public:
AlgoBatchedMatmul batched_matmul;
std::vector<AlgoInt8NCHW4DotProdImplicitGemm> int8_nchw4_dotprod;
AlgoInt8CHWN4DotProdImplicitGemm int8_chwn4_dotprod;
<<<<<<< HEAD
#if CUDA_VERSION >= 10000
AlgoQUInt4x4x32WMMA wmma_quint4x4x32;
std::vector<AlgoInt8CHWN4IMMAImplicitGemm> int8_chwn4_imma;


Loading…
Cancel
Save