提交 52b55564 编写于 作者: M Megvii Engine Team

refactor(dnn/cuda): refactor reorder filter and bias kernel to support conv imma with data type s4

GitOrigin-RevId: 6827b73770872277c00a7505b0cb39dd05fd8d46
上级 d2673c5a
......@@ -66,6 +66,7 @@ public:
CUDA_IMPLICIT_GEMM_1X1_SASS_NCHW4_DOTPROD_INT8,
CUDA_IMPLICIT_GEMM_SASS_NCHW32_IMMA_INT8,
CUDA_IMPLICIT_GEMM_1X1_SASS_NCHW32_IMMA_INT8,
CUDA_IMPLICIT_GEMM_SASS_NCHW64_IMMA_INT4,
};
using Mapper = std::unordered_map<AlgorithmDesc, AlgoBase*>;
......@@ -806,6 +807,7 @@ public:
AlgoBatchedMatmul batched_matmul;
std::vector<AlgoInt8NCHW4DotProdImplicitGemm> int8_nchw4_dotprod;
AlgoInt8CHWN4DotProdImplicitGemm int8_chwn4_dotprod;
<<<<<<< HEAD
#if CUDA_VERSION >= 10000
AlgoQUInt4x4x32WMMA wmma_quint4x4x32;
std::vector<AlgoInt8CHWN4IMMAImplicitGemm> int8_chwn4_imma;
......
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册