提交 5a14a892 编写于 作者: M Megvii Engine Team 提交者: huangxinda

refactor(dnn/cuda): refactor cutlass kernel generator for gemm and gemv

GitOrigin-RevId: 11d78ab2270f0720d7d79e186124a1254c467980
上级 b33217d8
@@ -37,21 +37,21 @@ all: ${PARAM_DEFS} ${ELEMWISE_IMPL} ${CUDA_CONV_IMPL} $(CUDA_MATMUL_IMPL)
 ../src/cuda/elemwise_multi_type/kimpl: gen_elemwise_multi_type_kern_impls.py
 	./$^ --type cuda $@
-../src/cuda/conv_bias/int8/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator
+../src/cuda/conv_bias/int8/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator/generator.py
 	./gen_cuda_conv_bias_kern_impls.py --type dp4a $@
-	python3 ./cutlass_generator/generator.py --operations all --type simt $@
+	python3 ./cutlass_generator/generator.py --operations conv2d --type simt $@
-../src/cuda/conv_bias/int8_imma/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator
+../src/cuda/conv_bias/int8_imma/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator/generator.py
 	./gen_cuda_conv_bias_kern_impls.py --type imma $@
 	python3 ./cutlass_generator/generator.py --operations conv2d --type tensorop8816 $@
 ../src/cuda/batch_conv_bias/int8/kimpl: gen_cuda_batch_conv_bias_kern_impls.py
 	./$^ --type dp4a $@
-../src/cuda/matrix_mul/fp32_simt/kimpl: gen_cutlass_matmul_kern_impls.py
-	./$^ $@
+../src/cuda/matrix_mul/fp32_simt/kimpl: cutlass_generator/generator.py
+	python3 ./cutlass_generator/generator.py --operations gemm --type simt $@
-../src/cuda/matrix_mul/fp32_simt_gemv/kimpl: gen_cutlass_gemv_batched_strided_kern_impls.py
-	./$^ $@
+../src/cuda/matrix_mul/fp32_simt_gemv/kimpl: cutlass_generator
+	python3 ./cutlass_generator/generator.py --operations gemv --type simt $@
 .PHONY: all
Markdown is supported
0% .
You are about to add 0 people to the discussion. Proceed with caution.
先完成此消息的编辑!
想要评论请 注册