You can not select more than 25 topics
Topics must start with a chinese character,a letter or number, can include dashes ('-') and can be up to 35 characters long.
|
- PARAM_DEFS := ../src/common/elemwise/each_mode.inl
-
- ELEMWISE_IMPL := ../src/cuda/cond_take/kimpl \
- ../src/cuda/elemwise/special_kimpl \
- ../src/cuda/elemwise/kimpl \
- ../src/rocm/elemwise/special_kimpl \
- ../src/rocm/elemwise/kimpl \
- ../src/naive/elemwise/kimpl \
- ../src/cuda/elemwise_multi_type/kimpl
-
- CUDA_CONV_IMPL := ../src/cuda/conv_bias/int8/kimpl ../src/cuda/conv_bias/int8_imma/kimpl ../src/cuda/batch_conv_bias/int8/kimpl
- CUDA_MATMUL_IMPL := ../src/cuda/matrix_mul/fp32_simt/kimpl ../src/cuda/matrix_mul/fp32_simt_gemv/kimpl
-
- all: ${PARAM_DEFS} ${ELEMWISE_IMPL} ${CUDA_CONV_IMPL} $(CUDA_MATMUL_IMPL)
-
- ../src/common/elemwise/each_mode.inl: gen_elemwise_each_mode.py
- ./$^ $@
-
- ../src/cuda/cond_take/kimpl: gen_cond_take_kern_impls.py
- ./$^ --type cuda $@
-
- ../src/cuda/elemwise/special_kimpl: gen_elemwise_special_kern_impls.py
- ./$^ --type cuda $@
-
- ../src/rocm/elemwise/special_kimpl: gen_elemwise_special_kern_impls.py
- ./$^ --type hip $@
-
- ../src/cuda/elemwise/kimpl: gen_elemwise_kern_impls.py
- ./$^ --type cuda $@
-
- ../src/rocm/elemwise/kimpl: gen_elemwise_kern_impls.py
- ./$^ --type hip $@
-
- ../src/%/elemwise/kimpl: gen_elemwise_kern_impls.py
- ./$^ $@
-
- ../src/cuda/elemwise_multi_type/kimpl: gen_elemwise_multi_type_kern_impls.py
- ./$^ --type cuda $@
-
- ../src/cuda/conv_bias/int8/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator
- ./gen_cuda_conv_bias_kern_impls.py --type dp4a $@
- python3 ./cutlass_generator/generator.py --operations all --type simt $@
-
- ../src/cuda/conv_bias/int8_imma/kimpl: gen_cuda_conv_bias_kern_impls.py cutlass_generator
- ./gen_cuda_conv_bias_kern_impls.py --type imma $@
- python3 ./cutlass_generator/generator.py --operations conv2d --type tensorop8816 $@
-
- ../src/cuda/batch_conv_bias/int8/kimpl: gen_cuda_batch_conv_bias_kern_impls.py
- ./$^ --type dp4a $@
-
- ../src/cuda/matrix_mul/fp32_simt/kimpl: gen_cutlass_matmul_kern_impls.py
- ./$^ $@
-
- ../src/cuda/matrix_mul/fp32_simt_gemv/kimpl: gen_cutlass_gemv_batched_strided_kern_impls.py
- ./$^ $@
-
- .PHONY: all
|