# punica-sgmv / build.toml
# danieldk (HF Staff): "Set CUDA capabilities for bgmv" (6c3d9d6)
# Project-wide settings.
[general]
# Name of the kernel package produced by this build.
name = "punica_sgmv"
# Torch extension binding: the C++ source and header under torch-ext/.
[torch]
src = [
    "torch-ext/torch_binding.cpp",
    "torch-ext/torch_binding.h",
]
# SGMV kernel built from the CUTLASS-based sources; the only kernel in this
# file that depends on cutlass_3_8.
[kernel.sgmv]
language = "cuda"
depends = ["cutlass_3_8", "torch"]
src = [
    "sgmv/sgmv_cutlass.cu",
    "sgmv/sgmv_cutlass.cuh",
]
# SGMV kernel built on the shared flashinfer/ helper headers.
[kernel.sgmv_flashinfer]
language = "cuda"
depends = ["torch"]
# "." is listed as an include directory; presumably so that sources can
# include headers by project-relative path (e.g. "flashinfer/...") - confirm.
include = ["."]
# Explicit list of CUDA compute capabilities for this kernel.
cuda-capabilities = [
    "8.0",
    "8.6",
    "8.7",
    "8.9",
    "9.0",
    "10.0",
    "10.1",
    "12.0",
]
src = [
    "flashinfer/cp_async.cuh",
    "flashinfer/mma.cuh",
    "flashinfer/permuted_smem.cuh",
    "flashinfer/vec_dtypes.cuh",
    "sgmv_flashinfer/sgmv_all.cu",
    "sgmv_flashinfer/sgmv_config.h",
    "sgmv_flashinfer/sgmv_flashinfer.cuh",
]
# BGMV kernel; also lists flashinfer/vec_dtypes.cuh among its sources.
[kernel.bgmv]
language = "cuda"
depends = ["torch"]
# "." is listed as an include directory; presumably so that sources can
# include headers by project-relative path (e.g. "flashinfer/...") - confirm.
include = ["."]
# Explicit list of CUDA compute capabilities for this kernel.
cuda-capabilities = [
    "8.0",
    "8.6",
    "8.7",
    "8.9",
    "9.0",
    "10.0",
    "10.1",
    "12.0",
]
src = [
    "bgmv/bgmv_all.cu",
    "bgmv/bgmv_impl.cuh",
    "bgmv/bgmv_config.h",
    "flashinfer/vec_dtypes.cuh",
]
# Op source (punica_ops.cc) listed together with the bgmv, sgmv and
# sgmv_flashinfer headers; no .cu files are listed for this kernel.
[kernel.punica_kernels]
language = "cuda"
depends = ["torch"]
include = ["."]
src = [
    "bgmv/bgmv_config.h",
    "punica_kernels/punica_ops.cc",
    "sgmv/sgmv.h",
    "sgmv_flashinfer/sgmv_config.h",
]