File size: 1,115 Bytes
5a84343
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
6c3d9d6
5a84343
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
# Project-wide settings; `name` identifies this kernel package.
[general]
name = "punica_sgmv"

# Torch extension binding: one C++ source file and its header.
[torch]
src = ["torch-ext/torch_binding.cpp", "torch-ext/torch_binding.h"]

# SGMV kernel built from the CUTLASS sources under sgmv/.
# NOTE(review): unlike the sgmv_flashinfer and bgmv tables, no
# cuda-capabilities list is given here -- confirm the default is intended.
[kernel.sgmv]
language = "cuda"
depends = ["cutlass_3_8", "torch"]
src = ["sgmv/sgmv_cutlass.cu", "sgmv/sgmv_cutlass.cuh"]

# SGMV kernel variant built from sgmv_flashinfer/ plus the shared
# flashinfer/ headers it lists below.
[kernel.sgmv_flashinfer]
language = "cuda"
depends = ["torch"]
# "." is on the include path; the listed sources live in sibling
# top-level directories (flashinfer/, sgmv_flashinfer/).
include = ["."]
cuda-capabilities = [
  "8.0",
  "8.6",
  "8.7",
  "8.9",
  "9.0",
  "10.0",
  "10.1",
  "12.0",
]
src = [
  "flashinfer/cp_async.cuh",
  "flashinfer/mma.cuh",
  "flashinfer/permuted_smem.cuh",
  "flashinfer/vec_dtypes.cuh",
  "sgmv_flashinfer/sgmv_all.cu",
  "sgmv_flashinfer/sgmv_config.h",
  "sgmv_flashinfer/sgmv_flashinfer.cuh",
]

# BGMV kernel built from bgmv/ plus one shared flashinfer/ header.
[kernel.bgmv]
language = "cuda"
depends = ["torch"]
# "." is on the include path; sources reference both bgmv/ and flashinfer/.
include = ["."]
cuda-capabilities = [
  "8.0",
  "8.6",
  "8.7",
  "8.9",
  "9.0",
  "10.0",
  "10.1",
  "12.0",
]
src = [
  "bgmv/bgmv_all.cu",
  "bgmv/bgmv_impl.cuh",
  "bgmv/bgmv_config.h",
  "flashinfer/vec_dtypes.cuh",
]

# Ops source (punica_ops.cc) together with the config/API headers it is
# listed with from bgmv/, sgmv/ and sgmv_flashinfer/.
# NOTE(review): language is "cuda" although only .cc/.h files are listed
# here -- confirm this is intentional.
[kernel.punica_kernels]
language = "cuda"
depends = ["torch"]
include = ["."]
src = [
  "bgmv/bgmv_config.h",
  "punica_kernels/punica_ops.cc",
  "sgmv/sgmv.h",
  "sgmv_flashinfer/sgmv_config.h",
]