-
Notifications
You must be signed in to change notification settings - Fork 66
/
config.py
61 lines (59 loc) · 1.47 KB
/
config.py
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
46
47
48
49
50
51
52
53
54
55
56
57
58
59
60
61
# Kernel registry -- add an entry here to register a new kernel.
#
# Layout: kernel name -> 'source_files' -> GPU target -> source file(s).
# The value for a target is either a single path string or a list of path
# strings; both forms appear below. Provide one target key for every GPU
# you want the kernel to be buildable for.
sources = {
    "attn": {
        "source_files": {
            "h100": "kernels/attn/h100/h100.cu",
        },
    },
    "hedgehog": {
        "source_files": {
            "h100": "kernels/hedgehog/hh.cu",
        },
    },
    "based": {
        "source_files": {
            # Single-element list (not a bare string).
            "h100": ["kernels/based/lin_attn_h100.cu"],
        },
    },
    "cylon": {
        "source_files": {
            "h100": "kernels/cylon/cylon.cu",
        },
    },
    "flux": {
        "source_files": {
            # This kernel is split across two source files.
            "h100": [
                "kernels/flux/flux_gate.cu",
                "kernels/flux/flux_gelu.cu",
            ],
        },
    },
    "fftconv": {
        "source_files": {
            "h100": "kernels/fftconv/pc/pc.cu",
        },
    },
    "fused_rotary": {
        "source_files": {
            "h100": "kernels/rotary/pc.cu",
        },
    },
    "fused_layernorm": {
        "source_files": {
            "h100": "kernels/layernorm/non_pc/layer_norm.cu",
        },
    },
    "mamba2": {
        "source_files": {
            "h100": "kernels/mamba2/pc.cu",
        },
    },
}
# Kernels selected for the build.
#
# Each name must be a key of `sources`. During development you rarely need
# every kernel; trim this list to just the ones you are working on, e.g.
# ['mamba2', 'fftconv']. Note that 'cylon' and 'flux' are registered in
# `sources` but are not selected here.
kernels = [
    "attn",
    "mamba2",
    "hedgehog",
    "fftconv",
    "fused_rotary",
    "based",
    "fused_layernorm",
]
# GPU target to build for.
# NOTE(review): presumably used to select the matching key under each
# kernel's 'source_files' mapping in `sources` -- confirm against the build
# script that consumes this module.
target = "h100"