Kernels
File size: 923 Bytes
44e9845
 
cef5fdf
 
 
 
44e9845
 
 
 
 
 
 
 
f5a7d38
cf68df1
44e9845
f3b99fb
e5e2eeb
f3b99fb
e5e2eeb
0045757
44e9845
 
 
 
 
 
cf68df1
 
 
 
 
e5e2eeb
cf68df1
e5e2eeb
0045757
cf68df1
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
16
17
18
19
20
21
22
23
24
25
26
27
28
29
30
31
32
33
34
35
36
37
38
39
40
41
42
43
44
45
# Package-wide settings: the package name and the backends it lists.
[general]
name = "activation"
backends = ["cuda", "rocm"]

# Torch extension sources: the C++ binding file and its header under torch-ext/.
# NOTE(review): presumably this is where the ops are registered with PyTorch — confirm.
[torch]
src = [
  "torch-ext/torch_binding.cpp",
  "torch-ext/torch_binding.h",
]

# ROCm build of the activation kernels, limited to the gfx90a and gfx942
# architectures. The source list is the same as in [kernel.activation_cuda].
# NOTE(review): the .cu files are listed under the rocm backend as-is;
# presumably the build tool translates them for HIP — confirm.
[kernel.activation]
backend = "rocm"
rocm-archs = ["gfx90a", "gfx942"]
depends = ["torch"]
src = [
  # Kernel implementations.
  "activation/poly_norm.cu",
  "activation/fused_mul_poly_norm.cu",
  "activation/rms_norm.cu",
  "activation/fused_add_rms_norm.cu",
  "activation/grouped_poly_norm.cu",
  # Shared headers.
  "activation/cuda_compat.h",
  "activation/dispatch_utils.h",
  "activation/assert_utils.h",
  "activation/atomic_utils.h",
]

# CUDA build of the activation kernels. It lists the same source files as
# [kernel.activation], the ROCm variant, so the two lists should be kept in
# sync when files are added or removed.
# NOTE(review): no architecture/capability list is given here, unlike the
# rocm-archs key on the ROCm table; presumably the build tool's default CUDA
# targets apply — confirm.
[kernel.activation_cuda]
backend = "cuda"
src = [
  # Kernel implementations.
  "activation/poly_norm.cu",
  "activation/fused_mul_poly_norm.cu",
  "activation/rms_norm.cu",
  "activation/fused_add_rms_norm.cu",
  "activation/grouped_poly_norm.cu",
  # Shared headers.
  "activation/cuda_compat.h",
  "activation/dispatch_utils.h",
  "activation/assert_utils.h",
  "activation/atomic_utils.h",
]
depends = ["torch"]