MekkCyber committed on
Commit
4e9c226
·
1 Parent(s): d180d2d

update name

Browse files
This view is limited to 50 files because it contains too many changes. See raw diff
Files changed (50) hide show
  1. build.toml +67 -67
  2. {layer-norm → layer_norm}/ln.h +0 -0
  3. {layer-norm → layer_norm}/ln_api.cpp +0 -0
  4. {layer-norm → layer_norm}/ln_bwd_1024.cu +0 -0
  5. {layer-norm → layer_norm}/ln_bwd_1280.cu +0 -0
  6. {layer-norm → layer_norm}/ln_bwd_1536.cu +0 -0
  7. {layer-norm → layer_norm}/ln_bwd_2048.cu +0 -0
  8. {layer-norm → layer_norm}/ln_bwd_256.cu +0 -0
  9. {layer-norm → layer_norm}/ln_bwd_2560.cu +0 -0
  10. {layer-norm → layer_norm}/ln_bwd_3072.cu +0 -0
  11. {layer-norm → layer_norm}/ln_bwd_4096.cu +0 -0
  12. {layer-norm → layer_norm}/ln_bwd_512.cu +0 -0
  13. {layer-norm → layer_norm}/ln_bwd_5120.cu +0 -0
  14. {layer-norm → layer_norm}/ln_bwd_6144.cu +0 -0
  15. {layer-norm → layer_norm}/ln_bwd_7168.cu +0 -0
  16. {layer-norm → layer_norm}/ln_bwd_768.cu +0 -0
  17. {layer-norm → layer_norm}/ln_bwd_8192.cu +0 -0
  18. {layer-norm → layer_norm}/ln_bwd_kernels.cuh +0 -0
  19. {layer-norm → layer_norm}/ln_fwd_1024.cu +0 -0
  20. {layer-norm → layer_norm}/ln_fwd_1280.cu +0 -0
  21. {layer-norm → layer_norm}/ln_fwd_1536.cu +0 -0
  22. {layer-norm → layer_norm}/ln_fwd_2048.cu +0 -0
  23. {layer-norm → layer_norm}/ln_fwd_256.cu +0 -0
  24. {layer-norm → layer_norm}/ln_fwd_2560.cu +0 -0
  25. {layer-norm → layer_norm}/ln_fwd_3072.cu +0 -0
  26. {layer-norm → layer_norm}/ln_fwd_4096.cu +0 -0
  27. {layer-norm → layer_norm}/ln_fwd_512.cu +0 -0
  28. {layer-norm → layer_norm}/ln_fwd_5120.cu +0 -0
  29. {layer-norm → layer_norm}/ln_fwd_6144.cu +0 -0
  30. {layer-norm → layer_norm}/ln_fwd_7168.cu +0 -0
  31. {layer-norm → layer_norm}/ln_fwd_768.cu +0 -0
  32. {layer-norm → layer_norm}/ln_fwd_8192.cu +0 -0
  33. {layer-norm → layer_norm}/ln_fwd_kernels.cuh +0 -0
  34. {layer-norm → layer_norm}/ln_kernel_traits.h +0 -0
  35. {layer-norm → layer_norm}/ln_parallel_bwd_1024.cu +0 -0
  36. {layer-norm → layer_norm}/ln_parallel_bwd_1280.cu +0 -0
  37. {layer-norm → layer_norm}/ln_parallel_bwd_1536.cu +0 -0
  38. {layer-norm → layer_norm}/ln_parallel_bwd_2048.cu +0 -0
  39. {layer-norm → layer_norm}/ln_parallel_bwd_256.cu +0 -0
  40. {layer-norm → layer_norm}/ln_parallel_bwd_2560.cu +0 -0
  41. {layer-norm → layer_norm}/ln_parallel_bwd_3072.cu +0 -0
  42. {layer-norm → layer_norm}/ln_parallel_bwd_4096.cu +0 -0
  43. {layer-norm → layer_norm}/ln_parallel_bwd_512.cu +0 -0
  44. {layer-norm → layer_norm}/ln_parallel_bwd_5120.cu +0 -0
  45. {layer-norm → layer_norm}/ln_parallel_bwd_6144.cu +0 -0
  46. {layer-norm → layer_norm}/ln_parallel_bwd_7168.cu +0 -0
  47. {layer-norm → layer_norm}/ln_parallel_bwd_768.cu +0 -0
  48. {layer-norm → layer_norm}/ln_parallel_bwd_8192.cu +0 -0
  49. {layer-norm → layer_norm}/ln_parallel_fwd_1024.cu +0 -0
  50. {layer-norm → layer_norm}/ln_parallel_fwd_1280.cu +0 -0
build.toml CHANGED
@@ -1,5 +1,5 @@
1
  [general]
2
- name = "layer-norm"
3
  universal = false
4
 
5
  [torch]
@@ -8,76 +8,76 @@ src = [
8
  "torch-ext/torch_binding.h",
9
  ]
10
 
11
- [kernel.layer-norm]
12
  depends = ["torch"]
13
  backend = "cuda"
14
  include = ["."]
15
  src = [
16
- "layer-norm/ln.h",
17
- "layer-norm/ln_api.cpp",
18
- "layer-norm/ln_bwd_1024.cu",
19
- "layer-norm/ln_bwd_1280.cu",
20
- "layer-norm/ln_bwd_1536.cu",
21
- "layer-norm/ln_bwd_2048.cu",
22
- "layer-norm/ln_bwd_256.cu",
23
- "layer-norm/ln_bwd_2560.cu",
24
- "layer-norm/ln_bwd_3072.cu",
25
- "layer-norm/ln_bwd_4096.cu",
26
- "layer-norm/ln_bwd_512.cu",
27
- "layer-norm/ln_bwd_5120.cu",
28
- "layer-norm/ln_bwd_6144.cu",
29
- "layer-norm/ln_bwd_7168.cu",
30
- "layer-norm/ln_bwd_768.cu",
31
- "layer-norm/ln_bwd_8192.cu",
32
- "layer-norm/ln_bwd_kernels.cuh",
33
- "layer-norm/ln_fwd_1024.cu",
34
- "layer-norm/ln_fwd_1280.cu",
35
- "layer-norm/ln_fwd_1536.cu",
36
- "layer-norm/ln_fwd_2048.cu",
37
- "layer-norm/ln_fwd_256.cu",
38
- "layer-norm/ln_fwd_2560.cu",
39
- "layer-norm/ln_fwd_3072.cu",
40
- "layer-norm/ln_fwd_4096.cu",
41
- "layer-norm/ln_fwd_512.cu",
42
- "layer-norm/ln_fwd_5120.cu",
43
- "layer-norm/ln_fwd_6144.cu",
44
- "layer-norm/ln_fwd_7168.cu",
45
- "layer-norm/ln_fwd_768.cu",
46
- "layer-norm/ln_fwd_8192.cu",
47
- "layer-norm/ln_fwd_kernels.cuh",
48
- "layer-norm/ln_kernel_traits.h",
49
- "layer-norm/ln_parallel_bwd_1024.cu",
50
- "layer-norm/ln_parallel_bwd_1280.cu",
51
- "layer-norm/ln_parallel_bwd_1536.cu",
52
- "layer-norm/ln_parallel_bwd_2048.cu",
53
- "layer-norm/ln_parallel_bwd_256.cu",
54
- "layer-norm/ln_parallel_bwd_2560.cu",
55
- "layer-norm/ln_parallel_bwd_3072.cu",
56
- "layer-norm/ln_parallel_bwd_4096.cu",
57
- "layer-norm/ln_parallel_bwd_512.cu",
58
- "layer-norm/ln_parallel_bwd_5120.cu",
59
- "layer-norm/ln_parallel_bwd_6144.cu",
60
- "layer-norm/ln_parallel_bwd_7168.cu",
61
- "layer-norm/ln_parallel_bwd_768.cu",
62
- "layer-norm/ln_parallel_bwd_8192.cu",
63
- "layer-norm/ln_parallel_fwd_1024.cu",
64
- "layer-norm/ln_parallel_fwd_1280.cu",
65
- "layer-norm/ln_parallel_fwd_1536.cu",
66
- "layer-norm/ln_parallel_fwd_2048.cu",
67
- "layer-norm/ln_parallel_fwd_256.cu",
68
- "layer-norm/ln_parallel_fwd_2560.cu",
69
- "layer-norm/ln_parallel_fwd_3072.cu",
70
- "layer-norm/ln_parallel_fwd_4096.cu",
71
- "layer-norm/ln_parallel_fwd_512.cu",
72
- "layer-norm/ln_parallel_fwd_5120.cu",
73
- "layer-norm/ln_parallel_fwd_6144.cu",
74
- "layer-norm/ln_parallel_fwd_7168.cu",
75
- "layer-norm/ln_parallel_fwd_768.cu",
76
- "layer-norm/ln_parallel_fwd_8192.cu",
77
- "layer-norm/ln_parallel_residual_bwd_kernels.cuh",
78
- "layer-norm/ln_parallel_residual_fwd_kernels.cuh",
79
- "layer-norm/ln_utils.cuh",
80
- "layer-norm/static_switch.h"
81
  ]
82
  cxx-flags = ["-DFLASHATTENTION_DISABLE_PYBIND"]
83
  cuda-flags = [
 
1
  [general]
2
+ name = "layer_norm"
3
  universal = false
4
 
5
  [torch]
 
8
  "torch-ext/torch_binding.h",
9
  ]
10
 
11
+ [kernel.layer_norm]
12
  depends = ["torch"]
13
  backend = "cuda"
14
  include = ["."]
15
  src = [
16
+ "layer_norm/ln.h",
17
+ "layer_norm/ln_api.cpp",
18
+ "layer_norm/ln_bwd_1024.cu",
19
+ "layer_norm/ln_bwd_1280.cu",
20
+ "layer_norm/ln_bwd_1536.cu",
21
+ "layer_norm/ln_bwd_2048.cu",
22
+ "layer_norm/ln_bwd_256.cu",
23
+ "layer_norm/ln_bwd_2560.cu",
24
+ "layer_norm/ln_bwd_3072.cu",
25
+ "layer_norm/ln_bwd_4096.cu",
26
+ "layer_norm/ln_bwd_512.cu",
27
+ "layer_norm/ln_bwd_5120.cu",
28
+ "layer_norm/ln_bwd_6144.cu",
29
+ "layer_norm/ln_bwd_7168.cu",
30
+ "layer_norm/ln_bwd_768.cu",
31
+ "layer_norm/ln_bwd_8192.cu",
32
+ "layer_norm/ln_bwd_kernels.cuh",
33
+ "layer_norm/ln_fwd_1024.cu",
34
+ "layer_norm/ln_fwd_1280.cu",
35
+ "layer_norm/ln_fwd_1536.cu",
36
+ "layer_norm/ln_fwd_2048.cu",
37
+ "layer_norm/ln_fwd_256.cu",
38
+ "layer_norm/ln_fwd_2560.cu",
39
+ "layer_norm/ln_fwd_3072.cu",
40
+ "layer_norm/ln_fwd_4096.cu",
41
+ "layer_norm/ln_fwd_512.cu",
42
+ "layer_norm/ln_fwd_5120.cu",
43
+ "layer_norm/ln_fwd_6144.cu",
44
+ "layer_norm/ln_fwd_7168.cu",
45
+ "layer_norm/ln_fwd_768.cu",
46
+ "layer_norm/ln_fwd_8192.cu",
47
+ "layer_norm/ln_fwd_kernels.cuh",
48
+ "layer_norm/ln_kernel_traits.h",
49
+ "layer_norm/ln_parallel_bwd_1024.cu",
50
+ "layer_norm/ln_parallel_bwd_1280.cu",
51
+ "layer_norm/ln_parallel_bwd_1536.cu",
52
+ "layer_norm/ln_parallel_bwd_2048.cu",
53
+ "layer_norm/ln_parallel_bwd_256.cu",
54
+ "layer_norm/ln_parallel_bwd_2560.cu",
55
+ "layer_norm/ln_parallel_bwd_3072.cu",
56
+ "layer_norm/ln_parallel_bwd_4096.cu",
57
+ "layer_norm/ln_parallel_bwd_512.cu",
58
+ "layer_norm/ln_parallel_bwd_5120.cu",
59
+ "layer_norm/ln_parallel_bwd_6144.cu",
60
+ "layer_norm/ln_parallel_bwd_7168.cu",
61
+ "layer_norm/ln_parallel_bwd_768.cu",
62
+ "layer_norm/ln_parallel_bwd_8192.cu",
63
+ "layer_norm/ln_parallel_fwd_1024.cu",
64
+ "layer_norm/ln_parallel_fwd_1280.cu",
65
+ "layer_norm/ln_parallel_fwd_1536.cu",
66
+ "layer_norm/ln_parallel_fwd_2048.cu",
67
+ "layer_norm/ln_parallel_fwd_256.cu",
68
+ "layer_norm/ln_parallel_fwd_2560.cu",
69
+ "layer_norm/ln_parallel_fwd_3072.cu",
70
+ "layer_norm/ln_parallel_fwd_4096.cu",
71
+ "layer_norm/ln_parallel_fwd_512.cu",
72
+ "layer_norm/ln_parallel_fwd_5120.cu",
73
+ "layer_norm/ln_parallel_fwd_6144.cu",
74
+ "layer_norm/ln_parallel_fwd_7168.cu",
75
+ "layer_norm/ln_parallel_fwd_768.cu",
76
+ "layer_norm/ln_parallel_fwd_8192.cu",
77
+ "layer_norm/ln_parallel_residual_bwd_kernels.cuh",
78
+ "layer_norm/ln_parallel_residual_fwd_kernels.cuh",
79
+ "layer_norm/ln_utils.cuh",
80
+ "layer_norm/static_switch.h"
81
  ]
82
  cxx-flags = ["-DFLASHATTENTION_DISABLE_PYBIND"]
83
  cuda-flags = [
{layer-norm → layer_norm}/ln.h RENAMED
File without changes
{layer-norm → layer_norm}/ln_api.cpp RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_1024.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_1280.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_1536.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_2048.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_256.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_2560.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_3072.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_4096.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_512.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_5120.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_6144.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_7168.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_768.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_8192.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_bwd_kernels.cuh RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_1024.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_1280.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_1536.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_2048.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_256.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_2560.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_3072.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_4096.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_512.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_5120.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_6144.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_7168.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_768.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_8192.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_fwd_kernels.cuh RENAMED
File without changes
{layer-norm → layer_norm}/ln_kernel_traits.h RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_1024.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_1280.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_1536.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_2048.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_256.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_2560.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_3072.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_4096.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_512.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_5120.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_6144.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_7168.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_768.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_bwd_8192.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_fwd_1024.cu RENAMED
File without changes
{layer-norm → layer_norm}/ln_parallel_fwd_1280.cu RENAMED
File without changes