Update README.md
Browse files
README.md
CHANGED
|
@@ -17,30 +17,29 @@ This is the repository card of {repo_id} that has been pushed on the Hub. It was
|
|
| 17 |
from kernels import get_kernel
|
| 18 |
|
| 19 |
kernel_module = get_kernel("REPO_ID") # <- change the ID if needed
|
| 20 |
-
|
| 21 |
|
| 22 |
-
|
| 23 |
```
|
| 24 |
|
| 25 |
## Available functions
|
| 26 |
|
| 27 |
-
- `
|
| 28 |
-
- `
|
| 29 |
-
- `
|
| 30 |
-
- `
|
| 31 |
-
- `
|
| 32 |
-
- `
|
| 33 |
-
- `gelu_new`
|
| 34 |
-
- `gelu_quick`
|
| 35 |
-
- `gelu_tanh`
|
| 36 |
-
- `silu`
|
| 37 |
-
- `gelu`
|
| 38 |
-
- `layers`
|
| 39 |
|
| 40 |
## Supported backends
|
| 41 |
|
| 42 |
- cuda
|
| 43 |
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 44 |
## Benchmarks
|
| 45 |
|
| 46 |
[TODO: provide benchmarks if available]
|
|
|
|
| 17 |
from kernels import get_kernel
|
| 18 |
|
| 19 |
kernel_module = get_kernel("REPO_ID") # <- change the ID if needed
|
| 20 |
+
flash_attn_combine = kernel_module.flash_attn_combine
|
| 21 |
|
| 22 |
+
flash_attn_combine(...)
|
| 23 |
```
|
| 24 |
|
| 25 |
## Available functions
|
| 26 |
|
| 27 |
+
- `flash_attn_combine`
|
| 28 |
+
- `flash_attn_func`
|
| 29 |
+
- `flash_attn_qkvpacked_func`
|
| 30 |
+
- `flash_attn_varlen_func`
|
| 31 |
+
- `flash_attn_with_kvcache`
|
| 32 |
+
- `get_scheduler_metadata`
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
|
| 33 |
|
| 34 |
## Supported backends
|
| 35 |
|
| 36 |
- cuda
|
| 37 |
|
| 38 |
+
## CUDA Capabilities
|
| 39 |
+
|
| 40 |
+
- 9.0a
|
| 41 |
+
- 8.0
|
| 42 |
+
|
| 43 |
## Benchmarks
|
| 44 |
|
| 45 |
[TODO: provide benchmarks if available]
|