Instructions to use kernels-community/flash-attn2 with libraries, inference providers, notebooks, and local apps. Follow these links to get started.
- Libraries
- Kernels
How to use kernels-community/flash-attn2 with Kernels:
# !pip install kernels
from kernels import get_kernel

kernel = get_kernel("kernels-community/flash-attn2")
- Notebooks
- Google Colab
- Kaggle
Uploaded using `kernel-builder`.
Browse files
- build/torch210-cxx11-cu126-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch210-cxx11-cu126-aarch64-linux/_ops.py +3 -3
- build/torch210-cxx11-cu126-aarch64-linux/metadata.json +1 -1
- build/torch210-cxx11-cu128-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch210-cxx11-cu128-aarch64-linux/_ops.py +3 -3
- build/torch210-cxx11-cu128-aarch64-linux/metadata.json +1 -1
- build/torch210-cxx11-cu130-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch210-cxx11-cu130-aarch64-linux/_ops.py +3 -3
- build/torch210-cxx11-cu130-aarch64-linux/metadata.json +1 -1
- build/torch211-cxx11-cu126-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch211-cxx11-cu126-aarch64-linux/_ops.py +3 -3
- build/torch211-cxx11-cu126-aarch64-linux/metadata.json +1 -1
- build/torch211-cxx11-cu128-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch211-cxx11-cu128-aarch64-linux/_ops.py +3 -3
- build/torch211-cxx11-cu128-aarch64-linux/metadata.json +1 -1
- build/torch211-cxx11-cu130-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch211-cxx11-cu130-aarch64-linux/_ops.py +3 -3
- build/torch211-cxx11-cu130-aarch64-linux/metadata.json +1 -1
- build/torch212-cxx11-cu126-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch212-cxx11-cu126-aarch64-linux/_ops.py +3 -3
- build/torch212-cxx11-cu126-aarch64-linux/metadata.json +1 -1
- build/torch212-cxx11-cu130-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch212-cxx11-cu130-aarch64-linux/_ops.py +3 -3
- build/torch212-cxx11-cu130-aarch64-linux/metadata.json +1 -1
- build/torch212-cxx11-cu132-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so} +1 -1
- build/torch212-cxx11-cu132-aarch64-linux/_ops.py +3 -3
- build/torch212-cxx11-cu132-aarch64-linux/metadata.json +1 -1
build/torch210-cxx11-cu126-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 448533504
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:6a2dbd72f90200c6eeb0af34b80474129ca47b9622a55b6ea387fb71cf129f8b
|
| 3 |
size 448533504
|
build/torch210-cxx11-cu126-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch210-cxx11-cu126-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch210-cxx11-cu128-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1037990952
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9575dbcc1f6deb66ad86fd240114761b7ca5d6c9a603d392e487afd3309bfd1a
|
| 3 |
size 1037990952
|
build/torch210-cxx11-cu128-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch210-cxx11-cu128-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch210-cxx11-cu130-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1008644888
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:801f0f8c09783b2cf1eca03600b3cb41b41d8af172c2b89f14e8b04d38c64c34
|
| 3 |
size 1008644888
|
build/torch210-cxx11-cu130-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch210-cxx11-cu130-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch211-cxx11-cu126-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 448529832
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:a97ba5d5eb2edb48237d7fa376de3d92303eabdb0f45e678f9807c89bcd6835a
|
| 3 |
size 448529832
|
build/torch211-cxx11-cu126-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch211-cxx11-cu126-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch211-cxx11-cu128-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1037987184
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:b87ac231a8ef6d7700ca1d6a3f92ec9a71ac703d3f78a3529c99a08947581aef
|
| 3 |
size 1037987184
|
build/torch211-cxx11-cu128-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch211-cxx11-cu128-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch211-cxx11-cu130-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1008641088
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:9f258f1e0b43582268c0e0a56c9a7446f843730697c1e3b70bc7fd3e4ef48c86
|
| 3 |
size 1008641088
|
build/torch211-cxx11-cu130-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch211-cxx11-cu130-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch212-cxx11-cu126-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 448533232
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:23515351fae9b31d35f535ba553cce63fa3ab080b0185c838103f0710522e9cc
|
| 3 |
size 448533232
|
build/torch212-cxx11-cu126-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch212-cxx11-cu126-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch212-cxx11-cu130-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1008644656
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:1008b71ff56f162d3b920c32bba353fc8533baf4a895ef5345e995bc149d3cb5
|
| 3 |
size 1008644656
|
build/torch212-cxx11-cu130-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch212-cxx11-cu130-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
build/torch212-cxx11-cu132-aarch64-linux/{_flash_attn2_cuda_d36888d.abi3.so → _flash_attn2_cuda_93b0cf2.abi3.so}
RENAMED
|
@@ -1,3 +1,3 @@
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
-
oid sha256:
|
| 3 |
size 1026020752
|
|
|
|
| 1 |
version https://git-lfs.github.com/spec/v1
|
| 2 |
+
oid sha256:f3c04a8219e405c29f2afc41fa0a313cdb7374d9e30e44fb03e24494a128684c
|
| 3 |
size 1026020752
|
build/torch212-cxx11-cu132-aarch64-linux/_ops.py
CHANGED
|
@@ -1,9 +1,9 @@
|
|
| 1 |
import torch
|
| 2 |
-
from . import _flash_attn2_cuda_d36888d
|
| 3 |
-
ops = torch.ops._flash_attn2_cuda_d36888d
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
-
return f"_flash_attn2_cuda_d36888d::{op_name}"
|
|
|
|
| 1 |
import torch
|
| 2 |
+
from . import _flash_attn2_cuda_93b0cf2
|
| 3 |
+
ops = torch.ops._flash_attn2_cuda_93b0cf2
|
| 4 |
|
| 5 |
def add_op_namespace_prefix(op_name: str):
|
| 6 |
"""
|
| 7 |
Prefix op by namespace.
|
| 8 |
"""
|
| 9 |
+
return f"_flash_attn2_cuda_93b0cf2::{op_name}"
|
build/torch212-cxx11-cu132-aarch64-linux/metadata.json
CHANGED
|
@@ -1,6 +1,6 @@
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
-
"id": "_flash_attn2_cuda_d36888d",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|
|
|
|
| 1 |
{
|
| 2 |
"name": "flash-attn2",
|
| 3 |
+
"id": "_flash_attn2_cuda_93b0cf2",
|
| 4 |
"version": 1,
|
| 5 |
"license": "BSD-3-Clause",
|
| 6 |
"python-depends": [],
|