Kernels:

kernels-community
/

flash-attn2

Trusted publisher

kernels-bot committed 17 days ago

Commit

c5b9b7c

verified ·

1 Parent(s): 4d869f3

Uploaded using `kernel-builder`.

Files changed (12) hide show

build/torch210-cxx11-xpu20253-x86_64-linux/{_flash_attn2_xpu_14f6010.abi3.so → _flash_attn2_xpu_85c21a0.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:4aebc32fcc23d3e214267b829b34593617c300865c7ee84388b62820bcc96c59
-size 37243424

 version https://git-lfs.github.com/spec/v1
+oid sha256:15a9d3044a02aff0b2f3c240b62c7eb54124878c480717102384dd89090e77ae
+size 17713168

build/torch210-cxx11-xpu20253-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _flash_attn2_xpu_14f6010
-ops = torch.ops._flash_attn2_xpu_14f6010
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_flash_attn2_xpu_14f6010::{op_name}"

 import torch
+from . import _flash_attn2_xpu_85c21a0
+ops = torch.ops._flash_attn2_xpu_85c21a0
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_flash_attn2_xpu_85c21a0::{op_name}"

build/torch210-cxx11-xpu20253-x86_64-linux/flash_attn_interface.py CHANGED Viewed

@@ -36,14 +36,7 @@ def _get_block_size_n(device, head_dim, is_dropout, is_causal):
     assert head_dim <= 256
     if device.type == "xpu":
-        if head_dim <= 96:
-            return 64
-        elif head_dim <= 128:
-            return 32
-        elif head_dim <= 256:
-            return 64
-        else:
-            return 32
     # This should match the block sizes in the CUDA kernel
     major, minor = torch.cuda.get_device_capability(device)

     assert head_dim <= 256
     if device.type == "xpu":
+        return 64
     # This should match the block sizes in the CUDA kernel
     major, minor = torch.cuda.get_device_capability(device)

build/torch210-cxx11-xpu20253-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "flash-attn2",
-  "id": "_flash_attn2_xpu_14f6010",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "flash-attn2",
+  "id": "_flash_attn2_xpu_85c21a0",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch211-cxx11-xpu20253-x86_64-linux/{_flash_attn2_xpu_14f6010.abi3.so → _flash_attn2_xpu_85c21a0.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:58e4af382503705b7154ce52ea48013f45f9bd1558f4469b96e17a25878b6ab4
-size 37243424

 version https://git-lfs.github.com/spec/v1
+oid sha256:54c1c44285ae6adbd98d2eeaaa1f475dd74170c5d5676091ac26bf01091a0da5
+size 17713168

build/torch211-cxx11-xpu20253-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _flash_attn2_xpu_14f6010
-ops = torch.ops._flash_attn2_xpu_14f6010
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_flash_attn2_xpu_14f6010::{op_name}"

 import torch
+from . import _flash_attn2_xpu_85c21a0
+ops = torch.ops._flash_attn2_xpu_85c21a0
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_flash_attn2_xpu_85c21a0::{op_name}"

build/torch211-cxx11-xpu20253-x86_64-linux/flash_attn_interface.py CHANGED Viewed

@@ -36,14 +36,7 @@ def _get_block_size_n(device, head_dim, is_dropout, is_causal):
     assert head_dim <= 256
     if device.type == "xpu":
-        if head_dim <= 96:
-            return 64
-        elif head_dim <= 128:
-            return 32
-        elif head_dim <= 256:
-            return 64
-        else:
-            return 32
     # This should match the block sizes in the CUDA kernel
     major, minor = torch.cuda.get_device_capability(device)

     assert head_dim <= 256
     if device.type == "xpu":
+        return 64
     # This should match the block sizes in the CUDA kernel
     major, minor = torch.cuda.get_device_capability(device)

build/torch211-cxx11-xpu20253-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "flash-attn2",
-  "id": "_flash_attn2_xpu_14f6010",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "flash-attn2",
+  "id": "_flash_attn2_xpu_85c21a0",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch212-cxx11-xpu20253-x86_64-linux/{_flash_attn2_xpu_14f6010.abi3.so → _flash_attn2_xpu_85c21a0.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:66c1acbc81d29095817f87ce78459026c256d33b40b54ca3416e5a24d7df9b8b
-size 37198312

 version https://git-lfs.github.com/spec/v1
+oid sha256:d32013ee9eba7775b2ce44c94d6059798f6c56cf7e9b32b5c7f7684aaedd99ff
+size 17672144

build/torch212-cxx11-xpu20253-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _flash_attn2_xpu_14f6010
-ops = torch.ops._flash_attn2_xpu_14f6010
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_flash_attn2_xpu_14f6010::{op_name}"

 import torch
+from . import _flash_attn2_xpu_85c21a0
+ops = torch.ops._flash_attn2_xpu_85c21a0
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_flash_attn2_xpu_85c21a0::{op_name}"

build/torch212-cxx11-xpu20253-x86_64-linux/flash_attn_interface.py CHANGED Viewed

@@ -36,14 +36,7 @@ def _get_block_size_n(device, head_dim, is_dropout, is_causal):
     assert head_dim <= 256
     if device.type == "xpu":
-        if head_dim <= 96:
-            return 64
-        elif head_dim <= 128:
-            return 32
-        elif head_dim <= 256:
-            return 64
-        else:
-            return 32
     # This should match the block sizes in the CUDA kernel
     major, minor = torch.cuda.get_device_capability(device)

     assert head_dim <= 256
     if device.type == "xpu":
+        return 64
     # This should match the block sizes in the CUDA kernel
     major, minor = torch.cuda.get_device_capability(device)

build/torch212-cxx11-xpu20253-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "flash-attn2",
-  "id": "_flash_attn2_xpu_14f6010",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "flash-attn2",
+  "id": "_flash_attn2_xpu_85c21a0",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],