Kernels:

kernels-community
/

flash-mla

Trusted publisher

Kernel card Files Files and versions

xet

Community

danieldk HF Staff committed 13 days ago

Commit

f10ba3f

1 Parent(s): 745c77f

Remove builds incompatible with kernels >= 0.14

Browse files

This view is limited to 50 files because it contains too many changes. See raw diff

Files changed (50) hide show

build/torch25-cxx11-cu118-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch25-cxx11-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch25-cxx11-cu118-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch25-cxx11-cu121-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch25-cxx11-cu121-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch25-cxx11-cu121-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch25-cxx11-cu124-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch25-cxx11-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch25-cxx11-cu124-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch25-cxx98-cu118-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch25-cxx98-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch25-cxx98-cu118-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch25-cxx98-cu121-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch25-cxx98-cu121-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch25-cxx98-cu121-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch25-cxx98-cu124-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch25-cxx98-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch25-cxx98-cu124-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx11-cu118-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx11-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch26-cxx11-cu118-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx11-cu124-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx11-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch26-cxx11-cu124-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx11-cu126-aarch64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx11-cu126-aarch64-linux/flash_mla/_flash_mla_341ab77.abi3.so +0 -3
build/torch26-cxx11-cu126-aarch64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx11-cu126-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx11-cu126-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch26-cxx11-cu126-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx98-cu118-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx98-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch26-cxx98-cu118-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx98-cu124-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx98-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch26-cxx98-cu124-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx98-cu126-aarch64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx98-cu126-aarch64-linux/flash_mla/_flash_mla_341ab77.abi3.so +0 -3
build/torch26-cxx98-cu126-aarch64-linux/flash_mla/_ops.py +0 -9
build/torch26-cxx98-cu126-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch26-cxx98-cu126-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch26-cxx98-cu126-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch27-cxx11-cu118-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch27-cxx11-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3
build/torch27-cxx11-cu118-x86_64-linux/flash_mla/_ops.py +0 -9
build/torch27-cxx11-cu126-aarch64-linux/flash_mla/__init__.py +0 -33
build/torch27-cxx11-cu126-aarch64-linux/flash_mla/_flash_mla_341ab77.abi3.so +0 -3
build/torch27-cxx11-cu126-aarch64-linux/flash_mla/_ops.py +0 -9
build/torch27-cxx11-cu126-x86_64-linux/flash_mla/__init__.py +0 -33
build/torch27-cxx11-cu126-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so +0 -3

build/torch25-cxx11-cu118-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch25-cxx11-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:a9a2b99b276b5aa714b27d1f54cc5da2d451e65a9ed385c583daf528f2c030a9
-size 2564144

build/torch25-cxx11-cu118-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch25-cxx11-cu121-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch25-cxx11-cu121-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:77e241f633fa5b103f379ba6ac58d2cc068e0c3fc4d4f20ac1e1c679fc19614f
-size 2595176

build/torch25-cxx11-cu121-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch25-cxx11-cu124-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch25-cxx11-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:31aa895a57efbd29aeff693b65b02842926bf1788d6f98022c32470a60265f9e
-size 2580248

build/torch25-cxx11-cu124-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch25-cxx98-cu118-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch25-cxx98-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:7454c10a3b29128e035bdb3fa18d5fc3706f7970542a0bcb55d9714f0999d42f
-size 2556792

build/torch25-cxx98-cu118-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch25-cxx98-cu121-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch25-cxx98-cu121-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:c8cb9402f3091420227cbccf1ec4938a444765e26f5d34c356c76bf7c85630d0
-size 2587896

build/torch25-cxx98-cu121-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch25-cxx98-cu124-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch25-cxx98-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:bb4be09cbde1979c1aa17e3bc93c1538f129b438d305bee0fe96f3c08efeee04
-size 2572968

build/torch25-cxx98-cu124-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch26-cxx11-cu118-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx11-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:35c67c788220d8988e47cd4ad976495450b71cd682bd8ab08af3db066d625126
-size 2564496

build/torch26-cxx11-cu118-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch26-cxx11-cu124-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx11-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:069fb3e3a051c91e73390245c7463218829b8decf0f60bd6fc9a0ba8127b5bd2
-size 2580592

build/torch26-cxx11-cu124-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch26-cxx11-cu126-aarch64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx11-cu126-aarch64-linux/flash_mla/_flash_mla_341ab77.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:e1e97fef62f5ebbe6b19b0d5fbe700fcdf6b9acd7a54cba6f0b1d23665188fa9
-size 2643848

build/torch26-cxx11-cu126-aarch64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_341ab77
-ops = torch.ops._flash_mla_341ab77
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_341ab77::{op_name}"

build/torch26-cxx11-cu126-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx11-cu126-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:50fad86fa7bc15096c2a1feadf8091b20e188e32b8c0633423ec26e4e8e8e7ce
-size 2560552

build/torch26-cxx11-cu126-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch26-cxx98-cu118-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx98-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:ae937ddfbc3e6097b2fdd9197f2ddb5b9f66c65146a4de30ccab59dab6e18dd4
-size 2557136

build/torch26-cxx98-cu118-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch26-cxx98-cu124-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx98-cu124-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:503910324475f8bd9dab47687339005f58e5b623bf0c9e4234fabf099c08da33
-size 2573312

build/torch26-cxx98-cu124-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch26-cxx98-cu126-aarch64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx98-cu126-aarch64-linux/flash_mla/_flash_mla_341ab77.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:6f15b3b0bd0bee56760bd6500175ca5a1fd17f2742ef9496c28ea3720d038c66
-size 2640208

build/torch26-cxx98-cu126-aarch64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_341ab77
-ops = torch.ops._flash_mla_341ab77
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_341ab77::{op_name}"

build/torch26-cxx98-cu126-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch26-cxx98-cu126-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:2c41fa4058ee2bb5d3d90458a7f92f0ef1c10e8bc854329cf7c208025bb244b2
-size 2553280

build/torch26-cxx98-cu126-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch27-cxx11-cu118-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch27-cxx11-cu118-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:59c4034880f4482b06e447a2c4810aaf8009b7d4c86a4fd71356f169df986535
-size 2564632

build/torch27-cxx11-cu118-x86_64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_d4f4195
-ops = torch.ops._flash_mla_d4f4195
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_d4f4195::{op_name}"

build/torch27-cxx11-cu126-aarch64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch27-cxx11-cu126-aarch64-linux/flash_mla/_flash_mla_341ab77.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:fb925b062d31034672a45d925a3767d953e97a3c6c483467e6b81833d42b5a27
-size 2644048

build/torch27-cxx11-cu126-aarch64-linux/flash_mla/_ops.py DELETED Viewed

@@ -1,9 +0,0 @@
-import torch
-from . import _flash_mla_341ab77
-ops = torch.ops._flash_mla_341ab77
-def add_op_namespace_prefix(op_name: str):
-    """
-    Prefix op by namespace.
-    """
-    return f"_flash_mla_341ab77::{op_name}"

build/torch27-cxx11-cu126-x86_64-linux/flash_mla/__init__.py DELETED Viewed

@@ -1,33 +0,0 @@
-import torch
-from ._ops import ops
-def get_mla_metadata(seqlens_k: torch.Tensor, s_q: int, h_kv: int):
-    return ops.get_mla_metadata(seqlens_k, s_q, h_kv)
-def mha_fwd_kvcache_mla(
-    q: torch.Tensor,
-    kcache: torch.Tensor,
-    vcache_: torch.Tensor,
-    head_size_v: int,
-    seqlens_k: torch.Tensor,
-    block_table: torch.Tensor,
-    softmax_scale: float,
-    is_causal_: bool,
-    tile_scheduler_metadata: torch.Tensor,
-    num_splits: torch.Tensor,
-) -> torch.Tensor:
-    return ops.mha_fwd_kvcache_mla(
-        q,
-        kcache,
-        vcache_,
-        head_size_v,
-        seqlens_k,
-        block_table,
-        softmax_scale,
-        is_causal_,
-        tile_scheduler_metadata,
-        num_splits
-    )

build/torch27-cxx11-cu126-x86_64-linux/flash_mla/_flash_mla_d4f4195.abi3.so DELETED Viewed

@@ -1,3 +0,0 @@
-version https://git-lfs.github.com/spec/v1
-oid sha256:5db69ef4975e2eee001e6a9b7466c1fe40bc2228ed64eb8c24caf3e0fb6ed0b2
-size 2560584