Kernels:

kernels-community
/

rotary

Trusted publisher

Kernel card Files Files and versions

xet

Community

kernels-bot committed on 6 days ago

Commit

79a3cae

verified ·

1 Parent(s): 18186f3

Uploaded using `kernel-builder`.

Browse files

Files changed (44) hide show

build/torch210-cxx11-cu126-x86_64-linux/_ops.py +3 -3
build/torch210-cxx11-cu126-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} +1 -1
build/torch210-cxx11-cu126-x86_64-linux/metadata.json +1 -1
build/torch210-cxx11-cu128-x86_64-linux/_ops.py +3 -3
build/torch210-cxx11-cu128-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} +1 -1
build/torch210-cxx11-cu128-x86_64-linux/metadata.json +1 -1
build/torch210-cxx11-cu130-x86_64-linux/_ops.py +3 -3
build/torch210-cxx11-cu130-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} +1 -1
build/torch210-cxx11-cu130-x86_64-linux/metadata.json +1 -1
build/torch210-cxx11-xpu20253-x86_64-linux/_ops.py +3 -3
build/{torch211-cxx11-xpu20253-x86_64-linux/_rotary_xpu_86f75d9.abi3.so → torch210-cxx11-xpu20253-x86_64-linux/_rotary_xpu_725ebfc.abi3.so} +1 -1
build/torch210-cxx11-xpu20253-x86_64-linux/metadata.json +1 -1
build/torch211-cxx11-cu126-x86_64-linux/_ops.py +3 -3
build/torch211-cxx11-cu126-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} +1 -1
build/torch211-cxx11-cu126-x86_64-linux/metadata.json +1 -1
build/torch211-cxx11-cu128-x86_64-linux/_ops.py +3 -3
build/torch211-cxx11-cu128-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} +1 -1
build/torch211-cxx11-cu128-x86_64-linux/metadata.json +1 -1
build/torch211-cxx11-cu130-x86_64-linux/_ops.py +3 -3
build/torch211-cxx11-cu130-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} +1 -1
build/torch211-cxx11-cu130-x86_64-linux/metadata.json +1 -1
build/torch211-cxx11-xpu20253-x86_64-linux/_ops.py +3 -3
build/{torch210-cxx11-xpu20253-x86_64-linux/_rotary_xpu_86f75d9.abi3.so → torch211-cxx11-xpu20253-x86_64-linux/_rotary_xpu_725ebfc.abi3.so} +1 -1
build/torch211-cxx11-xpu20253-x86_64-linux/metadata.json +1 -1
build/torch212-cxx11-cu126-x86_64-linux/__init__.py +52 -0
build/torch212-cxx11-cu126-x86_64-linux/_ops.py +9 -0
build/torch212-cxx11-cu126-x86_64-linux/_rotary_cuda_725ebfc.abi3.so +3 -0
build/torch212-cxx11-cu126-x86_64-linux/metadata.json +20 -0
build/torch212-cxx11-cu126-x86_64-linux/rotary/__init__.py +26 -0
build/torch212-cxx11-cu130-x86_64-linux/__init__.py +52 -0
build/torch212-cxx11-cu130-x86_64-linux/_ops.py +9 -0
build/torch212-cxx11-cu130-x86_64-linux/_rotary_cuda_725ebfc.abi3.so +3 -0
build/torch212-cxx11-cu130-x86_64-linux/metadata.json +21 -0
build/torch212-cxx11-cu130-x86_64-linux/rotary/__init__.py +26 -0
build/torch212-cxx11-cu132-x86_64-linux/__init__.py +52 -0
build/torch212-cxx11-cu132-x86_64-linux/_ops.py +9 -0
build/torch212-cxx11-cu132-x86_64-linux/_rotary_cuda_725ebfc.abi3.so +3 -0
build/torch212-cxx11-cu132-x86_64-linux/metadata.json +21 -0
build/torch212-cxx11-cu132-x86_64-linux/rotary/__init__.py +26 -0
build/torch212-cxx11-xpu20253-x86_64-linux/__init__.py +52 -0
build/torch212-cxx11-xpu20253-x86_64-linux/_ops.py +9 -0
build/torch212-cxx11-xpu20253-x86_64-linux/_rotary_xpu_725ebfc.abi3.so +3 -0
build/torch212-cxx11-xpu20253-x86_64-linux/metadata.json +10 -0
build/torch212-cxx11-xpu20253-x86_64-linux/rotary/__init__.py +26 -0

build/torch210-cxx11-cu126-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_cuda_86f75d9
-ops = torch.ops._rotary_cuda_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_cuda_86f75d9::{op_name}"

 import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch210-cxx11-cu126-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:b1d5394246163c10eb12e82bd4151ef5f26044ebef06ff6eb978204ce9569fe4
 size 8200568

 version https://git-lfs.github.com/spec/v1
+oid sha256:39d341299aaec16caebbdebde5fa235e8d2fe93304f64f39d5d25aca27bb1e47
 size 8200568

build/torch210-cxx11-cu126-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_cuda_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch210-cxx11-cu128-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_cuda_86f75d9
-ops = torch.ops._rotary_cuda_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_cuda_86f75d9::{op_name}"

 import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch210-cxx11-cu128-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2776016e55fced29f3f7da4592a64690abc7d13f13a1abeb97d0e5ac0ae79570
 size 11905904

 version https://git-lfs.github.com/spec/v1
+oid sha256:cc218cdb6a055456094a6f518d2f3b43fb1a0d516907cc8dedee3d6511b3217b
 size 11905904

build/torch210-cxx11-cu128-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_cuda_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch210-cxx11-cu130-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_cuda_86f75d9
-ops = torch.ops._rotary_cuda_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_cuda_86f75d9::{op_name}"

 import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch210-cxx11-cu130-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:d48e50159c8070fad7389d57fd8a828ae09b0bf7c7823d9ce175e60a68d04321
 size 10307160

 version https://git-lfs.github.com/spec/v1
+oid sha256:51653f32f84e840f9e7182eb129bf31e528c513d59802f8560909cfcc3707b85
 size 10307160

build/torch210-cxx11-cu130-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_cuda_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch210-cxx11-xpu20253-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_xpu_86f75d9
-ops = torch.ops._rotary_xpu_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_xpu_86f75d9::{op_name}"

 import torch
+from . import _rotary_xpu_725ebfc
+ops = torch.ops._rotary_xpu_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_xpu_725ebfc::{op_name}"

build/{torch211-cxx11-xpu20253-x86_64-linux/_rotary_xpu_86f75d9.abi3.so → torch210-cxx11-xpu20253-x86_64-linux/_rotary_xpu_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:2e78d1a36648ffeaa4835901d94e93de2d1439fedd504345d71984fc5cbfebd0
 size 2301504

 version https://git-lfs.github.com/spec/v1
+oid sha256:c1a6425022ede63a5cdaa95626f393fde741b34037d7bd588044d324c64a0588
 size 2301504

build/torch210-cxx11-xpu20253-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_xpu_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_xpu_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch211-cxx11-cu126-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_cuda_86f75d9
-ops = torch.ops._rotary_cuda_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_cuda_86f75d9::{op_name}"

 import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch211-cxx11-cu126-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:dcafe175d2f5a54a5133884109c478238dfe9000f178a317d27881b5b32e168d
 size 8193600

 version https://git-lfs.github.com/spec/v1
+oid sha256:7b43b3223ec25d835af8c4020d87eca05c60efc111211a2a7196c3d692e77179
 size 8193600

build/torch211-cxx11-cu126-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_cuda_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch211-cxx11-cu128-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_cuda_86f75d9
-ops = torch.ops._rotary_cuda_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_cuda_86f75d9::{op_name}"

 import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch211-cxx11-cu128-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:04ea5f41dc222373c069accb827df58ab6156edba6e2684fd5ebd6b1ec2993ce
 size 11894840

 version https://git-lfs.github.com/spec/v1
+oid sha256:3037fcf467a2bddcc34cfa70d188ae2ed190a87c6b56818f20c0c39b9bc2342f
 size 11894840

build/torch211-cxx11-cu128-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_cuda_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch211-cxx11-cu130-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_cuda_86f75d9
-ops = torch.ops._rotary_cuda_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_cuda_86f75d9::{op_name}"

 import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch211-cxx11-cu130-x86_64-linux/{_rotary_cuda_86f75d9.abi3.so → _rotary_cuda_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:81f997832b95bdd5bfd0d0ce46ef13f910345b0c47ae163431b8ecde7947482d
 size 10296096

 version https://git-lfs.github.com/spec/v1
+oid sha256:5d95c0078ab5f1e7462f6b607890d58044d40bd02a5ecd749c9e6cac33424faf
 size 10296096

build/torch211-cxx11-cu130-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_cuda_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch211-cxx11-xpu20253-x86_64-linux/_ops.py CHANGED Viewed

@@ -1,9 +1,9 @@
 import torch
-from . import _rotary_xpu_86f75d9
-ops = torch.ops._rotary_xpu_86f75d9
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
-    return f"_rotary_xpu_86f75d9::{op_name}"

 import torch
+from . import _rotary_xpu_725ebfc
+ops = torch.ops._rotary_xpu_725ebfc
 def add_op_namespace_prefix(op_name: str):
     """
     Prefix op by namespace.
     """
+    return f"_rotary_xpu_725ebfc::{op_name}"

build/{torch210-cxx11-xpu20253-x86_64-linux/_rotary_xpu_86f75d9.abi3.so → torch211-cxx11-xpu20253-x86_64-linux/_rotary_xpu_725ebfc.abi3.so} RENAMED Viewed

@@ -1,3 +1,3 @@
 version https://git-lfs.github.com/spec/v1
-oid sha256:31984c0927a018a70c49d356690a4cd08f39ec0109f6a5a440e93f05bd6da25e
 size 2301504

 version https://git-lfs.github.com/spec/v1
+oid sha256:8482e87f3cb8d30070a9367ea2d01398497f52fc7e2369db3d763118c3c92566
 size 2301504

build/torch211-cxx11-xpu20253-x86_64-linux/metadata.json CHANGED Viewed

@@ -1,6 +1,6 @@
 {
   "name": "rotary",
-  "id": "_rotary_xpu_86f75d9",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

 {
   "name": "rotary",
+  "id": "_rotary_xpu_725ebfc",
   "version": 1,
   "license": "BSD-3-Clause",
   "python-depends": [],

build/torch212-cxx11-cu126-x86_64-linux/__init__.py ADDED Viewed

	@@ -0,0 +1,52 @@

+from typing import Optional, Tuple
+import torch
+from ._ops import ops
+def apply_rotary(
+    x1: torch.Tensor,
+    x2: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    out1: torch.Tensor,
+    out2: torch.Tensor,
+    conj: bool,
+) -> None:
+    ops.apply_rotary(x1, x2, cos, sin, out1, out2, conj)
+def apply_rotary_transformers(
+    q: torch.Tensor,
+    k: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    unsqueeze_dim: int = 1,
+) -> Tuple[torch.Tensor, torch.Tensor]:
+    """
+    Rotary kernel implementation wrapper
+    Adapts rotary kernel implementation to match transformers apply_rotary_pos_emb signature
+    """
+    cos = cos.unsqueeze(unsqueeze_dim)
+    sin = sin.unsqueeze(unsqueeze_dim)
+    q_rotated = q.clone()
+    k_rotated = k.clone()
+    # Get half dimension for rotation
+    half_dim = q.shape[-1] // 2
+    q1 = q_rotated[..., :half_dim]
+    q2 = q_rotated[..., half_dim:]
+    k1 = k_rotated[..., :half_dim]
+    k2 = k_rotated[..., half_dim:]
+    if cos.shape[-1] != half_dim:
+        # Trim cos/sin to match half_dim
+        cos = cos[..., :half_dim]
+        sin = sin[..., :half_dim]
+    apply_rotary(q1, q2, cos, sin, q1, q2, False)
+    apply_rotary(k1, k2, cos, sin, k1, k2, False)
+    return q_rotated, k_rotated
+__all__ = ["apply_rotary", "apply_rotary_transformers"]

build/torch212-cxx11-cu126-x86_64-linux/_ops.py ADDED Viewed

	@@ -0,0 +1,9 @@

+import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
+def add_op_namespace_prefix(op_name: str):
+    """
+    Prefix op by namespace.
+    """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch212-cxx11-cu126-x86_64-linux/_rotary_cuda_725ebfc.abi3.so ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:b7e9bd09e74ab8c1a7468d01fc6c21185ef9fce899f24e020d09c17e8cfe4a08
+size 8195384

build/torch212-cxx11-cu126-x86_64-linux/metadata.json ADDED Viewed

	@@ -0,0 +1,20 @@

+{
+  "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
+  "version": 1,
+  "license": "BSD-3-Clause",
+  "python-depends": [],
+  "backend": {
+    "type": "cuda",
+    "archs": [
+      "7.0",
+      "7.2",
+      "7.5",
+      "8.0",
+      "8.6",
+      "8.7",
+      "8.9",
+      "9.0+PTX"
+    ]
+  }
+}

build/torch212-cxx11-cu126-x86_64-linux/rotary/__init__.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import ctypes
+import importlib.util
+import sys
+from pathlib import Path
+from types import ModuleType
+def _import_from_path(file_path: Path) -> ModuleType:
+    # We cannot use the module name as-is, after adding it to `sys.modules`,
+    # it would also be used for other imports. So, we make a module name that
+    # depends on the path for it to be unique using the hex-encoded hash of
+    # the path.
+    path_hash = "{:x}".format(ctypes.c_size_t(hash(file_path.absolute())).value)
+    module_name = path_hash
+    spec = importlib.util.spec_from_file_location(module_name, file_path)
+    if spec is None:
+        raise ImportError(f"Cannot load spec for {module_name} from {file_path}")
+    module = importlib.util.module_from_spec(spec)
+    if module is None:
+        raise ImportError(f"Cannot load module {module_name} from spec")
+    sys.modules[module_name] = module
+    spec.loader.exec_module(module)  # type: ignore
+    return module
+globals().update(vars(_import_from_path(Path(__file__).parent.parent / "__init__.py")))

build/torch212-cxx11-cu130-x86_64-linux/__init__.py ADDED Viewed

	@@ -0,0 +1,52 @@

+from typing import Optional, Tuple
+import torch
+from ._ops import ops
+def apply_rotary(
+    x1: torch.Tensor,
+    x2: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    out1: torch.Tensor,
+    out2: torch.Tensor,
+    conj: bool,
+) -> None:
+    ops.apply_rotary(x1, x2, cos, sin, out1, out2, conj)
+def apply_rotary_transformers(
+    q: torch.Tensor,
+    k: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    unsqueeze_dim: int = 1,
+) -> Tuple[torch.Tensor, torch.Tensor]:
+    """
+    Rotary kernel implementation wrapper
+    Adapts rotary kernel implementation to match transformers apply_rotary_pos_emb signature
+    """
+    cos = cos.unsqueeze(unsqueeze_dim)
+    sin = sin.unsqueeze(unsqueeze_dim)
+    q_rotated = q.clone()
+    k_rotated = k.clone()
+    # Get half dimension for rotation
+    half_dim = q.shape[-1] // 2
+    q1 = q_rotated[..., :half_dim]
+    q2 = q_rotated[..., half_dim:]
+    k1 = k_rotated[..., :half_dim]
+    k2 = k_rotated[..., half_dim:]
+    if cos.shape[-1] != half_dim:
+        # Trim cos/sin to match half_dim
+        cos = cos[..., :half_dim]
+        sin = sin[..., :half_dim]
+    apply_rotary(q1, q2, cos, sin, q1, q2, False)
+    apply_rotary(k1, k2, cos, sin, k1, k2, False)
+    return q_rotated, k_rotated
+__all__ = ["apply_rotary", "apply_rotary_transformers"]

build/torch212-cxx11-cu130-x86_64-linux/_ops.py ADDED Viewed

	@@ -0,0 +1,9 @@

+import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
+def add_op_namespace_prefix(op_name: str):
+    """
+    Prefix op by namespace.
+    """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch212-cxx11-cu130-x86_64-linux/_rotary_cuda_725ebfc.abi3.so ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:720b8c363ad2feaeda8476661c5627265524b8cd704a1b5f4c7946ef9e2d0c9c
+size 10301968

build/torch212-cxx11-cu130-x86_64-linux/metadata.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
+  "version": 1,
+  "license": "BSD-3-Clause",
+  "python-depends": [],
+  "backend": {
+    "type": "cuda",
+    "archs": [
+      "10.0",
+      "11.0",
+      "12.0+PTX",
+      "7.5",
+      "8.0",
+      "8.6",
+      "8.7",
+      "8.9",
+      "9.0"
+    ]
+  }
+}

build/torch212-cxx11-cu130-x86_64-linux/rotary/__init__.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import ctypes
+import importlib.util
+import sys
+from pathlib import Path
+from types import ModuleType
+def _import_from_path(file_path: Path) -> ModuleType:
+    # We cannot use the module name as-is, after adding it to `sys.modules`,
+    # it would also be used for other imports. So, we make a module name that
+    # depends on the path for it to be unique using the hex-encoded hash of
+    # the path.
+    path_hash = "{:x}".format(ctypes.c_size_t(hash(file_path.absolute())).value)
+    module_name = path_hash
+    spec = importlib.util.spec_from_file_location(module_name, file_path)
+    if spec is None:
+        raise ImportError(f"Cannot load spec for {module_name} from {file_path}")
+    module = importlib.util.module_from_spec(spec)
+    if module is None:
+        raise ImportError(f"Cannot load module {module_name} from spec")
+    sys.modules[module_name] = module
+    spec.loader.exec_module(module)  # type: ignore
+    return module
+globals().update(vars(_import_from_path(Path(__file__).parent.parent / "__init__.py")))

build/torch212-cxx11-cu132-x86_64-linux/__init__.py ADDED Viewed

	@@ -0,0 +1,52 @@

+from typing import Optional, Tuple
+import torch
+from ._ops import ops
+def apply_rotary(
+    x1: torch.Tensor,
+    x2: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    out1: torch.Tensor,
+    out2: torch.Tensor,
+    conj: bool,
+) -> None:
+    ops.apply_rotary(x1, x2, cos, sin, out1, out2, conj)
+def apply_rotary_transformers(
+    q: torch.Tensor,
+    k: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    unsqueeze_dim: int = 1,
+) -> Tuple[torch.Tensor, torch.Tensor]:
+    """
+    Rotary kernel implementation wrapper
+    Adapts rotary kernel implementation to match transformers apply_rotary_pos_emb signature
+    """
+    cos = cos.unsqueeze(unsqueeze_dim)
+    sin = sin.unsqueeze(unsqueeze_dim)
+    q_rotated = q.clone()
+    k_rotated = k.clone()
+    # Get half dimension for rotation
+    half_dim = q.shape[-1] // 2
+    q1 = q_rotated[..., :half_dim]
+    q2 = q_rotated[..., half_dim:]
+    k1 = k_rotated[..., :half_dim]
+    k2 = k_rotated[..., half_dim:]
+    if cos.shape[-1] != half_dim:
+        # Trim cos/sin to match half_dim
+        cos = cos[..., :half_dim]
+        sin = sin[..., :half_dim]
+    apply_rotary(q1, q2, cos, sin, q1, q2, False)
+    apply_rotary(k1, k2, cos, sin, k1, k2, False)
+    return q_rotated, k_rotated
+__all__ = ["apply_rotary", "apply_rotary_transformers"]

build/torch212-cxx11-cu132-x86_64-linux/_ops.py ADDED Viewed

	@@ -0,0 +1,9 @@

+import torch
+from . import _rotary_cuda_725ebfc
+ops = torch.ops._rotary_cuda_725ebfc
+def add_op_namespace_prefix(op_name: str):
+    """
+    Prefix op by namespace.
+    """
+    return f"_rotary_cuda_725ebfc::{op_name}"

build/torch212-cxx11-cu132-x86_64-linux/_rotary_cuda_725ebfc.abi3.so ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:eb233b9be14a2d9c5bbb7b860973db6dd48aad4f5b760dd358880d079bff3b23
+size 10490208

build/torch212-cxx11-cu132-x86_64-linux/metadata.json ADDED Viewed

	@@ -0,0 +1,21 @@

+{
+  "name": "rotary",
+  "id": "_rotary_cuda_725ebfc",
+  "version": 1,
+  "license": "BSD-3-Clause",
+  "python-depends": [],
+  "backend": {
+    "type": "cuda",
+    "archs": [
+      "10.0",
+      "11.0",
+      "12.0+PTX",
+      "7.5",
+      "8.0",
+      "8.6",
+      "8.7",
+      "8.9",
+      "9.0"
+    ]
+  }
+}

build/torch212-cxx11-cu132-x86_64-linux/rotary/__init__.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import ctypes
+import importlib.util
+import sys
+from pathlib import Path
+from types import ModuleType
+def _import_from_path(file_path: Path) -> ModuleType:
+    # We cannot use the module name as-is, after adding it to `sys.modules`,
+    # it would also be used for other imports. So, we make a module name that
+    # depends on the path for it to be unique using the hex-encoded hash of
+    # the path.
+    path_hash = "{:x}".format(ctypes.c_size_t(hash(file_path.absolute())).value)
+    module_name = path_hash
+    spec = importlib.util.spec_from_file_location(module_name, file_path)
+    if spec is None:
+        raise ImportError(f"Cannot load spec for {module_name} from {file_path}")
+    module = importlib.util.module_from_spec(spec)
+    if module is None:
+        raise ImportError(f"Cannot load module {module_name} from spec")
+    sys.modules[module_name] = module
+    spec.loader.exec_module(module)  # type: ignore
+    return module
+globals().update(vars(_import_from_path(Path(__file__).parent.parent / "__init__.py")))

build/torch212-cxx11-xpu20253-x86_64-linux/__init__.py ADDED Viewed

	@@ -0,0 +1,52 @@

+from typing import Optional, Tuple
+import torch
+from ._ops import ops
+def apply_rotary(
+    x1: torch.Tensor,
+    x2: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    out1: torch.Tensor,
+    out2: torch.Tensor,
+    conj: bool,
+) -> None:
+    ops.apply_rotary(x1, x2, cos, sin, out1, out2, conj)
+def apply_rotary_transformers(
+    q: torch.Tensor,
+    k: torch.Tensor,
+    cos: torch.Tensor,
+    sin: torch.Tensor,
+    unsqueeze_dim: int = 1,
+) -> Tuple[torch.Tensor, torch.Tensor]:
+    """
+    Rotary kernel implementation wrapper
+    Adapts rotary kernel implementation to match transformers apply_rotary_pos_emb signature
+    """
+    cos = cos.unsqueeze(unsqueeze_dim)
+    sin = sin.unsqueeze(unsqueeze_dim)
+    q_rotated = q.clone()
+    k_rotated = k.clone()
+    # Get half dimension for rotation
+    half_dim = q.shape[-1] // 2
+    q1 = q_rotated[..., :half_dim]
+    q2 = q_rotated[..., half_dim:]
+    k1 = k_rotated[..., :half_dim]
+    k2 = k_rotated[..., half_dim:]
+    if cos.shape[-1] != half_dim:
+        # Trim cos/sin to match half_dim
+        cos = cos[..., :half_dim]
+        sin = sin[..., :half_dim]
+    apply_rotary(q1, q2, cos, sin, q1, q2, False)
+    apply_rotary(k1, k2, cos, sin, k1, k2, False)
+    return q_rotated, k_rotated
+__all__ = ["apply_rotary", "apply_rotary_transformers"]

build/torch212-cxx11-xpu20253-x86_64-linux/_ops.py ADDED Viewed

	@@ -0,0 +1,9 @@

+import torch
+from . import _rotary_xpu_725ebfc
+ops = torch.ops._rotary_xpu_725ebfc
+def add_op_namespace_prefix(op_name: str):
+    """
+    Prefix op by namespace.
+    """
+    return f"_rotary_xpu_725ebfc::{op_name}"

build/torch212-cxx11-xpu20253-x86_64-linux/_rotary_xpu_725ebfc.abi3.so ADDED Viewed

	@@ -0,0 +1,3 @@

+version https://git-lfs.github.com/spec/v1
+oid sha256:42a11c6606ad23c9cd2f3e8dff22be3a2349efefff46a1e42cb87f7785b7fcb6
+size 2301512

build/torch212-cxx11-xpu20253-x86_64-linux/metadata.json ADDED Viewed

	@@ -0,0 +1,10 @@

+{
+  "name": "rotary",
+  "id": "_rotary_xpu_725ebfc",
+  "version": 1,
+  "license": "BSD-3-Clause",
+  "python-depends": [],
+  "backend": {
+    "type": "xpu"
+  }
+}

build/torch212-cxx11-xpu20253-x86_64-linux/rotary/__init__.py ADDED Viewed

	@@ -0,0 +1,26 @@

+import ctypes
+import importlib.util
+import sys
+from pathlib import Path
+from types import ModuleType
+def _import_from_path(file_path: Path) -> ModuleType:
+    # We cannot use the module name as-is, after adding it to `sys.modules`,
+    # it would also be used for other imports. So, we make a module name that
+    # depends on the path for it to be unique using the hex-encoded hash of
+    # the path.
+    path_hash = "{:x}".format(ctypes.c_size_t(hash(file_path.absolute())).value)
+    module_name = path_hash
+    spec = importlib.util.spec_from_file_location(module_name, file_path)
+    if spec is None:
+        raise ImportError(f"Cannot load spec for {module_name} from {file_path}")
+    module = importlib.util.module_from_spec(spec)
+    if module is None:
+        raise ImportError(f"Cannot load module {module_name} from spec")
+    sys.modules[module_name] = module
+    spec.loader.exec_module(module)  # type: ignore
+    return module
+globals().update(vars(_import_from_path(Path(__file__).parent.parent / "__init__.py")))