Mark layers as supporting torch.compile
torch-ext/activation/layers.py (changed)
@@ -5,6 +5,8 @@ from ._ops import ops
 
 
 class SiluAndMul(nn.Module):
+    can_torch_compile: bool = True
+
     def forward(self, x: torch.Tensor):
         d = x.shape[-1] // 2
         output_shape = x.shape[:-1] + (d,)
@@ -14,6 +16,8 @@ class SiluAndMul(nn.Module):
 
 
 class GeluAndMul(nn.Module):
+    can_torch_compile: bool = True
+
     def forward(self, x: torch.Tensor):
         d = x.shape[-1] // 2
         output_shape = x.shape[:-1] + (d,)
@@ -23,6 +27,8 @@ class GeluAndMul(nn.Module):
 
 
 class GeluTanhAndMul(nn.Module):
+    can_torch_compile: bool = True
+
     def forward(self, x: torch.Tensor):
         d = x.shape[-1] // 2
         output_shape = x.shape[:-1] + (d,)
@@ -32,6 +38,8 @@ class GeluTanhAndMul(nn.Module):
 
 
 class FatreluAndMul(nn.Module):
+    can_torch_compile: bool = True
+
     def __init__(self, threshold: float = 0.0):
         super().__init__()
         self.threshold = threshold
@@ -45,6 +53,8 @@ class FatreluAndMul(nn.Module):
 
 
 class FastGELU(nn.Module):
+    can_torch_compile: bool = True
+
     def forward(self, x: torch.Tensor) -> torch.Tensor:
         out = torch.empty_like(x)
         ops.gelu_fast(out, x)
@@ -52,6 +62,8 @@ class FastGELU(nn.Module):
 
 
 class NewGELU(nn.Module):
+    can_torch_compile: bool = True
+
     def forward(self, x: torch.Tensor) -> torch.Tensor:
         out = torch.empty_like(x)
         ops.gelu_new(out, x)
@@ -59,6 +71,8 @@ class NewGELU(nn.Module):
 
 
 class QuickGELU(nn.Module):
+    can_torch_compile: bool = True
+
     def forward(self, x: torch.Tensor) -> torch.Tensor:
         out = torch.empty_like(x)
         ops.gelu_quick(out, x)
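A minimal usage sketch (not part of this commit): downstream code could key off the new can_torch_compile class attribute to decide whether to wrap a layer with torch.compile. The maybe_compile helper name and the getattr default below are illustrative assumptions, not an API defined by this repository.

import torch
from torch import nn

def maybe_compile(module: nn.Module) -> nn.Module:
    # can_torch_compile is the class attribute added in this commit;
    # modules that do not define it are conservatively left uncompiled.
    if getattr(module, "can_torch_compile", False):
        return torch.compile(module)
    return module

Since every layer in this file now sets can_torch_compile = True, a call like maybe_compile(SiluAndMul()) would return a torch.compile-wrapped module, while modules without the flag pass through unchanged.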