togethercomputer
/

evo-1-131k-base

Text Generation

deep signal processing

Model card Files Files and versions

maxall4 committed on Nov 28, 2024

Commit

cd7d86b

·

verified ·

1 Parent(s): 5bbaeb8

Update model.py

Files changed (1) hide show

model.py +2 -2

model.py CHANGED Viewed

@@ -22,7 +22,7 @@ try:
 except ImportError:
     "could not import swap_mha_rope from positional_embeddings.py"
-from flashfftconv import FlashDepthwiseConv1d
 # dummy import to force huggingface to bundle the tokenizer
 from .tokenizer import ByteTokenizer
@@ -122,7 +122,7 @@ class ParallelHyenaFilter(nn.Module):
         self.data_dtype = None
         if self.use_flash_depthwise:
-            self.fir_fn = FlashDepthwiseConv1d(
                 channels=3 * self.hidden_size,
                 kernel_size=self.short_filter_length,
                 padding=self.short_filter_length - 1,

 except ImportError:
     "could not import swap_mha_rope from positional_embeddings.py"
+from flashfftconv import FlashDepthWiseConv1d
 # dummy import to force huggingface to bundle the tokenizer
 from .tokenizer import ByteTokenizer
         self.data_dtype = None
         if self.use_flash_depthwise:
+            self.fir_fn = FlashDepthWiseConv1d(
                 channels=3 * self.hidden_size,
                 kernel_size=self.short_filter_length,
                 padding=self.short_filter_length - 1,