goodarzilab
/

decodon-200M-euk

Text Generation

Model card Files Files and versions

mohsennp committed on Oct 20, 2024

Commit

8e2efae

·

verified ·

1 Parent(s): 4b2b63f

Upload DeCodon

Files changed (1) hide show

modeling_decodon.py +1 -1

modeling_decodon.py CHANGED Viewed

@@ -629,7 +629,7 @@ class MultiHeadedSelfAttention(nn.Module):
             attention_probs = attention_scores.softmax(dim=-1)
             attention_probs = self.dropout(attention_probs)
-            x = einsum(attention_probs, v, "b h q k, b v h d -> b q h d")
         x = rearrange(x, "b q h d -> b q (h d)", h=self.num_heads)

             attention_probs = attention_scores.softmax(dim=-1)
             attention_probs = self.dropout(attention_probs)
+            x = einsum(attention_probs, v, "b h q k, b k h d -> b q h d")
         x = rearrange(x, "b q h d -> b q (h d)", h=self.num_heads)