Upload DeCodon
Browse files
- modeling_decodon.py +1 -1
modeling_decodon.py
CHANGED
|
@@ -629,7 +629,7 @@ class MultiHeadedSelfAttention(nn.Module):
|
|
| 629 |
attention_probs = attention_scores.softmax(dim=-1)
|
| 630 |
attention_probs = self.dropout(attention_probs)
|
| 631 |
|
| 632 |
-
x = einsum(attention_probs, v, "b h q k, b … [removed line truncated in this diff view]
|
| 633 |
|
| 634 |
x = rearrange(x, "b q h d -> b q (h d)", h=self.num_heads)
|
| 635 |
|
|
|
|
| 629 |
attention_probs = attention_scores.softmax(dim=-1)
|
| 630 |
attention_probs = self.dropout(attention_probs)
|
| 631 |
|
| 632 |
+
x = einsum(attention_probs, v, "b h q k, b k h d -> b q h d")
|
| 633 |
|
| 634 |
x = rearrange(x, "b q h d -> b q (h d)", h=self.num_heads)
|
| 635 |
|