mohsennp committed on
Commit
8e2efae
·
verified ·
1 Parent(s): 4b2b63f

Upload DeCodon

Browse files
Files changed (1) hide show
  1. modeling_decodon.py +1 -1
modeling_decodon.py CHANGED
@@ -629,7 +629,7 @@ class MultiHeadedSelfAttention(nn.Module):
629
  attention_probs = attention_scores.softmax(dim=-1)
630
  attention_probs = self.dropout(attention_probs)
631
 
632
- x = einsum(attention_probs, v, "b h q k, b v h d -> b q h d")
633
 
634
  x = rearrange(x, "b q h d -> b q (h d)", h=self.num_heads)
635
 
 
629
  attention_probs = attention_scores.softmax(dim=-1)
630
  attention_probs = self.dropout(attention_probs)
631
 
632
+ x = einsum(attention_probs, v, "b h q k, b k h d -> b q h d")
633
 
634
  x = rearrange(x, "b q h d -> b q (h d)", h=self.num_heads)
635