davda54 committed on
Commit
37fc2ed
·
verified ·
1 Parent(s): 60e56bf
Files changed (1) hide show
  1. modeling_gptbert.py +1 -1
modeling_gptbert.py CHANGED
@@ -306,7 +306,7 @@ class SelfAttention(nn.Module):
306
  self.d_qk = config.query_key_head_size
307
  self.d_v = config.value_head_size
308
  self.num_attention_heads = config.num_attention_heads
309
- self.num_kv_heads = config.num_kv_heads
310
  self.hidden_size = config.hidden_size
311
 
312
  self.q_out_dim = self.d_qk * self.num_attention_heads
 
306
  self.d_qk = config.query_key_head_size
307
  self.d_v = config.value_head_size
308
  self.num_attention_heads = config.num_attention_heads
309
+ self.num_kv_heads = config.num_attention_heads
310
  self.hidden_size = config.hidden_size
311
 
312
  self.q_out_dim = self.d_qk * self.num_attention_heads