File size: 327 Bytes
baa2ef6
 
 
 
 
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
12
13
14
15
{
  "max_seq_len": 1024,
  "d_model": 768,
  "n_layers": 12,
  "n_heads": 12,
  "use_padded_vocab_size": true,
  "use_rope": true,
  "rope_theta": 10000.0,
  "is_rope_full_precision": true,
  "embd_dropout_p": 0.0,
  "attn_dropout_p": 0.0,
  "residual_dropout_p": 0.0,
  "init_std": 0.02,
  "init_residual_scaled_factor": 2.0
}