File size: 161 Bytes
38afa82
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
{
  "n_layers": 3,
  "d_model": 768,
  "d_latent": 6144,
  "k": 48,
  "auxk": 192,
  "dead_steps_threshold": 2441,
  "auxk_coef": 0.03125,
  "alpha_spec": 0.01
}