File size: 163 Bytes
3740525
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
{
  "n_nodes": 64,
  "d_model": 128,
  "n_heads": 4,
  "n_layers": 4,
  "d_ff": 512,
  "dropout": 0.1,
  "train_iters": 8,
  "rope_base": 10.0,
  "damping": 0.85
}