File size: 263 Bytes
63f47f9
 
022db6b
 
 
 
 
 
 
 
 
 
63f47f9
1
2
3
4
5
6
7
8
9
10
11
12
13
{
  "stage": 2,
  "method": "KL distillation",
  "best_loss": 2.7305,
  "total_steps": 20000,
  "temperature": 2.0,
  "alpha": 0.7,
  "lr": 0.0005,
  "status": "COMPLETE",
  "teacher": "CohereLabs/tiny-aya-global",
  "student_params_m": 721.6,
  "languages": 67
}