File size: 274 Bytes
2d58dce
 
 
 
 
 
 
 
 
 
 
1
2
3
4
5
6
7
8
9
10
11
{
  "base_model": "/content/Qwen3-0.6B",
  "loop_window_size": 64,
  "num_layers": 28,
  "num_heads": 16,
  "head_dim": 128,
  "final_val_loss": 3.6202090362707775,
  "final_val_ppl": 37.34537124633789,
  "training_epochs": 3,
  "training_time_minutes": 38.990576179822284
}