df26a75
1
2
3
4
5
6
{ "step": 40, "eval_sparse_kl": 0.0796971321105957, "teacher": "Qwen/Qwen3.5-35B-A3B", "data_position": 2204 }