train_math_qa_123_1760637721 / all_results.json
rbelanec's picture
End of training
107f0f2 verified
{
"epoch": 20.0,
"eval_loss": 0.7989339828491211,
"eval_runtime": 70.5638,
"eval_samples_per_second": 42.288,
"eval_steps_per_second": 10.572,
"num_input_tokens_seen": 77961608,
"total_flos": 3.5105759720879555e+18,
"train_loss": 0.8024387844978857,
"train_runtime": 29897.2604,
"train_samples_per_second": 17.964,
"train_steps_per_second": 4.491
}