rbelanec's picture
End of training
a1c4065 verified
{
"epoch": 20.0,
"eval_loss": 0.46720752120018005,
"eval_runtime": 11.6787,
"eval_samples_per_second": 72.611,
"eval_steps_per_second": 18.153,
"num_input_tokens_seen": 24964664,
"total_flos": 1.1263464338822922e+18,
"train_loss": 0.18866363030058317,
"train_runtime": 8637.5215,
"train_samples_per_second": 17.665,
"train_steps_per_second": 4.418
}