chchen's picture
End of training
7be65ec verified
{
"epoch": 4.938271604938271,
"total_flos": 1.7255774630530253e+17,
"train_loss": 0.07573245613276959,
"train_runtime": 5157.9329,
"train_samples_per_second": 0.393,
"train_steps_per_second": 0.024
}