craa's picture
End of training
666b0cb verified
{
"epoch": 28.812761993479274,
"eval_accuracy": 0.3695037327259836,
"eval_loss": 3.558704137802124,
"eval_runtime": 53.8711,
"eval_samples": 16651,
"eval_samples_per_second": 309.09,
"eval_steps_per_second": 19.324,
"perplexity": 35.11765999847565,
"total_flos": 2.068898812526592e+18,
"train_loss": 3.3939504055447047,
"train_runtime": 44109.3766,
"train_samples": 274807,
"train_samples_per_second": 311.506,
"train_steps_per_second": 3.895
}