T5La-Large / all_results.json
hrezaei's picture
End of training
5354973
{
"epoch": 1.04632568359375,
"eval_accuracy": 0.04088023483365949,
"eval_loss": 6.392906188964844,
"eval_runtime": 244.4224,
"eval_samples": 10000,
"eval_samples_per_second": 40.913,
"eval_steps_per_second": 10.228,
"perplexity": 597.5907702266671,
"total_flos": 5.045399375119909e+18,
"train_loss": 6.577412648592144,
"train_runtime": 154506.2809,
"train_samples": 2000000,
"train_samples_per_second": 13.573,
"train_steps_per_second": 3.393
}