100M_low_500_1208 / all_results.json
craa's picture
End of training
b134770 verified
raw
history blame contribute delete
485 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.3940823943098048,
"eval_loss": 3.3038175106048584,
"eval_runtime": 188.5528,
"eval_samples": 18011,
"eval_samples_per_second": 95.522,
"eval_steps_per_second": 5.972,
"perplexity": 27.216339520393753,
"total_flos": 7.7681598529536e+17,
"train_loss": 3.4615205547984353,
"train_runtime": 81693.8548,
"train_samples": 297298,
"train_samples_per_second": 36.392,
"train_steps_per_second": 1.137
}