100M_low_0_1208 / all_results.json
craa's picture
End of training
a285683 verified
raw
history blame contribute delete
482 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.3943069798289173,
"eval_loss": 3.30434513092041,
"eval_runtime": 181.0661,
"eval_samples": 18011,
"eval_samples_per_second": 99.472,
"eval_steps_per_second": 6.219,
"perplexity": 27.230703202991823,
"total_flos": 7.7681859821568e+17,
"train_loss": 3.454896697509457,
"train_runtime": 79880.5297,
"train_samples": 297299,
"train_samples_per_second": 37.218,
"train_steps_per_second": 1.163
}