100M_low_100_495 / all_results.json
craa's picture
End of training
669df97 verified
raw
history blame contribute delete
482 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.3939788481077176,
"eval_loss": 3.305659294128418,
"eval_runtime": 184.1966,
"eval_samples": 18011,
"eval_samples_per_second": 97.781,
"eval_steps_per_second": 6.113,
"perplexity": 27.26651231562494,
"total_flos": 7.7681075945472e+17,
"train_loss": 3.458772770117256,
"train_runtime": 79806.4071,
"train_samples": 297296,
"train_samples_per_second": 37.252,
"train_steps_per_second": 1.164
}