100M_low_0_634 / all_results.json
craa's picture
End of training
b8dee87 verified
raw
history blame contribute delete
486 Bytes
{
"epoch": 10.0,
"eval_accuracy": 0.39444659878975896,
"eval_loss": 3.3022682666778564,
"eval_runtime": 180.2938,
"eval_samples": 18011,
"eval_samples_per_second": 99.898,
"eval_steps_per_second": 6.245,
"perplexity": 27.174207416556534,
"total_flos": 7.7681859821568e+17,
"train_loss": 3.4581149110803304,
"train_runtime": 79999.4738,
"train_samples": 297299,
"train_samples_per_second": 37.163,
"train_steps_per_second": 1.161
}