{ "epoch": 47.0, "eval_loss": 0.7128096222877502, "eval_runtime": 11.4031, "eval_samples_per_second": 160.307, "eval_steps_per_second": 5.086, "perplexity": 2.039714041484612, "total_flos": 2.5044104326938624e+16, "train_loss": 0.1997737506061201, "train_runtime": 1307.9406, "train_samples_per_second": 326.009, "train_steps_per_second": 10.207 }