{ "epoch": 29.0, "eval_loss": 0.4475274682044983, "eval_runtime": 362.3481, "eval_samples_per_second": 157.114, "eval_steps_per_second": 4.912, "perplexity": 1.5644392736681412, "total_flos": 5.058807603414958e+17, "train_loss": 0.11824046083851339, "train_runtime": 25872.5126, "train_samples_per_second": 514.295, "train_steps_per_second": 16.073 }