{ "epoch": 24.0, "eval_loss": 0.6872262954711914, "eval_runtime": 1.8886, "eval_samples_per_second": 559.678, "eval_steps_per_second": 70.423, "perplexity": 1.9881932176157675, "total_flos": 7672437924691968.0, "train_loss": 0.7372308338926138, "train_runtime": 572.2889, "train_samples_per_second": 426.096, "train_steps_per_second": 53.295 }