{ "epoch": 38.0, "eval_loss": 0.5203976631164551, "eval_runtime": 9.8245, "eval_samples_per_second": 161.535, "eval_steps_per_second": 5.089, "perplexity": 1.6826966630681837, "total_flos": 1.886593281372979e+16, "train_loss": 0.15147609674822032, "train_runtime": 971.6736, "train_samples_per_second": 389.74, "train_steps_per_second": 12.195 }