{ "epoch": 31.0, "eval_loss": 0.6716023087501526, "eval_runtime": 232.3059, "eval_samples_per_second": 160.323, "eval_steps_per_second": 5.011, "perplexity": 1.9573711221830141, "total_flos": 3.528546650263388e+17, "train_loss": 0.17647521918996942, "train_runtime": 17128.7716, "train_samples_per_second": 506.884, "train_steps_per_second": 15.842 }