{ "epoch": 25.0, "eval_accuracy": 0.15245521839859863, "eval_loss": 7.787292003631592, "eval_runtime": 0.7336, "eval_samples": 479, "eval_samples_per_second": 652.912, "eval_steps_per_second": 6.815, "perplexity": 2409.783054689172, "total_flos": 3.049796905526016e+17, "train_loss": 7.265635145365141, "train_runtime": 11576.6001, "train_samples": 228639, "train_samples_per_second": 493.752, "train_steps_per_second": 5.144 }