{ "epoch": 25.0, "eval_accuracy": 0.15361360682601571, "eval_loss": 6.361563682556152, "eval_runtime": 0.6853, "eval_samples": 479, "eval_samples_per_second": 698.929, "eval_steps_per_second": 7.296, "perplexity": 579.1512574389864, "total_flos": 3.050247306064896e+17, "train_loss": 6.340149333707231, "train_runtime": 11680.4757, "train_samples": 228639, "train_samples_per_second": 489.361, "train_steps_per_second": 5.098 }