{ "epoch": 25.0, "eval_accuracy": 0.15341583319206645, "eval_loss": 9.082741737365723, "eval_runtime": 1.0384, "eval_samples": 479, "eval_samples_per_second": 461.307, "eval_steps_per_second": 4.815, "perplexity": 8802.065927180123, "total_flos": 1.5151126801503744e+18, "train_loss": 7.655053733486172, "train_runtime": 24646.3655, "train_samples": 228639, "train_samples_per_second": 231.92, "train_steps_per_second": 2.416 }