{ "epoch": 25.0, "eval_accuracy": 0.15406566084647116, "eval_loss": 6.5065765380859375, "eval_runtime": 0.6822, "eval_samples": 479, "eval_samples_per_second": 702.098, "eval_steps_per_second": 7.329, "perplexity": 669.5303778823405, "total_flos": 3.051148107142656e+17, "train_loss": 6.453962587345357, "train_runtime": 11281.7551, "train_samples": 228639, "train_samples_per_second": 506.657, "train_steps_per_second": 5.278 }