{ "epoch": 25.0, "eval_accuracy": 0.151748883991637, "eval_loss": 10.138225555419922, "eval_runtime": 1.0511, "eval_samples": 479, "eval_samples_per_second": 455.694, "eval_steps_per_second": 4.757, "perplexity": 25291.548193853436, "total_flos": 1.5155177772432384e+18, "train_loss": 8.027886620048312, "train_runtime": 24986.4669, "train_samples": 228639, "train_samples_per_second": 228.763, "train_steps_per_second": 2.383 }