{ "epoch": 25.0, "eval_accuracy": 0.15350059332090185, "eval_loss": 9.08564567565918, "eval_runtime": 1.0357, "eval_samples": 479, "eval_samples_per_second": 462.482, "eval_steps_per_second": 4.828, "perplexity": 8827.663732722915, "total_flos": 1.5151126801503744e+18, "train_loss": 7.625829259710688, "train_runtime": 24701.7833, "train_samples": 228639, "train_samples_per_second": 231.399, "train_steps_per_second": 2.411 }