{ "epoch": 3.0, "eval_accuracy": 0.24484439445069367, "eval_loss": 5.178476810455322, "eval_runtime": 2.5253, "eval_samples": 294, "eval_samples_per_second": 116.424, "eval_steps_per_second": 3.168, "perplexity": 177.4123724102887, "total_flos": 4.300357860694426e+16, "train_loss": 0.6495532799400761, "train_runtime": 3174.7304, "train_samples": 2408, "train_samples_per_second": 2.275, "train_steps_per_second": 0.569 }