{ "epoch": 2.995008319467554, "eval_accuracy": 0.6477501136495986, "eval_loss": 2.9963440895080566, "eval_runtime": 49.7886, "eval_samples": 921, "eval_samples_per_second": 18.498, "eval_steps_per_second": 9.259, "perplexity": 20.012240063032426, "total_flos": 2.6245163088714138e+17, "train_loss": 3.7161494956193146, "train_runtime": 2214.8433, "train_samples": 7211, "train_samples_per_second": 9.767, "train_steps_per_second": 0.61 }