{ "epoch": 49.814258911819884, "eval_loss": 0.6708822250366211, "eval_runtime": 3.6448, "eval_samples_per_second": 501.534, "eval_steps_per_second": 62.829, "perplexity": 1.9559621584633884, "total_flos": 2.18714101825536e+16, "train_loss": 0.6980596797627614, "train_runtime": 3389.5401, "train_samples_per_second": 125.799, "train_steps_per_second": 3.924 }