{ "epoch": 33.44444444444444, "eval_ppl": 265.109507069636, "total_flos": 4.709999853439795e+16, "train_loss": 5.68605941772461, "train_runtime": 1228.1978, "train_samples_per_second": 46.247, "train_steps_per_second": 0.081 }