{ "epoch": 0.9996261682242991, "total_flos": 4.450466167504896e+16, "train_loss": 3.11931433781101, "train_runtime": 1360.775, "train_samples_per_second": 7.863, "train_steps_per_second": 0.983 }