{ "epoch": 2.88, "total_flos": 5.59772512916521e+16, "train_loss": 0.10819435450765821, "train_runtime": 65.0195, "train_samples_per_second": 35.712, "train_steps_per_second": 0.277 }