{ "epoch": 3.0, "total_flos": 1.6530581665087488e+16, "train_loss": 0.3794273254576331, "train_runtime": 265798.511, "train_samples_per_second": 1.334, "train_steps_per_second": 0.014 }