{ "epoch": 4.992, "total_flos": 1.878482348849234e+18, "train_loss": 0.37849522767922816, "train_runtime": 19752.9737, "train_samples_per_second": 2.531, "train_steps_per_second": 0.02 }