{ "epoch": 3.0, "eval_loss": 0.4810695946216583, "eval_runtime": 526.6047, "eval_samples_per_second": 3.781, "eval_steps_per_second": 0.473, "total_flos": 3000194903834624.0, "train_loss": 0.4290710630871001, "train_runtime": 89946.115, "train_samples_per_second": 0.597, "train_steps_per_second": 0.037 }