{ "epoch": 9.996763754045308, "eval_loss": 0.6763796806335449, "eval_runtime": 26.5385, "eval_samples_per_second": 368.069, "eval_steps_per_second": 46.009, "perplexity": 1.9667445843771059, "total_flos": 2.9966216313176064e+16, "train_loss": 0.7098540155932651, "train_runtime": 3818.8619, "train_samples_per_second": 119.748, "train_steps_per_second": 7.484 }