{ "epoch": 4.996316004911994, "eval_loss": 2.1617491245269775, "eval_runtime": 16.2011, "eval_samples_per_second": 1033.94, "eval_steps_per_second": 64.625, "perplexity": 8.686317830153754, "total_flos": 2.358780336672768e+16, "train_loss": 9.447584004445119, "train_runtime": 9280.2532, "train_samples_per_second": 42.117, "train_steps_per_second": 0.658 }