{ "epoch": 50.0, "eval_loss": 0.5416154265403748, "eval_runtime": 9.3336, "eval_samples_per_second": 160.924, "eval_steps_per_second": 5.036, "perplexity": 1.7187811854679051, "total_flos": 2.35191607492608e+16, "train_loss": 0.15202610808478462, "train_runtime": 1233.6469, "train_samples_per_second": 290.845, "train_steps_per_second": 9.119 }