{ "epoch": 49.94117647058823, "eval_loss": 1.9181811809539795, "eval_runtime": 2.5587, "eval_samples": 1945, "eval_samples_per_second": 760.165, "eval_steps_per_second": 12.116, "perplexity": 6.8085636554933355, "total_flos": 1.2548402868338688e+16, "train_loss": 1.8820014402601455, "train_runtime": 2628.924, "train_samples": 9733, "train_samples_per_second": 185.114, "train_steps_per_second": 0.171 }