{ "epoch": 0.4, "eval/perplexity": 7.994621224231238, "eval_loss": 2.0787689685821533, "eval_runtime": 33.0993, "eval_samples_per_second": 3.293, "eval_steps_per_second": 0.846, "perplexity": 7.994621224231238, "total_flos": 3.673093344067584e+17, "train_loss": 2.038690024614334, "train_perplexity": 7.680541285926508, "train_runtime": 33114.4358, "train_samples_per_second": 0.483, "train_steps_per_second": 0.03 }