| { | |
| "epoch": 2.9918166939443536, | |
| "eval_loss": 0.7127311825752258, | |
| "eval_runtime": 27.5772, | |
| "eval_samples_per_second": 607.423, | |
| "eval_steps_per_second": 9.501, | |
| "perplexity": 2.0395540531763667, | |
| "total_flos": 5.437860691102925e+16, | |
| "train_loss": 0.9607737994584881, | |
| "train_runtime": 2198.2213, | |
| "train_samples_per_second": 106.683, | |
| "train_steps_per_second": 0.416 | |
| } |