| { | |
| "epoch": 10.0, | |
| "eval_loss": 1.9962048530578613, | |
| "eval_runtime": 2.1252, | |
| "eval_samples": 1945, | |
| "eval_samples_per_second": 915.193, | |
| "eval_steps_per_second": 57.405, | |
| "perplexity": 7.361066690824402, | |
| "total_flos": 1536221652235776.0, | |
| "train_loss": 1.731730433872768, | |
| "train_runtime": 362.8983, | |
| "train_samples": 9733, | |
| "train_samples_per_second": 268.202, | |
| "train_steps_per_second": 16.782 | |
| } |