| { | |
| "epoch": 9.96, | |
| "eval_loss": 10.791767120361328, | |
| "eval_runtime": 5.99, | |
| "eval_samples": 444, | |
| "eval_samples_per_second": 74.123, | |
| "eval_steps_per_second": 18.531, | |
| "perplexity": 48618.875553525686, | |
| "train_loss": 11.18234748840332, | |
| "train_runtime": 256.0921, | |
| "train_samples": 8516, | |
| "train_samples_per_second": 332.537, | |
| "train_steps_per_second": 0.625 | |
| } |