| { | |
| "epoch": 3.0, | |
| "eval_loss": 2.1944403648376465, | |
| "eval_runtime": 83.9431, | |
| "eval_samples": 3913, | |
| "eval_samples_per_second": 46.615, | |
| "eval_steps_per_second": 1.465, | |
| "perplexity": 8.97497693843778, | |
| "train_loss": 2.733830861908257, | |
| "train_runtime": 14258.7293, | |
| "train_samples": 97236, | |
| "train_samples_per_second": 20.458, | |
| "train_steps_per_second": 0.639 | |
| } |