| { | |
| "epoch": 128.95, | |
| "eval_accuracy": 0.7366529161278139, | |
| "eval_loss": 1.1318359375, | |
| "eval_runtime": 325.6978, | |
| "eval_samples": 125529, | |
| "eval_samples_per_second": 385.416, | |
| "eval_steps_per_second": 1.508, | |
| "perplexity": 3.101345152387537, | |
| "train_loss": 0.110439400390625, | |
| "train_runtime": 5222.9883, | |
| "train_samples": 2976812, | |
| "train_samples_per_second": 73521.13, | |
| "train_steps_per_second": 35.899 | |
| } |