| { | |
| "epoch": 1.64, | |
| "eval_accuracy": 0.4078498471094888, | |
| "eval_loss": 3.5663564205169678, | |
| "eval_runtime": 1763.6541, | |
| "eval_samples": 308356, | |
| "eval_samples_per_second": 174.839, | |
| "eval_steps_per_second": 3.643, | |
| "perplexity": 35.38742108875682, | |
| "train_loss": 5.382437963459396, | |
| "train_runtime": 198262.7738, | |
| "train_samples": 5858758, | |
| "train_samples_per_second": 147.752, | |
| "train_steps_per_second": 3.078 | |
| } |