| { | |
| "epoch": 20.0, | |
| "eval_accuracy": 0.371191240289195, | |
| "eval_loss": 3.5466434955596924, | |
| "eval_runtime": 179.6731, | |
| "eval_samples": 16643, | |
| "eval_samples_per_second": 92.629, | |
| "eval_steps_per_second": 5.794, | |
| "perplexity": 34.69666231918936, | |
| "total_flos": 1.43566384398336e+18, | |
| "train_loss": 3.438475851533715, | |
| "train_runtime": 136533.177, | |
| "train_samples": 274724, | |
| "train_samples_per_second": 40.243, | |
| "train_steps_per_second": 0.503 | |
| } |