| { | |
| "epoch": 20.0, | |
| "eval_accuracy": 0.3686057656808563, | |
| "eval_loss": 3.563647985458374, | |
| "eval_runtime": 180.1205, | |
| "eval_samples": 16644, | |
| "eval_samples_per_second": 92.405, | |
| "eval_steps_per_second": 5.779, | |
| "perplexity": 35.29170623409146, | |
| "total_flos": 1.43513603407872e+18, | |
| "train_loss": 3.4363333413179364, | |
| "train_runtime": 137192.0021, | |
| "train_samples": 274623, | |
| "train_samples_per_second": 40.035, | |
| "train_steps_per_second": 0.5 | |
| } |