| { | |
| "epoch": 24.0, | |
| "eval_accuracy": 0.1853157281132229, | |
| "eval_loss": 5.635913372039795, | |
| "eval_runtime": 1.9203, | |
| "eval_samples": 479, | |
| "eval_samples_per_second": 249.437, | |
| "eval_steps_per_second": 1.562, | |
| "perplexity": 280.3148321499051, | |
| "total_flos": 2.175368143688663e+17, | |
| "train_loss": 5.765684167821925, | |
| "train_runtime": 24142.3828, | |
| "train_samples": 228639, | |
| "train_samples_per_second": 227.291, | |
| "train_steps_per_second": 1.137 | |
| } |