| { | |
| "epoch": 25.0, | |
| "eval_accuracy": 0.15406566084647116, | |
| "eval_loss": 6.5065765380859375, | |
| "eval_runtime": 0.6822, | |
| "eval_samples": 479, | |
| "eval_samples_per_second": 702.098, | |
| "eval_steps_per_second": 7.329, | |
| "perplexity": 669.5303778823405, | |
| "total_flos": 3.051148107142656e+17, | |
| "train_loss": 6.453962587345357, | |
| "train_runtime": 11281.7551, | |
| "train_samples": 228639, | |
| "train_samples_per_second": 506.657, | |
| "train_steps_per_second": 5.278 | |
| } |