| { | |
| "epoch": 25.0, | |
| "eval_accuracy": 0.15200316437814318, | |
| "eval_loss": 10.231886863708496, | |
| "eval_runtime": 0.7409, | |
| "eval_samples": 479, | |
| "eval_samples_per_second": 646.532, | |
| "eval_steps_per_second": 6.749, | |
| "perplexity": 27774.86804686192, | |
| "total_flos": 3.053850510375936e+17, | |
| "train_loss": 8.741478605102232, | |
| "train_runtime": 12176.6113, | |
| "train_samples": 228639, | |
| "train_samples_per_second": 469.422, | |
| "train_steps_per_second": 4.891 | |
| } |