| { | |
| "epoch": 25.0, | |
| "eval_accuracy": 0.15502627563993898, | |
| "eval_loss": 6.300896644592285, | |
| "eval_runtime": 0.7232, | |
| "eval_samples": 479, | |
| "eval_samples_per_second": 662.33, | |
| "eval_steps_per_second": 6.914, | |
| "perplexity": 545.0604165598512, | |
| "total_flos": 3.049796905526016e+17, | |
| "train_loss": 6.258596241115823, | |
| "train_runtime": 11648.8655, | |
| "train_samples": 228639, | |
| "train_samples_per_second": 490.689, | |
| "train_steps_per_second": 5.112 | |
| } |