| { | |
| "base_eval_samples": 13188, | |
| "epoch": 3.0, | |
| "eval_loss": 1.6745600700378418, | |
| "eval_model_preparation_time": 0.0049, | |
| "eval_runtime": 339.9146, | |
| "eval_samples": 13188, | |
| "eval_samples_per_second": 38.798, | |
| "eval_steps_per_second": 2.427, | |
| "total_flos": 7.533943292711404e+17, | |
| "train_loss": 1.4212341141200129, | |
| "train_runtime": 13229.3679, | |
| "train_samples": 117772, | |
| "train_samples_per_second": 14.73, | |
| "train_steps_per_second": 0.058 | |
| } |