| { | |
| "epoch": 10.0, | |
| "eval_loss": 2.299952745437622, | |
| "eval_runtime": 2.1048, | |
| "eval_samples": 1945, | |
| "eval_samples_per_second": 924.096, | |
| "eval_steps_per_second": 57.964, | |
| "perplexity": 9.973711140323708, | |
| "total_flos": 1536221652235776.0, | |
| "train_loss": 1.5534028151939656, | |
| "train_runtime": 363.1065, | |
| "train_samples": 9733, | |
| "train_samples_per_second": 268.048, | |
| "train_steps_per_second": 16.772 | |
| } |