| { | |
| "epoch": 28.812761993479274, | |
| "eval_accuracy": 0.3701093509307751, | |
| "eval_loss": 3.5537867546081543, | |
| "eval_runtime": 80.891, | |
| "eval_samples": 16651, | |
| "eval_samples_per_second": 205.845, | |
| "eval_steps_per_second": 12.869, | |
| "perplexity": 34.945396896348726, | |
| "total_flos": 2.068898812526592e+18, | |
| "train_loss": 3.384700189301462, | |
| "train_runtime": 72601.828, | |
| "train_samples": 274807, | |
| "train_samples_per_second": 189.256, | |
| "train_steps_per_second": 2.366 | |
| } |