| { | |
| "epoch": 42.63, | |
| "eval_accuracy": 0.8063465783386143, | |
| "eval_loss": 0.8021716475486755, | |
| "eval_runtime": 54.6256, | |
| "eval_samples": 51744, | |
| "eval_samples_per_second": 947.248, | |
| "eval_steps_per_second": 14.81, | |
| "perplexity": 2.230379270679791, | |
| "train_loss": 0.07689679595947266, | |
| "train_runtime": 32435.3069, | |
| "train_samples": 6005301, | |
| "train_samples_per_second": 7892.634, | |
| "train_steps_per_second": 30.831 | |
| } |