| { | |
| "epoch": 0.93, | |
| "eval_accuracy": 0.198145828598818, | |
| "eval_loss": 5.527432918548584, | |
| "eval_runtime": 1749.7981, | |
| "eval_samples": 308356, | |
| "eval_samples_per_second": 176.224, | |
| "eval_steps_per_second": 3.672, | |
| "perplexity": 251.49746715846484, | |
| "train_loss": 6.147486028159083, | |
| "train_runtime": 107984.4242, | |
| "train_samples": 5858758, | |
| "train_samples_per_second": 271.278, | |
| "train_steps_per_second": 5.652 | |
| } |