| { | |
| "epoch": 0.89, | |
| "eval_accuracy": 0.5276878957675893, | |
| "eval_loss": 2.621161460876465, | |
| "eval_runtime": 1910.5455, | |
| "eval_samples": 308356, | |
| "eval_samples_per_second": 161.397, | |
| "eval_steps_per_second": 3.363, | |
| "perplexity": 13.751686358906099, | |
| "train_loss": 2.857705880085117, | |
| "train_runtime": 107970.477, | |
| "train_samples": 5858758, | |
| "train_samples_per_second": 271.313, | |
| "train_steps_per_second": 5.652 | |
| } |