| { | |
| "epoch": 0.82, | |
| "eval_accuracy": 0.1759858884379102, | |
| "eval_loss": 5.553138256072998, | |
| "eval_runtime": 1546.0138, | |
| "eval_samples": 308356, | |
| "eval_samples_per_second": 199.452, | |
| "eval_steps_per_second": 4.156, | |
| "perplexity": 258.0461012754175, | |
| "train_loss": 5.658731824803928, | |
| "train_runtime": 86394.9765, | |
| "train_samples": 5858758, | |
| "train_samples_per_second": 339.068, | |
| "train_steps_per_second": 7.064 | |
| } |