| { | |
| "epoch": 0.67, | |
| "eval_loss": 0.9398621916770935, | |
| "eval_runtime": 183.2326, | |
| "eval_samples": 23110, | |
| "eval_samples_per_second": 126.124, | |
| "eval_steps_per_second": 0.497, | |
| "perplexity": 2.559628655890698, | |
| "train_loss": 0.9917194036876454, | |
| "train_runtime": 6192.0322, | |
| "train_samples": 207865, | |
| "train_samples_per_second": 33.57, | |
| "train_steps_per_second": 0.066 | |
| } |