| { | |
| "epoch": 3.0, | |
| "eval_loss": 0.9489470720291138, | |
| "eval_runtime": 279.8429, | |
| "eval_samples": 1267, | |
| "eval_samples_per_second": 4.528, | |
| "eval_steps_per_second": 2.266, | |
| "perplexity": 2.582988526120989, | |
| "train_loss": 0.9826037574650801, | |
| "train_runtime": 24274.8201, | |
| "train_samples": 11364, | |
| "train_samples_per_second": 1.404, | |
| "train_steps_per_second": 0.702 | |
| } |