| { | |
| "epoch": 1.99, | |
| "eval_accuracy": 0.23619257086999024, | |
| "eval_loss": 5.369718551635742, | |
| "eval_runtime": 8.2411, | |
| "eval_samples": 40, | |
| "eval_samples_per_second": 4.854, | |
| "eval_steps_per_second": 2.427, | |
| "perplexity": 214.80240341086764, | |
| "total_flos": 2829332565196800.0, | |
| "train_loss": 6.479159524507612, | |
| "train_runtime": 865.9454, | |
| "train_samples": 862, | |
| "train_samples_per_second": 1.991, | |
| "train_steps_per_second": 0.247 | |
| } |