| { | |
| "epoch": 1.04632568359375, | |
| "eval_accuracy": 0.04088023483365949, | |
| "eval_loss": 6.392906188964844, | |
| "eval_runtime": 244.4224, | |
| "eval_samples": 10000, | |
| "eval_samples_per_second": 40.913, | |
| "eval_steps_per_second": 10.228, | |
| "perplexity": 597.5907702266671, | |
| "total_flos": 5.045399375119909e+18, | |
| "train_loss": 6.577412648592144, | |
| "train_runtime": 154506.2809, | |
| "train_samples": 2000000, | |
| "train_samples_per_second": 13.573, | |
| "train_steps_per_second": 3.393 | |
| } |