| { | |
| "epoch": 1.9985964912280703, | |
| "eval_loss": 0.22910664975643158, | |
| "eval_runtime": 8.378, | |
| "eval_samples": 100, | |
| "eval_samples_per_second": 6.565, | |
| "eval_steps_per_second": 0.836, | |
| "perplexity": 1.2574761413829163, | |
| "raw_train_examples": 78434, | |
| "total_flos": 8.025299762167153e+17, | |
| "train_examples": 39900, | |
| "train_loss": 0.37913749282088366, | |
| "train_runtime": 28381.1385, | |
| "train_samples_per_second": 2.812, | |
| "train_steps_per_second": 0.088 | |
| } |