| { | |
| "epoch": 25.0, | |
| "eval_accuracy": 0.15262473865626944, | |
| "eval_loss": 6.875680923461914, | |
| "eval_runtime": 0.6832, | |
| "eval_samples": 479, | |
| "eval_samples_per_second": 701.123, | |
| "eval_steps_per_second": 7.319, | |
| "perplexity": 968.4345709456935, | |
| "total_flos": 3.053850510375936e+17, | |
| "train_loss": 6.665182815410828, | |
| "train_runtime": 11393.6254, | |
| "train_samples": 228639, | |
| "train_samples_per_second": 501.682, | |
| "train_steps_per_second": 5.227 | |
| } |