| { | |
| "achieved_tflops_per_gpu": 4.949651343267627, | |
| "achieved_tflops_per_gpu_theoretical": 243.92912852326808, | |
| "epoch": 5.0, | |
| "loss_nan_ranks": 0, | |
| "loss_rank_avg": 0.2248307466506958, | |
| "mfu_percent": 0.3497986815030125, | |
| "mfu_percent_theoretical": 17.23880766948891, | |
| "total_flos": 3.151185311610962e+17, | |
| "train_loss": 0.24082276695653013, | |
| "train_runtime": 3979.0496, | |
| "train_samples_per_second": 4.505, | |
| "train_steps_per_second": 0.072, | |
| "valid_targets_mean": 2971.6, | |
| "valid_targets_min": 1283 | |
| } |