{ "achieved_tflops_per_gpu": 5.143096781650618, "achieved_tflops_per_gpu_theoretical": 216.82589202068274, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.07686486095190048, "mfu_percent": 0.5200300082558764, "mfu_percent_theoretical": 21.923750457096332, "total_flos": 2.65446196155043e+18, "train_loss": 0.30306281665335555, "train_runtime": 64515.1665, "train_samples_per_second": 1.024, "train_steps_per_second": 0.064, "valid_targets_mean": 6255.1, "valid_targets_min": 3251 }