{ "achieved_tflops_per_gpu": 4.949651343267627, "achieved_tflops_per_gpu_theoretical": 243.92912852326808, "epoch": 5.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.2248307466506958, "mfu_percent": 0.3497986815030125, "mfu_percent_theoretical": 17.23880766948891, "total_flos": 3.151185311610962e+17, "train_loss": 0.24082276695653013, "train_runtime": 3979.0496, "train_samples_per_second": 4.505, "train_steps_per_second": 0.072, "valid_targets_mean": 2971.6, "valid_targets_min": 1283 }