{ "achieved_tflops_per_gpu": 0.003027794354282776, "achieved_tflops_per_gpu_theoretical": 921.5100410879018, "epoch": 7.0, "loss_nan_ranks": 0, "loss_rank_avg": 0.2101745903491974, "mfu_percent": 0.0002139783995959559, "mfu_percent_theoretical": 65.12438452918033, "total_flos": 1189003618287616.0, "train_loss": 0.21699104300674413, "train_runtime": 24543.5183, "train_samples_per_second": 4.344, "train_steps_per_second": 0.272, "valid_targets_mean": 3715.1, "valid_targets_min": 791 }