taskmaster2-16ep / train_results.json
penfever's picture
End of training
8d602c8 verified
{
"achieved_tflops_per_gpu": 4.838622773087782,
"achieved_tflops_per_gpu_theoretical": 111.80085057316455,
"epoch": 5.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.3410820960998535,
"mfu_percent": 0.3419521394408327,
"mfu_percent_theoretical": 7.901120181849085,
"total_flos": 1.8466654367420252e+18,
"train_loss": 0.38092176382708703,
"train_runtime": 23853.1903,
"train_samples_per_second": 2.096,
"train_steps_per_second": 0.033,
"valid_targets_mean": 5863.9,
"valid_targets_min": 645
}