taskmaster2-4ep / train_results.json
penfever's picture
End of training
bcd3062 verified
raw
history blame contribute delete
540 Bytes
{
"achieved_tflops_per_gpu": 5.333613089682677,
"achieved_tflops_per_gpu_theoretical": 277.80817415149977,
"epoch": 5.0,
"loss_nan_ranks": 0,
"loss_rank_avg": 0.4209003150463104,
"mfu_percent": 0.3769337872567263,
"mfu_percent_theoretical": 19.633086512473483,
"total_flos": 8.136605209670451e+17,
"train_loss": 0.4667121115763476,
"train_runtime": 9534.5841,
"train_samples_per_second": 5.242,
"train_steps_per_second": 0.082,
"valid_targets_mean": 2253.5,
"valid_targets_min": 645
}