train_multirc_1745950262 / train_results.json
rbelanec's picture
End of training
c76ddfa verified
{
"epoch": 6.525328330206379,
"num_input_tokens_seen": 76963024,
"total_flos": 3.2232900582312346e+17,
"train_loss": 3.2710773272037508,
"train_runtime": 26847.8872,
"train_samples_per_second": 5.96,
"train_steps_per_second": 1.49
}