distilbert_km_100_v2_mnli / all_results.json
Hartunka's picture
End of training
b76664c verified
{
"epoch": 9.0,
"epoch_mm": 9.0,
"eval_accuracy": 0.6360672440142638,
"eval_accuracy_mm": 0.6334418226200162,
"eval_loss": 0.8316934704780579,
"eval_loss_mm": 0.8361369371414185,
"eval_runtime": 3.9936,
"eval_runtime_mm": 4.0144,
"eval_samples": 9815,
"eval_samples_mm": 9832,
"eval_samples_per_second": 2457.686,
"eval_samples_per_second_mm": 2449.195,
"eval_steps_per_second": 9.766,
"eval_steps_per_second_mm": 9.715,
"total_flos": 2.340951304214108e+17,
"train_loss": 0.6929499982457809,
"train_runtime": 3245.2005,
"train_samples": 392702,
"train_samples_per_second": 6050.504,
"train_steps_per_second": 23.635
}