hBERTv2_data_aug_stsb / trainer_state.json
gokuls's picture
End of training
f46642b
{
"best_metric": 2.135712146759033,
"best_model_checkpoint": "hBERTv2_data_aug_stsb/checkpoint-1259",
"epoch": 6.0,
"global_step": 7554,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"learning_rate": 4.900317712470215e-05,
"loss": 0.6302,
"step": 1259
},
{
"epoch": 1.0,
"eval_combined_score": 0.5155992873552944,
"eval_loss": 2.135712146759033,
"eval_pearson": 0.5180732083614772,
"eval_runtime": 1.7839,
"eval_samples_per_second": 840.872,
"eval_spearmanr": 0.5131253663491117,
"eval_steps_per_second": 3.363,
"step": 1259
},
{
"epoch": 2.0,
"learning_rate": 4.800317712470215e-05,
"loss": 0.0973,
"step": 2518
},
{
"epoch": 2.0,
"eval_combined_score": 0.4388959634942341,
"eval_loss": 2.4677507877349854,
"eval_pearson": 0.44945880353679196,
"eval_runtime": 1.7897,
"eval_samples_per_second": 838.143,
"eval_spearmanr": 0.4283331234516762,
"eval_steps_per_second": 3.353,
"step": 2518
},
{
"epoch": 3.0,
"learning_rate": 4.700317712470215e-05,
"loss": 0.0514,
"step": 3777
},
{
"epoch": 3.0,
"eval_combined_score": 0.40110936321253565,
"eval_loss": 2.3102009296417236,
"eval_pearson": 0.4100592328009352,
"eval_runtime": 1.8032,
"eval_samples_per_second": 831.867,
"eval_spearmanr": 0.39215949362413616,
"eval_steps_per_second": 3.327,
"step": 3777
},
{
"epoch": 4.0,
"learning_rate": 4.6003177124702146e-05,
"loss": 0.0384,
"step": 5036
},
{
"epoch": 4.0,
"eval_combined_score": 0.4411314393998532,
"eval_loss": 2.5410399436950684,
"eval_pearson": 0.44464954748981084,
"eval_runtime": 1.8348,
"eval_samples_per_second": 817.514,
"eval_spearmanr": 0.43761333130989566,
"eval_steps_per_second": 3.27,
"step": 5036
},
{
"epoch": 5.0,
"learning_rate": 4.500317712470214e-05,
"loss": 0.031,
"step": 6295
},
{
"epoch": 5.0,
"eval_combined_score": 0.40039690758107405,
"eval_loss": 2.4586338996887207,
"eval_pearson": 0.4091069786387324,
"eval_runtime": 1.8247,
"eval_samples_per_second": 822.056,
"eval_spearmanr": 0.3916868365234156,
"eval_steps_per_second": 3.288,
"step": 6295
},
{
"epoch": 6.0,
"learning_rate": 4.4003177124702145e-05,
"loss": 0.0255,
"step": 7554
},
{
"epoch": 6.0,
"eval_combined_score": 0.39364433082151107,
"eval_loss": 2.5980560779571533,
"eval_pearson": 0.39984420561965867,
"eval_runtime": 1.817,
"eval_samples_per_second": 825.557,
"eval_spearmanr": 0.3874444560233634,
"eval_steps_per_second": 3.302,
"step": 7554
},
{
"epoch": 6.0,
"step": 7554,
"total_flos": 2.4081953784122573e+17,
"train_loss": 0.14565795876217924,
"train_runtime": 6838.9097,
"train_samples_per_second": 2355.982,
"train_steps_per_second": 9.205
}
],
"max_steps": 62950,
"num_train_epochs": 50,
"total_flos": 2.4081953784122573e+17,
"trial_name": null,
"trial_params": null
}