bioformer-cellfinder_V1 / trainer_state.json
Mardiyyah's picture
add bioformer cellfinder v1 model
3390687 verified
{
"best_metric": 0.8438751000800641,
"best_model_checkpoint": "/nfs/production/literature/amina-mardiyyah/new_data/OT-Entity-Extraction-Pipeline/model_outputs/hf_cellfinder_conll-V1/bioformers/checkpoint-1221",
"epoch": 11.0,
"eval_steps": 500,
"global_step": 1221,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"grad_norm": 0.795136570930481,
"learning_rate": 1.901801801801802e-05,
"loss": 0.2939,
"step": 111
},
{
"epoch": 1.0,
"eval_accuracy": 0.974508886810103,
"eval_f1": 0.578688524590164,
"eval_loss": 0.09425864368677139,
"eval_precision": 0.5952782462057336,
"eval_recall": 0.5629984051036683,
"eval_runtime": 9.1819,
"eval_samples_per_second": 48.356,
"eval_steps_per_second": 3.049,
"step": 111
},
{
"epoch": 2.0,
"grad_norm": 1.5788325071334839,
"learning_rate": 1.801801801801802e-05,
"loss": 0.0922,
"step": 222
},
{
"epoch": 2.0,
"eval_accuracy": 0.9832787652011226,
"eval_f1": 0.7074601844090529,
"eval_loss": 0.060064926743507385,
"eval_precision": 0.7455830388692579,
"eval_recall": 0.6730462519936204,
"eval_runtime": 9.1954,
"eval_samples_per_second": 48.285,
"eval_steps_per_second": 3.045,
"step": 222
},
{
"epoch": 3.0,
"grad_norm": 1.0079556703567505,
"learning_rate": 1.701801801801802e-05,
"loss": 0.066,
"step": 333
},
{
"epoch": 3.0,
"eval_accuracy": 0.9841557530402245,
"eval_f1": 0.7742435996896818,
"eval_loss": 0.054448943585157394,
"eval_precision": 0.7537764350453172,
"eval_recall": 0.79585326953748,
"eval_runtime": 9.1805,
"eval_samples_per_second": 48.363,
"eval_steps_per_second": 3.05,
"step": 333
},
{
"epoch": 4.0,
"grad_norm": 1.0463738441467285,
"learning_rate": 1.601801801801802e-05,
"loss": 0.05,
"step": 444
},
{
"epoch": 4.0,
"eval_accuracy": 0.9860851262862488,
"eval_f1": 0.801261829652997,
"eval_loss": 0.05010896548628807,
"eval_precision": 0.7925117004680188,
"eval_recall": 0.810207336523126,
"eval_runtime": 9.1685,
"eval_samples_per_second": 48.427,
"eval_steps_per_second": 3.054,
"step": 444
},
{
"epoch": 5.0,
"grad_norm": 1.8808237314224243,
"learning_rate": 1.5018018018018019e-05,
"loss": 0.0384,
"step": 555
},
{
"epoch": 5.0,
"eval_accuracy": 0.9872544434050514,
"eval_f1": 0.8314960629921261,
"eval_loss": 0.047017596662044525,
"eval_precision": 0.8211508553654744,
"eval_recall": 0.8421052631578947,
"eval_runtime": 9.141,
"eval_samples_per_second": 48.573,
"eval_steps_per_second": 3.063,
"step": 555
},
{
"epoch": 6.0,
"grad_norm": 0.8775511980056763,
"learning_rate": 1.4018018018018018e-05,
"loss": 0.0316,
"step": 666
},
{
"epoch": 6.0,
"eval_accuracy": 0.9878975678203928,
"eval_f1": 0.819935691318328,
"eval_loss": 0.0532170832157135,
"eval_precision": 0.826580226904376,
"eval_recall": 0.8133971291866029,
"eval_runtime": 9.3828,
"eval_samples_per_second": 47.321,
"eval_steps_per_second": 2.984,
"step": 666
},
{
"epoch": 7.0,
"grad_norm": 2.152559757232666,
"learning_rate": 1.301801801801802e-05,
"loss": 0.0261,
"step": 777
},
{
"epoch": 7.0,
"eval_accuracy": 0.987488306828812,
"eval_f1": 0.812807881773399,
"eval_loss": 0.050550468266010284,
"eval_precision": 0.8375634517766497,
"eval_recall": 0.7894736842105263,
"eval_runtime": 9.3573,
"eval_samples_per_second": 47.449,
"eval_steps_per_second": 2.992,
"step": 777
},
{
"epoch": 8.0,
"grad_norm": 0.400267630815506,
"learning_rate": 1.2018018018018019e-05,
"loss": 0.0228,
"step": 888
},
{
"epoch": 8.0,
"eval_accuracy": 0.9872544434050514,
"eval_f1": 0.825296442687747,
"eval_loss": 0.05137129873037338,
"eval_precision": 0.8181818181818182,
"eval_recall": 0.8325358851674641,
"eval_runtime": 9.3986,
"eval_samples_per_second": 47.241,
"eval_steps_per_second": 2.979,
"step": 888
},
{
"epoch": 9.0,
"grad_norm": 0.5100765228271484,
"learning_rate": 1.101801801801802e-05,
"loss": 0.0189,
"step": 999
},
{
"epoch": 9.0,
"eval_accuracy": 0.9877221702525725,
"eval_f1": 0.8288726682887267,
"eval_loss": 0.05429461598396301,
"eval_precision": 0.8432343234323433,
"eval_recall": 0.8149920255183413,
"eval_runtime": 9.1439,
"eval_samples_per_second": 48.557,
"eval_steps_per_second": 3.062,
"step": 999
},
{
"epoch": 10.0,
"grad_norm": 2.543349266052246,
"learning_rate": 1.001801801801802e-05,
"loss": 0.0162,
"step": 1110
},
{
"epoch": 10.0,
"eval_accuracy": 0.9881314312441534,
"eval_f1": 0.8352180936995154,
"eval_loss": 0.05771711841225624,
"eval_precision": 0.8461538461538461,
"eval_recall": 0.8245614035087719,
"eval_runtime": 9.1278,
"eval_samples_per_second": 48.642,
"eval_steps_per_second": 3.068,
"step": 1110
},
{
"epoch": 11.0,
"grad_norm": 0.7831849455833435,
"learning_rate": 9.018018018018019e-06,
"loss": 0.0142,
"step": 1221
},
{
"epoch": 11.0,
"eval_accuracy": 0.9886576239476146,
"eval_f1": 0.8438751000800641,
"eval_loss": 0.05389339104294777,
"eval_precision": 0.8472668810289389,
"eval_recall": 0.8405103668261563,
"eval_runtime": 9.1654,
"eval_samples_per_second": 48.443,
"eval_steps_per_second": 3.055,
"step": 1221
}
],
"logging_steps": 500,
"max_steps": 2220,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 1622782443811692.0,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}