bert-base-uncased / trainer_state.json
seanfarrell's picture
Upload folder using huggingface_hub
15bd19a verified
{
"best_global_step": 1092,
"best_metric": 0.7072933549432739,
"best_model_checkpoint": "projects/PetBERT_disease/model/checkpoint-1092",
"epoch": 12.0,
"eval_steps": 500,
"global_step": 1092,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_f1": 0.6436176302232398,
"eval_loss": 0.042807724326848984,
"eval_precision": 0.720030737704918,
"eval_recall": 0.5818671082591595,
"eval_runtime": 28.0832,
"eval_samples_per_second": 178.007,
"eval_steps_per_second": 5.591,
"step": 91
},
{
"epoch": 2.0,
"eval_f1": 0.6762402088772846,
"eval_loss": 0.03623269498348236,
"eval_precision": 0.7126805778491172,
"eval_recall": 0.6433450631339267,
"eval_runtime": 28.7199,
"eval_samples_per_second": 174.061,
"eval_steps_per_second": 5.467,
"step": 182
},
{
"epoch": 3.0,
"eval_f1": 0.6854706461134799,
"eval_loss": 0.04084809869527817,
"eval_precision": 0.7263670064874884,
"eval_recall": 0.6489339681225419,
"eval_runtime": 28.935,
"eval_samples_per_second": 172.766,
"eval_steps_per_second": 5.426,
"step": 273
},
{
"epoch": 4.0,
"eval_f1": 0.6827867947443966,
"eval_loss": 0.04500150680541992,
"eval_precision": 0.7316611452910554,
"eval_recall": 0.6400331194369696,
"eval_runtime": 29.0241,
"eval_samples_per_second": 172.236,
"eval_steps_per_second": 5.409,
"step": 364
},
{
"epoch": 5.0,
"eval_f1": 0.684967037717497,
"eval_loss": 0.058024812489748,
"eval_precision": 0.716644052464948,
"eval_recall": 0.6559718484785758,
"eval_runtime": 29.1182,
"eval_samples_per_second": 171.68,
"eval_steps_per_second": 5.392,
"step": 455
},
{
"epoch": 5.4945054945054945,
"grad_norm": 0.24326272308826447,
"learning_rate": 4.9725824175824175e-05,
"loss": 0.0324,
"step": 500
},
{
"epoch": 6.0,
"eval_f1": 0.6974244120940649,
"eval_loss": 0.06078333407640457,
"eval_precision": 0.759697487191998,
"eval_recall": 0.6445870420202856,
"eval_runtime": 29.0499,
"eval_samples_per_second": 172.083,
"eval_steps_per_second": 5.404,
"step": 546
},
{
"epoch": 7.0,
"eval_f1": 0.699815837937385,
"eval_loss": 0.06435026973485947,
"eval_precision": 0.7340909090909091,
"eval_recall": 0.668598633823225,
"eval_runtime": 29.1958,
"eval_samples_per_second": 171.223,
"eval_steps_per_second": 5.377,
"step": 637
},
{
"epoch": 8.0,
"eval_f1": 0.6904121863799283,
"eval_loss": 0.06762922555208206,
"eval_precision": 0.7522577495728582,
"eval_recall": 0.6379631546263713,
"eval_runtime": 29.1932,
"eval_samples_per_second": 171.238,
"eval_steps_per_second": 5.378,
"step": 728
},
{
"epoch": 9.0,
"eval_f1": 0.6979665708506334,
"eval_loss": 0.07541821897029877,
"eval_precision": 0.718544498027181,
"eval_recall": 0.6785344649140964,
"eval_runtime": 29.3157,
"eval_samples_per_second": 170.523,
"eval_steps_per_second": 5.355,
"step": 819
},
{
"epoch": 10.0,
"eval_f1": 0.7055853581571474,
"eval_loss": 0.06385636329650879,
"eval_precision": 0.7172797262617622,
"eval_recall": 0.6942661974746429,
"eval_runtime": 29.2092,
"eval_samples_per_second": 171.144,
"eval_steps_per_second": 5.375,
"step": 910
},
{
"epoch": 10.989010989010989,
"grad_norm": 0.7826827168464661,
"learning_rate": 4.9451098901098904e-05,
"loss": 0.0035,
"step": 1000
},
{
"epoch": 11.0,
"eval_f1": 0.7059959240587794,
"eval_loss": 0.07221361249685287,
"eval_precision": 0.7326357969723953,
"eval_recall": 0.6812254191678742,
"eval_runtime": 29.1291,
"eval_samples_per_second": 171.615,
"eval_steps_per_second": 5.39,
"step": 1001
},
{
"epoch": 12.0,
"eval_f1": 0.7072933549432739,
"eval_loss": 0.06996828317642212,
"eval_precision": 0.7398282097649186,
"eval_recall": 0.6774994825087973,
"eval_runtime": 29.1242,
"eval_samples_per_second": 171.644,
"eval_steps_per_second": 5.391,
"step": 1092
}
],
"logging_steps": 500,
"max_steps": 91000,
"num_input_tokens_seen": 0,
"num_train_epochs": 1000,
"save_steps": 500,
"stateful_callbacks": {
"EarlyStoppingCallback": {
"args": {
"early_stopping_patience": 3,
"early_stopping_threshold": 0.0
},
"attributes": {
"early_stopping_patience_counter": 0
}
},
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": false
},
"attributes": {}
}
},
"total_flos": 9096344934248448.0,
"train_batch_size": 32,
"trial_name": null,
"trial_params": null
}