RoBERTa-CyNER / trainer_state.json
Anonymous
Upload folder using huggingface_hub
be243c7
{
"best_metric": 0.07372047752141953,
"best_model_checkpoint": "/content/dnrti_our/checkpoint-1000",
"epoch": 10.0,
"eval_steps": 500,
"global_step": 3520,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.42,
"learning_rate": 1.715909090909091e-05,
"loss": 0.13,
"step": 500
},
{
"epoch": 1.42,
"eval_accuracy": 0.979574031306133,
"eval_f1": 0.733705772811918,
"eval_loss": 0.08860738575458527,
"eval_precision": 0.7137681159420289,
"eval_recall": 0.7547892720306514,
"eval_runtime": 4.2683,
"eval_samples_per_second": 190.242,
"eval_steps_per_second": 23.897,
"step": 500
},
{
"epoch": 2.84,
"learning_rate": 1.431818181818182e-05,
"loss": 0.0421,
"step": 1000
},
{
"epoch": 2.84,
"eval_accuracy": 0.9835771105978958,
"eval_f1": 0.7874920229738354,
"eval_loss": 0.07372047752141953,
"eval_precision": 0.7869897959183674,
"eval_recall": 0.7879948914431673,
"eval_runtime": 4.138,
"eval_samples_per_second": 196.232,
"eval_steps_per_second": 24.65,
"step": 1000
},
{
"epoch": 4.26,
"learning_rate": 1.1477272727272729e-05,
"loss": 0.0249,
"step": 1500
},
{
"epoch": 4.26,
"eval_accuracy": 0.9821914293045932,
"eval_f1": 0.7684478371501273,
"eval_loss": 0.08549553900957108,
"eval_precision": 0.7655259822560203,
"eval_recall": 0.7713920817369093,
"eval_runtime": 3.9823,
"eval_samples_per_second": 203.9,
"eval_steps_per_second": 25.613,
"step": 1500
},
{
"epoch": 5.68,
"learning_rate": 8.636363636363637e-06,
"loss": 0.0167,
"step": 2000
},
{
"epoch": 5.68,
"eval_accuracy": 0.9826020015396458,
"eval_f1": 0.77743335399876,
"eval_loss": 0.09457844495773315,
"eval_precision": 0.755421686746988,
"eval_recall": 0.8007662835249042,
"eval_runtime": 4.0013,
"eval_samples_per_second": 202.937,
"eval_steps_per_second": 25.492,
"step": 2000
},
{
"epoch": 7.1,
"learning_rate": 5.795454545454546e-06,
"loss": 0.0104,
"step": 2500
},
{
"epoch": 7.1,
"eval_accuracy": 0.981986143187067,
"eval_f1": 0.7681704260651631,
"eval_loss": 0.09761953353881836,
"eval_precision": 0.7539975399753998,
"eval_recall": 0.7828863346104725,
"eval_runtime": 4.1035,
"eval_samples_per_second": 197.878,
"eval_steps_per_second": 24.857,
"step": 2500
},
{
"epoch": 8.52,
"learning_rate": 2.954545454545455e-06,
"loss": 0.0066,
"step": 3000
},
{
"epoch": 8.52,
"eval_accuracy": 0.9835771105978958,
"eval_f1": 0.7897371714643304,
"eval_loss": 0.10236399620771408,
"eval_precision": 0.7742331288343558,
"eval_recall": 0.8058748403575989,
"eval_runtime": 3.5311,
"eval_samples_per_second": 229.955,
"eval_steps_per_second": 28.886,
"step": 3000
},
{
"epoch": 9.94,
"learning_rate": 1.1363636363636364e-07,
"loss": 0.0044,
"step": 3500
},
{
"epoch": 9.94,
"eval_accuracy": 0.9832691814216064,
"eval_f1": 0.7871536523929471,
"eval_loss": 0.10687276721000671,
"eval_precision": 0.7763975155279503,
"eval_recall": 0.7982120051085568,
"eval_runtime": 3.5664,
"eval_samples_per_second": 227.682,
"eval_steps_per_second": 28.6,
"step": 3500
},
{
"epoch": 10.0,
"step": 3520,
"total_flos": 1150724100209448.0,
"train_loss": 0.03344021574170752,
"train_runtime": 609.2851,
"train_samples_per_second": 46.12,
"train_steps_per_second": 5.777
}
],
"logging_steps": 500,
"max_steps": 3520,
"num_train_epochs": 10,
"save_steps": 500,
"total_flos": 1150724100209448.0,
"trial_name": null,
"trial_params": null
}