ner_FT-checkpoint-2387debert / trainer_state.json
Aspik101's picture
Upload folder using huggingface_hub
9b82ad5 verified
{
"best_metric": 0.8816773017319963,
"best_model_checkpoint": "ft/checkpoint-2046",
"epoch": 7.0,
"eval_steps": 500,
"global_step": 2387,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_f1": 0.25525268677252616,
"eval_loss": 0.0030135156121104956,
"eval_precision": 0.42857142857142855,
"eval_recall": 0.25118934348239774,
"eval_runtime": 46.7461,
"eval_samples_per_second": 29.136,
"eval_steps_per_second": 1.84,
"step": 341
},
{
"epoch": 1.47,
"learning_rate": 1.8973984286913584e-05,
"loss": 0.0524,
"step": 500
},
{
"epoch": 2.0,
"eval_f1": 0.7398991743990649,
"eval_loss": 0.0016016679583117366,
"eval_precision": 0.7088262056414922,
"eval_recall": 0.7411988582302569,
"eval_runtime": 46.8135,
"eval_samples_per_second": 29.094,
"eval_steps_per_second": 1.837,
"step": 682
},
{
"epoch": 2.93,
"learning_rate": 1.607725459161122e-05,
"loss": 0.0014,
"step": 1000
},
{
"epoch": 3.0,
"eval_f1": 0.868271080619986,
"eval_loss": 0.0015651908470317721,
"eval_precision": 0.7221350078492935,
"eval_recall": 0.8753568030447193,
"eval_runtime": 46.8355,
"eval_samples_per_second": 29.081,
"eval_steps_per_second": 1.836,
"step": 1023
},
{
"epoch": 4.0,
"eval_f1": 0.7916895679894471,
"eval_loss": 0.0016834472771734,
"eval_precision": 0.8179133858267716,
"eval_recall": 0.7906755470980019,
"eval_runtime": 46.5374,
"eval_samples_per_second": 29.267,
"eval_steps_per_second": 1.848,
"step": 1364
},
{
"epoch": 4.4,
"learning_rate": 1.1913616304731064e-05,
"loss": 0.0007,
"step": 1500
},
{
"epoch": 5.0,
"eval_f1": 0.8055126791620728,
"eval_loss": 0.001440966036170721,
"eval_precision": 0.9016042780748663,
"eval_recall": 0.80209324452902,
"eval_runtime": 46.5939,
"eval_samples_per_second": 29.231,
"eval_steps_per_second": 1.846,
"step": 1705
},
{
"epoch": 5.87,
"learning_rate": 7.3510516768689765e-06,
"loss": 0.0004,
"step": 2000
},
{
"epoch": 6.0,
"eval_f1": 0.8816773017319963,
"eval_loss": 0.001409668242558837,
"eval_precision": 0.808695652173913,
"eval_recall": 0.884871550903901,
"eval_runtime": 46.5762,
"eval_samples_per_second": 29.242,
"eval_steps_per_second": 1.846,
"step": 2046
},
{
"epoch": 7.0,
"eval_f1": 0.8618469193619203,
"eval_loss": 0.0015025387983769178,
"eval_precision": 0.8571428571428571,
"eval_recall": 0.8620361560418649,
"eval_runtime": 46.722,
"eval_samples_per_second": 29.151,
"eval_steps_per_second": 1.841,
"step": 2387
}
],
"logging_steps": 500,
"max_steps": 3410,
"num_input_tokens_seen": 0,
"num_train_epochs": 10,
"save_steps": 500,
"total_flos": 1.3498705156498326e+16,
"train_batch_size": 16,
"trial_name": null,
"trial_params": null
}