longformer-full_labels / checkpoint-162 /trainer_state.json
Theoreticallyhugo's picture
Training in progress, epoch 2, checkpoint
e3efc2f verified
{
"best_metric": 0.5138605833053589,
"best_model_checkpoint": "longformer-full_labels/checkpoint-162",
"epoch": 2.0,
"eval_steps": 500,
"global_step": 162,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_B-Claim": {
"f1-score": 0.006993006993006993,
"precision": 0.5,
"recall": 0.0035211267605633804,
"support": 284.0
},
"eval_B-MajorClaim": {
"f1-score": 0.0,
"precision": 0.0,
"recall": 0.0,
"support": 141.0
},
"eval_B-Premise": {
"f1-score": 0.6336375488917861,
"precision": 0.5883777239709443,
"recall": 0.6864406779661016,
"support": 708.0
},
"eval_I-Claim": {
"f1-score": 0.37228850325379614,
"precision": 0.41618672324946954,
"recall": 0.3367672308069659,
"support": 4077.0
},
"eval_I-MajorClaim": {
"f1-score": 0.49153013051930017,
"precision": 0.5611921369689283,
"recall": 0.43725296442687744,
"support": 2024.0
},
"eval_I-Premise": {
"f1-score": 0.846019669697532,
"precision": 0.7746890504995582,
"recall": 0.9318181818181818,
"support": 12232.0
},
"eval_O": {
"f1-score": 0.8650519031141869,
"precision": 0.9111808904340025,
"recall": 0.8233684637211187,
"support": 9868.0
},
"eval_accuracy": 0.7591191109292971,
"eval_loss": 0.6442636251449585,
"eval_macro avg": {
"f1-score": 0.4593601089242298,
"precision": 0.535946646446129,
"recall": 0.4598812350714013,
"support": 29334.0
},
"eval_runtime": 6.1153,
"eval_samples_per_second": 13.082,
"eval_steps_per_second": 1.635,
"eval_weighted avg": {
"f1-score": 0.7448054609057474,
"precision": 0.7451676238152983,
"recall": 0.7591191109292971,
"support": 29334.0
},
"step": 81
},
{
"epoch": 2.0,
"eval_B-Claim": {
"f1-score": 0.47385620915032683,
"precision": 0.4420731707317073,
"recall": 0.5105633802816901,
"support": 284.0
},
"eval_B-MajorClaim": {
"f1-score": 0.5267489711934156,
"precision": 0.6274509803921569,
"recall": 0.45390070921985815,
"support": 141.0
},
"eval_B-Premise": {
"f1-score": 0.7686170212765958,
"precision": 0.7261306532663316,
"recall": 0.8163841807909604,
"support": 708.0
},
"eval_I-Claim": {
"f1-score": 0.5068787075602675,
"precision": 0.5221008840353614,
"recall": 0.49251900907530044,
"support": 4077.0
},
"eval_I-MajorClaim": {
"f1-score": 0.6644462947543713,
"precision": 0.5741007194244604,
"recall": 0.7885375494071146,
"support": 2024.0
},
"eval_I-Premise": {
"f1-score": 0.8735948241002829,
"precision": 0.8642982877260361,
"recall": 0.8830935251798561,
"support": 12232.0
},
"eval_O": {
"f1-score": 0.8825588796944621,
"precision": 0.925979519145147,
"recall": 0.8430279691933522,
"support": 9868.0
},
"eval_accuracy": 0.8015272380173177,
"eval_loss": 0.5138605833053589,
"eval_macro avg": {
"f1-score": 0.6709572725328175,
"precision": 0.668876316388743,
"recall": 0.6840037604497332,
"support": 29334.0
},
"eval_runtime": 6.1482,
"eval_samples_per_second": 13.012,
"eval_steps_per_second": 1.627,
"eval_weighted avg": {
"f1-score": 0.8031401896750007,
"precision": 0.8089032379475054,
"recall": 0.8015272380173177,
"support": 29334.0
},
"step": 162
}
],
"logging_steps": 500,
"max_steps": 1620,
"num_input_tokens_seen": 0,
"num_train_epochs": 20,
"save_steps": 500,
"total_flos": 287581625436000.0,
"train_batch_size": 4,
"trial_name": null,
"trial_params": null
}