NER_skill_extractor / trainer_state.json
wt3639's picture
Upload 11 files
54ca777 verified
{
"best_metric": 0.21624045073986053,
"best_model_checkpoint": "/hpcwork/vg380347/NER/EduGBERT/checkpoint-550",
"epoch": 7.446808510638298,
"eval_steps": 50,
"global_step": 1050,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.35,
"eval_f1": 0.5815712900096993,
"eval_loss": 0.3045153319835663,
"eval_precision": 0.5216332212040367,
"eval_recall": 0.6570718877849211,
"eval_runtime": 7.1562,
"eval_samples_per_second": 629.381,
"eval_steps_per_second": 5.031,
"step": 50
},
{
"epoch": 0.71,
"eval_f1": 0.6822522225880804,
"eval_loss": 0.25079214572906494,
"eval_precision": 0.6210286536386525,
"eval_recall": 0.7568673290473408,
"eval_runtime": 7.2954,
"eval_samples_per_second": 617.376,
"eval_steps_per_second": 4.935,
"step": 100
},
{
"epoch": 1.06,
"eval_f1": 0.7016087182148418,
"eval_loss": 0.24814821779727936,
"eval_precision": 0.6308912739150724,
"eval_recall": 0.7901811805961426,
"eval_runtime": 7.1783,
"eval_samples_per_second": 627.45,
"eval_steps_per_second": 5.015,
"step": 150
},
{
"epoch": 1.42,
"eval_f1": 0.7199271355149306,
"eval_loss": 0.2445540428161621,
"eval_precision": 0.6488800281458895,
"eval_recall": 0.8084453535943893,
"eval_runtime": 7.1384,
"eval_samples_per_second": 630.95,
"eval_steps_per_second": 5.043,
"step": 200
},
{
"epoch": 1.77,
"eval_f1": 0.722252082773448,
"eval_loss": 0.22964715957641602,
"eval_precision": 0.6685323383084577,
"eval_recall": 0.7853594389246055,
"eval_runtime": 7.434,
"eval_samples_per_second": 605.866,
"eval_steps_per_second": 4.843,
"step": 250
},
{
"epoch": 2.13,
"eval_f1": 0.7319960997353392,
"eval_loss": 0.21758420765399933,
"eval_precision": 0.6993611924407772,
"eval_recall": 0.7678258328462887,
"eval_runtime": 7.1469,
"eval_samples_per_second": 630.207,
"eval_steps_per_second": 5.037,
"step": 300
},
{
"epoch": 2.48,
"eval_f1": 0.7406113537117905,
"eval_loss": 0.22185301780700684,
"eval_precision": 0.6854868797413257,
"eval_recall": 0.8053769725306839,
"eval_runtime": 7.1574,
"eval_samples_per_second": 629.281,
"eval_steps_per_second": 5.03,
"step": 350
},
{
"epoch": 2.84,
"eval_f1": 0.7412340309866812,
"eval_loss": 0.2164618819952011,
"eval_precision": 0.6928353658536586,
"eval_recall": 0.7969023962594973,
"eval_runtime": 7.1409,
"eval_samples_per_second": 630.735,
"eval_steps_per_second": 5.041,
"step": 400
},
{
"epoch": 3.19,
"eval_f1": 0.7499483221938952,
"eval_loss": 0.2220638245344162,
"eval_precision": 0.7096101186595384,
"eval_recall": 0.7951490356516657,
"eval_runtime": 7.4483,
"eval_samples_per_second": 604.703,
"eval_steps_per_second": 4.833,
"step": 450
},
{
"epoch": 3.55,
"learning_rate": 4.822695035460993e-06,
"loss": 0.2581,
"step": 500
},
{
"epoch": 3.55,
"eval_f1": 0.7439247452312516,
"eval_loss": 0.2487693727016449,
"eval_precision": 0.6727315689981096,
"eval_recall": 0.8319696084161309,
"eval_runtime": 7.1497,
"eval_samples_per_second": 629.957,
"eval_steps_per_second": 5.035,
"step": 500
},
{
"epoch": 3.9,
"eval_f1": 0.7555155958226711,
"eval_loss": 0.21624045073986053,
"eval_precision": 0.717268548916612,
"eval_recall": 0.7980713033313852,
"eval_runtime": 7.1536,
"eval_samples_per_second": 629.612,
"eval_steps_per_second": 5.032,
"step": 550
},
{
"epoch": 4.26,
"eval_f1": 0.7588671611598112,
"eval_loss": 0.23951853811740875,
"eval_precision": 0.7046080641121963,
"eval_recall": 0.8221800116890707,
"eval_runtime": 7.0397,
"eval_samples_per_second": 639.8,
"eval_steps_per_second": 5.114,
"step": 600
},
{
"epoch": 4.61,
"eval_f1": 0.7562726374711887,
"eval_loss": 0.24661774933338165,
"eval_precision": 0.688406665867402,
"eval_recall": 0.8389830508474576,
"eval_runtime": 7.1388,
"eval_samples_per_second": 630.916,
"eval_steps_per_second": 5.043,
"step": 650
},
{
"epoch": 4.96,
"eval_f1": 0.7577822311289245,
"eval_loss": 0.24025806784629822,
"eval_precision": 0.6980063992124046,
"eval_recall": 0.8287551139684395,
"eval_runtime": 7.1329,
"eval_samples_per_second": 631.441,
"eval_steps_per_second": 5.047,
"step": 700
},
{
"epoch": 5.32,
"eval_f1": 0.7517815517815518,
"eval_loss": 0.261866956949234,
"eval_precision": 0.6907355280871375,
"eval_recall": 0.8246639392168322,
"eval_runtime": 7.3254,
"eval_samples_per_second": 614.846,
"eval_steps_per_second": 4.914,
"step": 750
},
{
"epoch": 5.67,
"eval_f1": 0.7615306467998646,
"eval_loss": 0.2429821491241455,
"eval_precision": 0.7097588688296932,
"eval_recall": 0.8214494447691408,
"eval_runtime": 7.1352,
"eval_samples_per_second": 631.236,
"eval_steps_per_second": 5.045,
"step": 800
},
{
"epoch": 6.03,
"eval_f1": 0.7594460131773565,
"eval_loss": 0.24021703004837036,
"eval_precision": 0.7033623910336239,
"eval_recall": 0.8252483927527762,
"eval_runtime": 7.155,
"eval_samples_per_second": 629.489,
"eval_steps_per_second": 5.031,
"step": 850
},
{
"epoch": 6.38,
"eval_f1": 0.7594716019580233,
"eval_loss": 0.25845229625701904,
"eval_precision": 0.70182178708638,
"eval_recall": 0.8274400935125658,
"eval_runtime": 7.1743,
"eval_samples_per_second": 627.796,
"eval_steps_per_second": 5.018,
"step": 900
},
{
"epoch": 6.74,
"eval_f1": 0.7634940255459416,
"eval_loss": 0.2463415563106537,
"eval_precision": 0.7202643171806168,
"eval_recall": 0.8122443015780245,
"eval_runtime": 7.1315,
"eval_samples_per_second": 631.568,
"eval_steps_per_second": 5.048,
"step": 950
},
{
"epoch": 7.09,
"learning_rate": 4.645390070921986e-06,
"loss": 0.1517,
"step": 1000
},
{
"epoch": 7.09,
"eval_f1": 0.7641669494401085,
"eval_loss": 0.25761693716049194,
"eval_precision": 0.7134710429603346,
"eval_recall": 0.8226183518410286,
"eval_runtime": 7.1379,
"eval_samples_per_second": 630.995,
"eval_steps_per_second": 5.043,
"step": 1000
},
{
"epoch": 7.45,
"eval_f1": 0.7703476197124111,
"eval_loss": 0.2536332607269287,
"eval_precision": 0.7375033413525796,
"eval_recall": 0.8062536528345996,
"eval_runtime": 7.1375,
"eval_samples_per_second": 631.035,
"eval_steps_per_second": 5.044,
"step": 1050
}
],
"logging_steps": 500,
"max_steps": 14100,
"num_train_epochs": 100,
"save_steps": 50,
"total_flos": 6.408198647855674e+16,
"trial_name": null,
"trial_params": null
}