m3_hierarchical_ner_ref_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
5cf5142
{
"best_metric": 0.9684392563769997,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/311-camembert-ner-hierarchical-loss-io/checkpoint-1200",
"epoch": 3.1496062992125986,
"global_step": 1200,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.9010175763182239,
"number": 519,
"precision": 0.8665480427046264,
"recall": 0.9383429672447013
},
"eval_ACT_L1": {
"f1": 0.9145539906103287,
"number": 503,
"precision": 0.8665480427046264,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9911894273127753,
"number": 678,
"precision": 0.9868421052631579,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9495472186287194,
"number": 761,
"precision": 0.935031847133758,
"recall": 0.9645203679369251
},
"eval_PER": {
"f1": 0.9402214022140221,
"number": 676,
"precision": 0.9381443298969072,
"recall": 0.9423076923076923
},
"eval_SPAT": {
"f1": 0.9390934844192635,
"number": 694,
"precision": 0.9233983286908078,
"recall": 0.9553314121037464
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9394240317775571,
"eval_accuracy-all": 0.956616186693148,
"eval_accuracy-das": 0.9525819265143992,
"eval_accuracy-l1": 0.9433962264150944,
"eval_accuracy-l2": 0.9698361469712016,
"eval_f1": 0.9469872537659327,
"eval_f1-all": 0.9354602663544563,
"eval_f1-das": 0.9454949944382648,
"eval_f1-l1": 0.9249482401656315,
"eval_f1-l2": 0.9491411249578983,
"eval_loss": 0.33225661516189575,
"eval_precision": 0.947261663286004,
"eval_precision-all": 0.9323220536756126,
"eval_precision-das": 0.940959409594096,
"eval_precision-l1": 0.9122001020929046,
"eval_precision-l2": 0.9591558883594282,
"eval_recall": 0.9467130031856357,
"eval_recall-all": 0.9386196769456682,
"eval_recall-das": 0.9500745156482862,
"eval_recall-l1": 0.9380577427821523,
"eval_recall-l2": 0.9393333333333334,
"eval_runtime": 20.7794,
"eval_samples_per_second": 32.532,
"eval_steps_per_second": 2.069,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.9138576779026217,
"number": 519,
"precision": 0.8888888888888888,
"recall": 0.9402697495183044
},
"eval_ACT_L1": {
"f1": 0.9277566539923954,
"number": 503,
"precision": 0.8888888888888888,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9874723655121592,
"number": 678,
"precision": 0.9867452135493373,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.2758620689655172,
"number": 30,
"precision": 0.2857142857142857,
"recall": 0.26666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9415542710340399,
"number": 761,
"precision": 0.9208542713567839,
"recall": 0.9632063074901446
},
"eval_PER": {
"f1": 0.9559471365638766,
"number": 676,
"precision": 0.9489795918367347,
"recall": 0.9630177514792899
},
"eval_SPAT": {
"f1": 0.9455830388692581,
"number": 694,
"precision": 0.9278779472954231,
"recall": 0.9639769452449568
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.5666666666666667,
"number": 33,
"precision": 0.6296296296296297,
"recall": 0.5151515151515151
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9484856007944389,
"eval_accuracy-all": 0.9626986097318768,
"eval_accuracy-das": 0.9611469712015889,
"eval_accuracy-l1": 0.9540714995034757,
"eval_accuracy-l2": 0.9713257199602781,
"eval_f1": 0.9447711949505092,
"eval_f1-all": 0.9391960528225222,
"eval_f1-das": 0.944280442804428,
"eval_f1-l1": 0.9339161738236049,
"eval_f1-l2": 0.9460359760159894,
"eval_loss": 0.24740029871463776,
"eval_precision": 0.9360432063672541,
"eval_precision-all": 0.9282845668387837,
"eval_precision-das": 0.9353070175438597,
"eval_precision-l1": 0.9153225806451613,
"eval_precision-l2": 0.9454061251664447,
"eval_recall": 0.9536634810309875,
"eval_recall-all": 0.950367107195301,
"eval_recall-das": 0.9534277198211625,
"eval_recall-l1": 0.9532808398950131,
"eval_recall-l2": 0.9466666666666667,
"eval_runtime": 8.6217,
"eval_samples_per_second": 78.406,
"eval_steps_per_second": 4.987,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9371428571428572,
"number": 519,
"precision": 0.9265536723163842,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9516441005802708,
"number": 503,
"precision": 0.9265536723163842,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9904481998530492,
"number": 678,
"precision": 0.986822840409956,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.2962962962962963,
"number": 30,
"precision": 0.3333333333333333,
"recall": 0.26666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9492187500000001,
"number": 761,
"precision": 0.9406451612903226,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9800443458980044,
"number": 676,
"precision": 0.9793205317577548,
"recall": 0.9807692307692307
},
"eval_SPAT": {
"f1": 0.9494661921708185,
"number": 694,
"precision": 0.9381153305203939,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8615384615384615,
"number": 33,
"precision": 0.875,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9577954319761668,
"eval_accuracy-all": 0.9672293942403177,
"eval_accuracy-das": 0.9703326713008937,
"eval_accuracy-l1": 0.961643495531281,
"eval_accuracy-l2": 0.9728152929493545,
"eval_f1": 0.9603587962962964,
"eval_f1-all": 0.9537876572097104,
"eval_f1-das": 0.9622886866059818,
"eval_f1-l1": 0.9511434511434511,
"eval_f1-l2": 0.957190635451505,
"eval_loss": 0.20228183269500732,
"eval_precision": 0.9595258745302111,
"eval_precision-all": 0.9498980483542091,
"eval_precision-das": 0.9596146721007781,
"eval_precision-l1": 0.9418425115800309,
"eval_precision-l2": 0.9604026845637584,
"eval_recall": 0.9611931653634521,
"eval_recall-all": 0.9577092511013215,
"eval_recall-das": 0.9649776453055141,
"eval_recall-l1": 0.9606299212598425,
"eval_recall-l2": 0.954,
"eval_runtime": 13.7481,
"eval_samples_per_second": 49.17,
"eval_steps_per_second": 3.128,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9320574162679425,
"number": 519,
"precision": 0.9258555133079848,
"recall": 0.9383429672447013
},
"eval_ACT_L1": {
"f1": 0.9530332681017614,
"number": 503,
"precision": 0.9383429672447013,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9926470588235294,
"number": 678,
"precision": 0.9897360703812317,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.18750000000000003,
"number": 30,
"precision": 0.17647058823529413,
"recall": 0.2
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9535036018336608,
"number": 761,
"precision": 0.9503916449086162,
"recall": 0.9566360052562418
},
"eval_PER": {
"f1": 0.967032967032967,
"number": 676,
"precision": 0.9579100145137881,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9663564781675018,
"number": 694,
"precision": 0.9601706970128022,
"recall": 0.9726224783861671
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.927536231884058,
"number": 33,
"precision": 0.8888888888888888,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9505958291956306,
"eval_accuracy-all": 0.9659260178748759,
"eval_accuracy-das": 0.9659880834160874,
"eval_accuracy-l1": 0.9558093346573983,
"eval_accuracy-l2": 0.9760427010923535,
"eval_f1": 0.955606803113289,
"eval_f1-all": 0.9539541002777371,
"eval_f1-das": 0.9637613826426314,
"eval_f1-l1": 0.9496103896103896,
"eval_f1-l2": 0.9595453025743899,
"eval_loss": 0.16856572031974792,
"eval_precision": 0.9512195121951219,
"eval_precision-all": 0.94965075669383,
"eval_precision-das": 0.9614386355209492,
"eval_precision-l1": 0.9398457583547558,
"eval_precision-l2": 0.9624413145539906,
"eval_recall": 0.9600347523892268,
"eval_recall-all": 0.9582966226138032,
"eval_recall-das": 0.9660953800298062,
"eval_recall-l1": 0.9595800524934384,
"eval_recall-l2": 0.9566666666666667,
"eval_runtime": 11.6651,
"eval_samples_per_second": 57.951,
"eval_steps_per_second": 3.686,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.3379,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9362511893434823,
"number": 519,
"precision": 0.924812030075188,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9616519174041297,
"number": 503,
"precision": 0.9513618677042801,
"recall": 0.9721669980119284
},
"eval_ACT_L2": {
"f1": 0.17647058823529413,
"number": 16,
"precision": 0.16666666666666666,
"recall": 0.1875
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.3823529411764707,
"number": 30,
"precision": 0.34210526315789475,
"recall": 0.43333333333333335
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9488010369410239,
"number": 761,
"precision": 0.9360613810741688,
"recall": 0.961892247043364
},
"eval_PER": {
"f1": 0.9764705882352941,
"number": 676,
"precision": 0.9707602339181286,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9529914529914529,
"number": 694,
"precision": 0.9422535211267605,
"recall": 0.9639769452449568
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7878787878787878,
"number": 33,
"precision": 0.7878787878787878,
"recall": 0.7878787878787878
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.952085402184707,
"eval_accuracy-all": 0.9604642502482622,
"eval_accuracy-das": 0.9714498510427011,
"eval_accuracy-l1": 0.9569265143992055,
"eval_accuracy-l2": 0.9640019860973188,
"eval_f1": 0.9596425482848083,
"eval_f1-all": 0.9529497450837582,
"eval_f1-das": 0.9628528974739969,
"eval_f1-l1": 0.9529992209815632,
"eval_f1-l2": 0.9528865295288654,
"eval_loss": 0.1725856363773346,
"eval_precision": 0.9552367288378766,
"eval_precision-all": 0.9453757225433526,
"eval_precision-das": 0.96,
"eval_precision-l1": 0.9429599177800617,
"eval_precision-l2": 0.9484808454425363,
"eval_recall": 0.9640891977990154,
"eval_recall-all": 0.9606461086637298,
"eval_recall-das": 0.9657228017883756,
"eval_recall-l1": 0.963254593175853,
"eval_recall-l2": 0.9573333333333334,
"eval_runtime": 16.0693,
"eval_samples_per_second": 42.068,
"eval_steps_per_second": 2.676,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9299242424242424,
"number": 519,
"precision": 0.9143389199255121,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.949514563106796,
"number": 503,
"precision": 0.9278937381404174,
"recall": 0.9721669980119284
},
"eval_ACT_L2": {
"f1": 0.15384615384615385,
"number": 16,
"precision": 0.2,
"recall": 0.125
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.3333333333333333,
"number": 30,
"precision": 0.3055555555555556,
"recall": 0.36666666666666664
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9640757674722404,
"number": 761,
"precision": 0.9584415584415584,
"recall": 0.9697766097240473
},
"eval_PER": {
"f1": 0.978629329403095,
"number": 676,
"precision": 0.9750367107195301,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9642346208869814,
"number": 694,
"precision": 0.9573863636363636,
"recall": 0.9711815561959655
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8857142857142858,
"number": 33,
"precision": 0.8378378378378378,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.951837140019861,
"eval_accuracy-all": 0.9630089374379345,
"eval_accuracy-das": 0.9715739821251241,
"eval_accuracy-l1": 0.9551886792452831,
"eval_accuracy-l2": 0.9708291956305859,
"eval_f1": 0.9633583381419504,
"eval_f1-all": 0.958692161728215,
"eval_f1-das": 0.9671431223315389,
"eval_f1-l1": 0.9540617700493121,
"eval_f1-l2": 0.9646430953969313,
"eval_loss": 0.1551111489534378,
"eval_precision": 0.959758551307847,
"eval_precision-all": 0.9529889727219966,
"eval_precision-das": 0.9637439881613022,
"eval_precision-l1": 0.9435318275154004,
"eval_precision-l2": 0.965287049399199,
"eval_recall": 0.9669852302345786,
"eval_recall-all": 0.9644640234948605,
"eval_recall-das": 0.9705663189269746,
"eval_recall-l1": 0.9648293963254593,
"eval_recall-l2": 0.964,
"eval_runtime": 7.6982,
"eval_samples_per_second": 87.813,
"eval_steps_per_second": 5.586,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9238005644402634,
"number": 519,
"precision": 0.9025735294117647,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9530332681017614,
"number": 503,
"precision": 0.9383429672447013,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.19512195121951217,
"number": 16,
"precision": 0.16,
"recall": 0.25
},
"eval_CARDINAL": {
"f1": 0.9941089837997055,
"number": 678,
"precision": 0.9926470588235294,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.33707865168539325,
"number": 30,
"precision": 0.2542372881355932,
"recall": 0.5
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.954308093994778,
"number": 761,
"precision": 0.9481193255512321,
"recall": 0.9605781865965834
},
"eval_PER": {
"f1": 0.9807976366322009,
"number": 676,
"precision": 0.9793510324483776,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9555236728837877,
"number": 694,
"precision": 0.9514285714285714,
"recall": 0.9596541786743515
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9411764705882354,
"number": 33,
"precision": 0.9142857142857143,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 5,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9544438927507448,
"eval_accuracy-all": 0.9669190665342602,
"eval_accuracy-das": 0.9714498510427011,
"eval_accuracy-l1": 0.9606504468718967,
"eval_accuracy-l2": 0.9731876861966237,
"eval_f1": 0.9572330654420207,
"eval_f1-all": 0.9528521536670547,
"eval_f1-das": 0.9665551839464882,
"eval_f1-l1": 0.948976948976949,
"eval_f1-l2": 0.9578213218199934,
"eval_loss": 0.14552079141139984,
"eval_precision": 0.9487908961593172,
"eval_precision-all": 0.944332275742717,
"eval_precision-das": 0.964047442550037,
"eval_precision-l1": 0.9366053169734151,
"eval_precision-l2": 0.9543348775645268,
"eval_recall": 0.9658268172603534,
"eval_recall-all": 0.9615271659324522,
"eval_recall-das": 0.9690760059612519,
"eval_recall-l1": 0.9616797900262467,
"eval_recall-l2": 0.9613333333333334,
"eval_runtime": 13.1454,
"eval_samples_per_second": 51.425,
"eval_steps_per_second": 3.271,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9493791786055396,
"number": 519,
"precision": 0.9412878787878788,
"recall": 0.9576107899807321
},
"eval_ACT_L1": {
"f1": 0.9760956175298805,
"number": 503,
"precision": 0.9780439121756487,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.3255813953488372,
"number": 16,
"precision": 0.25925925925925924,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9933677229182019,
"number": 678,
"precision": 0.9926362297496318,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.45569620253164556,
"number": 30,
"precision": 0.3673469387755102,
"recall": 0.6
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9652002626395274,
"number": 761,
"precision": 0.9645669291338582,
"recall": 0.9658344283837057
},
"eval_PER": {
"f1": 0.9830258302583026,
"number": 676,
"precision": 0.9808541973490427,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9676956209619526,
"number": 694,
"precision": 0.9642346208869814,
"recall": 0.9711815561959655
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8985507246376813,
"number": 33,
"precision": 0.8611111111111112,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.3636363636363636,
"number": 5,
"precision": 0.3333333333333333,
"recall": 0.4
},
"eval_accuracy": 0.9563058589870904,
"eval_accuracy-all": 0.9666708043694141,
"eval_accuracy-das": 0.9784011916583912,
"eval_accuracy-l1": 0.9617676266137041,
"eval_accuracy-l2": 0.9715739821251241,
"eval_f1": 0.965945165945166,
"eval_f1-all": 0.9636124506795265,
"eval_f1-das": 0.9720878302940081,
"eval_f1-l1": 0.9642577615444821,
"eval_f1-l2": 0.9627906976744186,
"eval_loss": 0.14274396002292633,
"eval_precision": 0.9626114466494105,
"eval_precision-all": 0.9589877835951134,
"eval_precision-das": 0.971003717472119,
"eval_precision-l1": 0.9585062240663901,
"eval_precision-l2": 0.9596026490066225,
"eval_recall": 0.9693020561830292,
"eval_recall-all": 0.9682819383259912,
"eval_recall-das": 0.9731743666169895,
"eval_recall-l1": 0.9700787401574803,
"eval_recall-l2": 0.966,
"eval_runtime": 32.3788,
"eval_samples_per_second": 20.878,
"eval_steps_per_second": 1.328,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9467680608365019,
"number": 519,
"precision": 0.9343339587242027,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9693372898120672,
"number": 503,
"precision": 0.9645669291338582,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.39024390243902435,
"number": 16,
"precision": 0.32,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.5333333333333333,
"number": 30,
"precision": 0.4444444444444444,
"recall": 0.6666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.953063885267275,
"number": 761,
"precision": 0.9456662354463131,
"recall": 0.9605781865965834
},
"eval_PER": {
"f1": 0.9918699186991871,
"number": 676,
"precision": 0.9911373707533235,
"recall": 0.992603550295858
},
"eval_SPAT": {
"f1": 0.9627507163323783,
"number": 694,
"precision": 0.9572649572649573,
"recall": 0.968299711815562
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9411764705882354,
"number": 33,
"precision": 0.9142857142857143,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.26666666666666666,
"number": 5,
"precision": 0.2,
"recall": 0.4
},
"eval_accuracy": 0.958291956305859,
"eval_accuracy-all": 0.9676017874875869,
"eval_accuracy-das": 0.9782770605759682,
"eval_accuracy-l1": 0.9653674280039722,
"eval_accuracy-l2": 0.9698361469712016,
"eval_f1": 0.9656065620952655,
"eval_f1-all": 0.9622504008162076,
"eval_f1-das": 0.9712377064390424,
"eval_f1-l1": 0.9658587438102684,
"eval_f1-l2": 0.9576719576719577,
"eval_loss": 0.13768324255943298,
"eval_precision": 0.9596681922196796,
"eval_precision-all": 0.9551504629629629,
"eval_precision-das": 0.9674676524953789,
"eval_precision-l1": 0.9591097308488613,
"eval_precision-l2": 0.9501312335958005,
"eval_recall": 0.9716188821314798,
"eval_recall-all": 0.9694566813509545,
"eval_recall-das": 0.9750372578241431,
"eval_recall-l1": 0.9727034120734908,
"eval_recall-l2": 0.9653333333333334,
"eval_runtime": 14.3312,
"eval_samples_per_second": 47.17,
"eval_steps_per_second": 3.0,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.1289,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9370229007633587,
"number": 519,
"precision": 0.9281663516068053,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9640718562874252,
"number": 503,
"precision": 0.9679358717434869,
"recall": 0.9602385685884692
},
"eval_ACT_L2": {
"f1": 0.3478260869565218,
"number": 16,
"precision": 0.26666666666666666,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.5063291139240507,
"number": 30,
"precision": 0.40816326530612246,
"recall": 0.6666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9711286089238845,
"number": 761,
"precision": 0.9698558322411533,
"recall": 0.9724047306176085
},
"eval_PER": {
"f1": 0.9867060561299853,
"number": 676,
"precision": 0.9852507374631269,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9676956209619526,
"number": 694,
"precision": 0.9642346208869814,
"recall": 0.9711815561959655
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9142857142857143,
"number": 33,
"precision": 0.8648648648648649,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.4000000000000001,
"number": 5,
"precision": 0.4,
"recall": 0.4
},
"eval_accuracy": 0.9533267130089375,
"eval_accuracy-all": 0.9641881827209533,
"eval_accuracy-das": 0.9762909632571996,
"eval_accuracy-l1": 0.958291956305859,
"eval_accuracy-l2": 0.9700844091360477,
"eval_f1": 0.9668492360910925,
"eval_f1-all": 0.9646508910312591,
"eval_f1-das": 0.972470238095238,
"eval_f1-l1": 0.9634464751958223,
"eval_f1-l2": 0.9661803713527852,
"eval_loss": 0.1481187343597412,
"eval_precision": 0.9624103299856528,
"eval_precision-all": 0.959604766056379,
"eval_precision-das": 0.9710252600297177,
"eval_precision-l1": 0.9584415584415584,
"eval_precision-l2": 0.9610817941952506,
"eval_recall": 0.9713292788879235,
"eval_recall-all": 0.9697503671071953,
"eval_recall-das": 0.973919523099851,
"eval_recall-l1": 0.968503937007874,
"eval_recall-l2": 0.9713333333333334,
"eval_runtime": 20.9824,
"eval_samples_per_second": 32.217,
"eval_steps_per_second": 2.049,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9523809523809523,
"number": 519,
"precision": 0.9416195856873822,
"recall": 0.9633911368015414
},
"eval_ACT_L1": {
"f1": 0.9713721618953604,
"number": 503,
"precision": 0.9647058823529412,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.4324324324324324,
"number": 16,
"precision": 0.38095238095238093,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9911373707533235,
"number": 678,
"precision": 0.992603550295858,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.4864864864864865,
"number": 30,
"precision": 0.4090909090909091,
"recall": 0.6
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9648437500000001,
"number": 761,
"precision": 0.9561290322580646,
"recall": 0.973718791064389
},
"eval_PER": {
"f1": 0.9874353288987435,
"number": 676,
"precision": 0.9867060561299852,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.966113914924297,
"number": 694,
"precision": 0.9668109668109668,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9253731343283583,
"number": 33,
"precision": 0.9117647058823529,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.5333333333333333,
"number": 5,
"precision": 0.4,
"recall": 0.8
},
"eval_accuracy": 0.9617676266137041,
"eval_accuracy-all": 0.9718843098311817,
"eval_accuracy-das": 0.9786494538232373,
"eval_accuracy-l1": 0.9664846077457795,
"eval_accuracy-l2": 0.9772840119165839,
"eval_f1": 0.9666474985623923,
"eval_f1-all": 0.9650942018402219,
"eval_f1-das": 0.9727222119131563,
"eval_f1-l1": 0.9652650822669104,
"eval_f1-l2": 0.9648774022531478,
"eval_loss": 0.13178446888923645,
"eval_precision": 0.9597487867542107,
"eval_precision-all": 0.9599070307960488,
"eval_precision-das": 0.9689463955637708,
"eval_precision-l1": 0.9604989604989606,
"eval_precision-l2": 0.9591567852437418,
"eval_recall": 0.9736461048363741,
"eval_recall-all": 0.970337738619677,
"eval_recall-das": 0.9765275707898659,
"eval_recall-l1": 0.9700787401574803,
"eval_recall-l2": 0.9706666666666667,
"eval_runtime": 21.6072,
"eval_samples_per_second": 31.286,
"eval_steps_per_second": 1.99,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9504761904761905,
"number": 519,
"precision": 0.9397363465160076,
"recall": 0.9614643545279383
},
"eval_ACT_L1": {
"f1": 0.971201588877855,
"number": 503,
"precision": 0.9702380952380952,
"recall": 0.9721669980119284
},
"eval_ACT_L2": {
"f1": 0.4651162790697674,
"number": 16,
"precision": 0.37037037037037035,
"recall": 0.625
},
"eval_CARDINAL": {
"f1": 0.9926253687315634,
"number": 678,
"precision": 0.9926253687315634,
"recall": 0.9926253687315634
},
"eval_DESC": {
"f1": 0.5263157894736841,
"number": 30,
"precision": 0.43478260869565216,
"recall": 0.6666666666666666
},
"eval_FT": {
"f1": 0.25,
"number": 7,
"precision": 1.0,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9691803278688523,
"number": 761,
"precision": 0.9672774869109948,
"recall": 0.9710906701708278
},
"eval_PER": {
"f1": 0.9852289512555391,
"number": 676,
"precision": 0.9837758112094396,
"recall": 0.9866863905325444
},
"eval_SPAT": {
"f1": 0.9595959595959597,
"number": 694,
"precision": 0.9609826589595376,
"recall": 0.9582132564841499
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8985507246376813,
"number": 33,
"precision": 0.8611111111111112,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.4444444444444445,
"number": 5,
"precision": 0.5,
"recall": 0.4
},
"eval_accuracy": 0.9602780536246276,
"eval_accuracy-all": 0.9703326713008937,
"eval_accuracy-das": 0.9793942403177756,
"eval_accuracy-l1": 0.9651191658391262,
"eval_accuracy-l2": 0.9755461767626614,
"eval_f1": 0.9684392563769997,
"eval_f1-all": 0.9647403072421361,
"eval_f1-das": 0.9741395348837208,
"eval_f1-l1": 0.9626143790849672,
"eval_f1-l2": 0.9674418604651163,
"eval_loss": 0.13072313368320465,
"eval_precision": 0.963855421686747,
"eval_precision-all": 0.9612244897959183,
"eval_precision-das": 0.9728725380899294,
"eval_precision-l1": 0.9588541666666667,
"eval_precision-l2": 0.9642384105960264,
"eval_recall": 0.9730668983492615,
"eval_recall-all": 0.9682819383259912,
"eval_recall-das": 0.9754098360655737,
"eval_recall-l1": 0.9664041994750656,
"eval_recall-l2": 0.9706666666666667,
"eval_runtime": 7.9998,
"eval_samples_per_second": 84.502,
"eval_steps_per_second": 5.375,
"step": 1200
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 486860284369728.0,
"trial_name": null,
"trial_params": null
}