m3_hierarchical_ner_ocr_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
5becf8f
{
"best_metric": 0.9663670629167874,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_3/tmp/321-camembert-ner-hierarchical-loss-io/checkpoint-2000",
"epoch": 5.2493438320209975,
"global_step": 2000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.8378378378378379,
"number": 519,
"precision": 0.7868020304568528,
"recall": 0.8959537572254336
},
"eval_ACT_L1": {
"f1": 0.850091407678245,
"number": 503,
"precision": 0.7868020304568528,
"recall": 0.9244532803180915
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9687726942628904,
"number": 678,
"precision": 0.9542203147353362,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.908150064683053,
"number": 761,
"precision": 0.8942675159235669,
"recall": 0.9224704336399474
},
"eval_PER": {
"f1": 0.9078947368421053,
"number": 676,
"precision": 0.8973988439306358,
"recall": 0.9186390532544378
},
"eval_SPAT": {
"f1": 0.9194915254237289,
"number": 694,
"precision": 0.9016620498614959,
"recall": 0.9380403458213257
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.926600860541635,
"eval_accuracy-all": 0.950582131106049,
"eval_accuracy-das": 0.9424196405973171,
"eval_accuracy-l1": 0.9369779802581625,
"eval_accuracy-l2": 0.9641862819539357,
"eval_f1": 0.9032535473699298,
"eval_f1-all": 0.9009427121102248,
"eval_f1-das": 0.8991195891415995,
"eval_f1-l1": 0.8884910485933504,
"eval_f1-l2": 0.917252931323283,
"eval_loss": 0.3965435028076172,
"eval_precision": 0.8908679672038451,
"eval_precision-all": 0.8902264259100029,
"eval_precision-das": 0.8857968919407301,
"eval_precision-l1": 0.8663341645885286,
"eval_precision-l2": 0.9225067385444744,
"eval_recall": 0.9159883720930233,
"eval_recall-all": 0.9119201409277745,
"eval_recall-das": 0.9128491620111732,
"eval_recall-l1": 0.9118110236220472,
"eval_recall-l2": 0.9120586275816123,
"eval_runtime": 5.6993,
"eval_samples_per_second": 118.611,
"eval_steps_per_second": 7.545,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.888888888888889,
"number": 519,
"precision": 0.8556149732620321,
"recall": 0.9248554913294798
},
"eval_ACT_L1": {
"f1": 0.9022556390977442,
"number": 503,
"precision": 0.8556149732620321,
"recall": 0.9542743538767395
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9744338933528124,
"number": 678,
"precision": 0.9652677279305355,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9430255402750493,
"number": 761,
"precision": 0.9399477806788512,
"recall": 0.9461235216819974
},
"eval_PER": {
"f1": 0.943952802359882,
"number": 676,
"precision": 0.9411764705882353,
"recall": 0.9467455621301775
},
"eval_SPAT": {
"f1": 0.9349535382416011,
"number": 694,
"precision": 0.9276595744680851,
"recall": 0.9423631123919308
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9360921285750443,
"eval_accuracy-all": 0.955960516324981,
"eval_accuracy-das": 0.9502657555049354,
"eval_accuracy-l1": 0.9448240951657808,
"eval_accuracy-l2": 0.9670969374841812,
"eval_f1": 0.931761967117707,
"eval_f1-all": 0.927931894906796,
"eval_f1-das": 0.9288500835965074,
"eval_f1-l1": 0.9203631647211413,
"eval_f1-l2": 0.9377958079783638,
"eval_loss": 0.279910147190094,
"eval_precision": 0.9327119137780367,
"eval_precision-all": 0.9277957147050191,
"eval_precision-das": 0.9266123054114158,
"eval_precision-l1": 0.9097435897435897,
"eval_precision-l2": 0.9519560741249142,
"eval_recall": 0.9308139534883721,
"eval_recall-all": 0.9280681150910158,
"eval_recall-das": 0.931098696461825,
"eval_recall-l1": 0.9312335958005249,
"eval_recall-l2": 0.9240506329113924,
"eval_runtime": 5.3228,
"eval_samples_per_second": 127.0,
"eval_steps_per_second": 8.078,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9224880382775119,
"number": 519,
"precision": 0.9163498098859315,
"recall": 0.928709055876686
},
"eval_ACT_L1": {
"f1": 0.9368318756073858,
"number": 503,
"precision": 0.9163498098859315,
"recall": 0.9582504970178927
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9773226042428675,
"number": 678,
"precision": 0.969521044992743,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.07692307692307691,
"number": 30,
"precision": 0.09090909090909091,
"recall": 0.06666666666666667
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9381107491856677,
"number": 761,
"precision": 0.9302325581395349,
"recall": 0.9461235216819974
},
"eval_PER": {
"f1": 0.9358879882092852,
"number": 676,
"precision": 0.9324522760646109,
"recall": 0.9393491124260355
},
"eval_SPAT": {
"f1": 0.9390070921985816,
"number": 694,
"precision": 0.9245810055865922,
"recall": 0.9538904899135446
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.3921568627450981,
"number": 33,
"precision": 0.5555555555555556,
"recall": 0.30303030303030304
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9426727410782081,
"eval_accuracy-all": 0.9577322196912175,
"eval_accuracy-das": 0.960389774740572,
"eval_accuracy-l1": 0.9483675018982536,
"eval_accuracy-l2": 0.9670969374841812,
"eval_f1": 0.939160737621606,
"eval_f1-all": 0.9306206088992975,
"eval_f1-das": 0.9402568397543273,
"eval_f1-l1": 0.925194805194805,
"eval_f1-l2": 0.937625754527163,
"eval_loss": 0.23822064697742462,
"eval_precision": 0.938207136640557,
"eval_precision-all": 0.9279042615294805,
"eval_precision-das": 0.9397321428571429,
"eval_precision-l1": 0.9156812339331619,
"eval_precision-l2": 0.9439567859554355,
"eval_recall": 0.9401162790697675,
"eval_recall-all": 0.9333529066353494,
"eval_recall-das": 0.9407821229050279,
"eval_recall-l1": 0.9349081364829396,
"eval_recall-l2": 0.9313790806129247,
"eval_runtime": 5.4317,
"eval_samples_per_second": 124.456,
"eval_steps_per_second": 7.917,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9135802469135802,
"number": 519,
"precision": 0.900749063670412,
"recall": 0.9267822736030829
},
"eval_ACT_L1": {
"f1": 0.9276759884281581,
"number": 503,
"precision": 0.900749063670412,
"recall": 0.9562624254473161
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9852941176470589,
"number": 678,
"precision": 0.9824046920821115,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.16129032258064516,
"number": 30,
"precision": 0.15625,
"recall": 0.16666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9414858645627877,
"number": 761,
"precision": 0.9421052631578948,
"recall": 0.9408672798948752
},
"eval_PER": {
"f1": 0.9646539027982327,
"number": 676,
"precision": 0.9604105571847508,
"recall": 0.9689349112426036
},
"eval_SPAT": {
"f1": 0.9440459110473458,
"number": 694,
"precision": 0.94,
"recall": 0.9481268011527377
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7118644067796609,
"number": 33,
"precision": 0.8076923076923077,
"recall": 0.6363636363636364
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9511516071880537,
"eval_accuracy-all": 0.9660212604403948,
"eval_accuracy-das": 0.9677296886864085,
"eval_accuracy-l1": 0.9574791192103265,
"eval_accuracy-l2": 0.9745634016704632,
"eval_f1": 0.9458987783595114,
"eval_f1-all": 0.9399003224860745,
"eval_f1-das": 0.9493293591654248,
"eval_f1-l1": 0.9338178043083311,
"eval_f1-l2": 0.9477938699898956,
"eval_loss": 0.18405073881149292,
"eval_precision": 0.9464493597206054,
"eval_precision-all": 0.9385245901639344,
"eval_precision-das": 0.9496831904584421,
"eval_precision-l1": 0.9235112936344969,
"eval_precision-l2": 0.9584468664850136,
"eval_recall": 0.9453488372093023,
"eval_recall-all": 0.9412800939518496,
"eval_recall-das": 0.948975791433892,
"eval_recall-l1": 0.9443569553805774,
"eval_recall-l2": 0.9373750832778148,
"eval_runtime": 5.2971,
"eval_samples_per_second": 127.616,
"eval_steps_per_second": 8.118,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.3703,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9379178605539636,
"number": 519,
"precision": 0.9299242424242424,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9524733268671194,
"number": 503,
"precision": 0.9299242424242424,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9816041206769685,
"number": 678,
"precision": 0.9794419970631424,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.22727272727272724,
"number": 30,
"precision": 0.35714285714285715,
"recall": 0.16666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9286640726329443,
"number": 761,
"precision": 0.9167733674775929,
"recall": 0.9408672798948752
},
"eval_PER": {
"f1": 0.960294117647059,
"number": 676,
"precision": 0.9546783625730995,
"recall": 0.9659763313609467
},
"eval_SPAT": {
"f1": 0.9291784702549575,
"number": 694,
"precision": 0.9136490250696379,
"recall": 0.9452449567723343
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7419354838709677,
"number": 33,
"precision": 0.7931034482758621,
"recall": 0.696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.951784358390281,
"eval_accuracy-all": 0.964123006833713,
"eval_accuracy-das": 0.9651986838774994,
"eval_accuracy-l1": 0.9583649708934447,
"eval_accuracy-l2": 0.9698810427739812,
"eval_f1": 0.9481932956029604,
"eval_f1-all": 0.9384772760485167,
"eval_f1-das": 0.9487940630797775,
"eval_f1-l1": 0.9379059495972979,
"eval_f1-l2": 0.9392117568470274,
"eval_loss": 0.20227569341659546,
"eval_precision": 0.9466821211243118,
"eval_precision-all": 0.9342449810881582,
"eval_precision-das": 0.945286506469501,
"eval_precision-l1": 0.9284979423868313,
"eval_precision-l2": 0.941728064300067,
"eval_recall": 0.9497093023255814,
"eval_recall-all": 0.9427480916030534,
"eval_recall-das": 0.9523277467411546,
"eval_recall-l1": 0.94750656167979,
"eval_recall-l2": 0.9367088607594937,
"eval_runtime": 5.4983,
"eval_samples_per_second": 122.948,
"eval_steps_per_second": 7.821,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9351145038167938,
"number": 519,
"precision": 0.9262759924385633,
"recall": 0.9441233140655106
},
"eval_ACT_L1": {
"f1": 0.9496124031007751,
"number": 503,
"precision": 0.9262759924385633,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9808823529411764,
"number": 678,
"precision": 0.9780058651026393,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.2711864406779661,
"number": 30,
"precision": 0.27586206896551724,
"recall": 0.26666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9541284403669723,
"number": 761,
"precision": 0.9516339869281045,
"recall": 0.9566360052562418
},
"eval_PER": {
"f1": 0.9720176730486009,
"number": 676,
"precision": 0.967741935483871,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9633883704235463,
"number": 694,
"precision": 0.9599427753934192,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.676470588235294,
"number": 33,
"precision": 0.6571428571428571,
"recall": 0.696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9583649708934447,
"eval_accuracy-all": 0.9695646671728676,
"eval_accuracy-das": 0.9716527461402177,
"eval_accuracy-l1": 0.9644393824348266,
"eval_accuracy-l2": 0.9746899519109087,
"eval_f1": 0.9551458847437944,
"eval_f1-all": 0.9510837727006444,
"eval_f1-das": 0.9576050576422462,
"eval_f1-l1": 0.9516129032258065,
"eval_f1-l2": 0.9504021447721179,
"eval_loss": 0.16219548881053925,
"eval_precision": 0.953899681066976,
"eval_precision-all": 0.9488603156049094,
"eval_precision-das": 0.9561826958782027,
"eval_precision-l1": 0.9432697266632285,
"eval_precision-l2": 0.9561699258260283,
"eval_recall": 0.9563953488372093,
"eval_recall-all": 0.9533176746917205,
"eval_recall-das": 0.9590316573556797,
"eval_recall-l1": 0.9601049868766404,
"eval_recall-l2": 0.9447035309793471,
"eval_runtime": 5.458,
"eval_samples_per_second": 123.855,
"eval_steps_per_second": 7.878,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9361296472831266,
"number": 519,
"precision": 0.9264150943396227,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9483933787731256,
"number": 503,
"precision": 0.9293893129770993,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.36363636363636365,
"number": 16,
"precision": 0.6666666666666666,
"recall": 0.25
},
"eval_CARDINAL": {
"f1": 0.9889298892988929,
"number": 678,
"precision": 0.9896602658788775,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.4528301886792453,
"number": 30,
"precision": 0.5217391304347826,
"recall": 0.4
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9514435695538058,
"number": 761,
"precision": 0.9501965923984272,
"recall": 0.9526938239159002
},
"eval_PER": {
"f1": 0.9666913397483345,
"number": 676,
"precision": 0.9674074074074074,
"recall": 0.9659763313609467
},
"eval_SPAT": {
"f1": 0.9519713261648747,
"number": 694,
"precision": 0.9472182596291013,
"recall": 0.9567723342939481
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.6216216216216217,
"number": 33,
"precision": 0.5609756097560976,
"recall": 0.696969696969697
},
"eval_TITREP": {
"f1": 0.2222222222222222,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.16666666666666666
},
"eval_accuracy": 0.9605163249810175,
"eval_accuracy-all": 0.9719691217413313,
"eval_accuracy-das": 0.9713996456593268,
"eval_accuracy-l1": 0.9669703872437357,
"eval_accuracy-l2": 0.9769678562389269,
"eval_f1": 0.9528096413532743,
"eval_f1-all": 0.9499926675465612,
"eval_f1-das": 0.9529827169671065,
"eval_f1-l1": 0.9487983281086729,
"eval_f1-l2": 0.9515212303577398,
"eval_loss": 0.1616193950176239,
"eval_precision": 0.9518421816071947,
"eval_precision-all": 0.9490184588338705,
"eval_precision-das": 0.9510385756676558,
"eval_precision-l1": 0.9443577743109725,
"eval_precision-l2": 0.9550335570469799,
"eval_recall": 0.9537790697674419,
"eval_recall-all": 0.9509688784497945,
"eval_recall-das": 0.9549348230912477,
"eval_recall-l1": 0.9532808398950131,
"eval_recall-l2": 0.9480346435709527,
"eval_runtime": 5.3537,
"eval_samples_per_second": 126.267,
"eval_steps_per_second": 8.032,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9180018850141377,
"number": 519,
"precision": 0.8985239852398524,
"recall": 0.9383429672447013
},
"eval_ACT_L1": {
"f1": 0.942439024390244,
"number": 503,
"precision": 0.9252873563218391,
"recall": 0.9602385685884692
},
"eval_ACT_L2": {
"f1": 0.22222222222222224,
"number": 16,
"precision": 0.2,
"recall": 0.25
},
"eval_CARDINAL": {
"f1": 0.986019131714496,
"number": 678,
"precision": 0.9838472834067548,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.4210526315789474,
"number": 30,
"precision": 0.34782608695652173,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9256844850065189,
"number": 761,
"precision": 0.9184993531694696,
"recall": 0.9329829172141918
},
"eval_PER": {
"f1": 0.9558173784977908,
"number": 676,
"precision": 0.9516129032258065,
"recall": 0.9600591715976331
},
"eval_SPAT": {
"f1": 0.9461593682699211,
"number": 694,
"precision": 0.9427753934191703,
"recall": 0.9495677233429395
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7605633802816901,
"number": 33,
"precision": 0.7105263157894737,
"recall": 0.8181818181818182
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9474816502151354,
"eval_accuracy-all": 0.9607694254619084,
"eval_accuracy-das": 0.967603138445963,
"eval_accuracy-l1": 0.9552012148823082,
"eval_accuracy-l2": 0.9663376360415085,
"eval_f1": 0.9397035544682689,
"eval_f1-all": 0.9369998545031283,
"eval_f1-das": 0.9450305385896723,
"eval_f1-l1": 0.9377270368448366,
"eval_f1-l2": 0.9360715468698245,
"eval_loss": 0.17993101477622986,
"eval_precision": 0.9304645198062126,
"eval_precision-all": 0.9287568503028555,
"eval_precision-das": 0.9392935982339956,
"eval_precision-l1": 0.9271421241662391,
"eval_precision-l2": 0.9308300395256917,
"eval_recall": 0.9491279069767442,
"eval_recall-all": 0.9453904873752202,
"eval_recall-das": 0.9508379888268157,
"eval_recall-l1": 0.9485564304461942,
"eval_recall-l2": 0.9413724183877415,
"eval_runtime": 5.7248,
"eval_samples_per_second": 118.084,
"eval_steps_per_second": 7.511,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9387370405278038,
"number": 519,
"precision": 0.9188191881918819,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9555125725338492,
"number": 503,
"precision": 0.9303201506591338,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.2962962962962963,
"number": 16,
"precision": 0.36363636363636365,
"recall": 0.25
},
"eval_CARDINAL": {
"f1": 0.9845474613686535,
"number": 678,
"precision": 0.9823788546255506,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.3384615384615384,
"number": 30,
"precision": 0.3142857142857143,
"recall": 0.36666666666666664
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9481967213114754,
"number": 761,
"precision": 0.9463350785340314,
"recall": 0.9500657030223391
},
"eval_PER": {
"f1": 0.969786293294031,
"number": 676,
"precision": 0.9662261380323054,
"recall": 0.9733727810650887
},
"eval_SPAT": {
"f1": 0.9511494252873564,
"number": 694,
"precision": 0.9484240687679083,
"recall": 0.9538904899135446
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7936507936507938,
"number": 33,
"precision": 0.8333333333333334,
"recall": 0.7575757575757576
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9600101240192357,
"eval_accuracy-all": 0.9705770690964313,
"eval_accuracy-das": 0.9731713490255631,
"eval_accuracy-l1": 0.9653252341179448,
"eval_accuracy-l2": 0.9758289040749177,
"eval_f1": 0.9563578367406117,
"eval_f1-all": 0.9492912465293001,
"eval_f1-das": 0.959539717891611,
"eval_f1-l1": 0.9480519480519479,
"eval_f1-l2": 0.9508853992649516,
"eval_loss": 0.16017325222492218,
"eval_precision": 0.9540063638993347,
"eval_precision-all": 0.945010183299389,
"eval_precision-das": 0.9563448020717721,
"eval_precision-l1": 0.9383033419023136,
"eval_precision-l2": 0.9537533512064343,
"eval_recall": 0.9587209302325581,
"eval_recall-all": 0.9536112742219612,
"eval_recall-das": 0.962756052141527,
"eval_recall-l1": 0.958005249343832,
"eval_recall-l2": 0.9480346435709527,
"eval_runtime": 5.5031,
"eval_samples_per_second": 122.84,
"eval_steps_per_second": 7.814,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.1449,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9233716475095786,
"number": 519,
"precision": 0.9180952380952381,
"recall": 0.928709055876686
},
"eval_ACT_L1": {
"f1": 0.9397828232971372,
"number": 503,
"precision": 0.9333333333333333,
"recall": 0.9463220675944334
},
"eval_ACT_L2": {
"f1": 0.38709677419354843,
"number": 16,
"precision": 0.4,
"recall": 0.375
},
"eval_CARDINAL": {
"f1": 0.9823788546255506,
"number": 678,
"precision": 0.9780701754385965,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.47058823529411764,
"number": 30,
"precision": 0.42105263157894735,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9440104166666667,
"number": 761,
"precision": 0.9354838709677419,
"recall": 0.9526938239159002
},
"eval_PER": {
"f1": 0.9690265486725664,
"number": 676,
"precision": 0.9661764705882353,
"recall": 0.9718934911242604
},
"eval_SPAT": {
"f1": 0.946236559139785,
"number": 694,
"precision": 0.9415121255349501,
"recall": 0.9510086455331412
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8307692307692308,
"number": 33,
"precision": 0.84375,
"recall": 0.8181818181818182
},
"eval_TITREP": {
"f1": 0.3636363636363636,
"number": 6,
"precision": 0.4,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.957605669450772,
"eval_accuracy-all": 0.9693748418121995,
"eval_accuracy-das": 0.9710199949379904,
"eval_accuracy-l1": 0.9641862819539357,
"eval_accuracy-l2": 0.9745634016704632,
"eval_f1": 0.9503177354130561,
"eval_f1-all": 0.9459538416593631,
"eval_f1-das": 0.953583364277757,
"eval_f1-l1": 0.9436619718309859,
"eval_f1-l2": 0.948871181938911,
"eval_loss": 0.17344143986701965,
"eval_precision": 0.9443168771526981,
"eval_precision-all": 0.9412790697674419,
"eval_precision-das": 0.9507589781562384,
"eval_precision-l1": 0.937791601866252,
"eval_precision-l2": 0.9457313037723362,
"eval_recall": 0.9563953488372093,
"eval_recall-all": 0.9506752789195537,
"eval_recall-das": 0.9564245810055866,
"eval_recall-l1": 0.9496062992125984,
"eval_recall-l2": 0.9520319786808794,
"eval_runtime": 5.2868,
"eval_samples_per_second": 127.865,
"eval_steps_per_second": 8.133,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9411764705882353,
"number": 519,
"precision": 0.9271028037383178,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.966403162055336,
"number": 503,
"precision": 0.9607072691552063,
"recall": 0.9721669980119284
},
"eval_ACT_L2": {
"f1": 0.33333333333333337,
"number": 16,
"precision": 0.2692307692307692,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9852724594992636,
"number": 678,
"precision": 0.9838235294117647,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.4864864864864865,
"number": 30,
"precision": 0.4090909090909091,
"recall": 0.6
},
"eval_FT": {
"f1": 0.18181818181818182,
"number": 7,
"precision": 0.25,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9514435695538058,
"number": 761,
"precision": 0.9501965923984272,
"recall": 0.9526938239159002
},
"eval_PER": {
"f1": 0.9807976366322009,
"number": 676,
"precision": 0.9793510324483776,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9503239740820734,
"number": 694,
"precision": 0.9496402877697842,
"recall": 0.9510086455331412
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.819672131147541,
"number": 33,
"precision": 0.8928571428571429,
"recall": 0.7575757575757576
},
"eval_TITREP": {
"f1": 0.26666666666666666,
"number": 6,
"precision": 0.2222222222222222,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9530498607947355,
"eval_accuracy-all": 0.964819033156163,
"eval_accuracy-das": 0.9724120475828905,
"eval_accuracy-l1": 0.960389774740572,
"eval_accuracy-l2": 0.969248291571754,
"eval_f1": 0.9578566256335989,
"eval_f1-all": 0.952937737503654,
"eval_f1-das": 0.9619029920089203,
"eval_f1-l1": 0.9558861915948839,
"eval_f1-l2": 0.9491863168382597,
"eval_loss": 0.16722118854522705,
"eval_precision": 0.9544011544011544,
"eval_precision-all": 0.9487776484284052,
"eval_precision-das": 0.9599406528189911,
"eval_precision-l1": 0.95067497403946,
"eval_precision-l2": 0.9463576158940398,
"eval_recall": 0.9613372093023256,
"eval_recall-all": 0.9571344685848503,
"eval_recall-das": 0.9638733705772812,
"eval_recall-l1": 0.9611548556430446,
"eval_recall-l2": 0.9520319786808794,
"eval_runtime": 5.3735,
"eval_samples_per_second": 125.803,
"eval_steps_per_second": 8.002,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9268755935422602,
"number": 519,
"precision": 0.9138576779026217,
"recall": 0.9402697495183044
},
"eval_ACT_L1": {
"f1": 0.95069033530572,
"number": 503,
"precision": 0.9432485322896281,
"recall": 0.9582504970178927
},
"eval_ACT_L2": {
"f1": 0.30769230769230765,
"number": 16,
"precision": 0.2608695652173913,
"recall": 0.375
},
"eval_CARDINAL": {
"f1": 0.9867647058823529,
"number": 678,
"precision": 0.9838709677419355,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.43243243243243246,
"number": 30,
"precision": 0.36363636363636365,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.2,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9523809523809524,
"number": 761,
"precision": 0.9455958549222798,
"recall": 0.9592641261498029
},
"eval_PER": {
"f1": 0.9742078113485629,
"number": 676,
"precision": 0.9706314243759178,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9633883704235463,
"number": 694,
"precision": 0.9599427753934192,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8059701492537314,
"number": 33,
"precision": 0.7941176470588235,
"recall": 0.8181818181818182
},
"eval_TITREP": {
"f1": 0.5,
"number": 6,
"precision": 0.5,
"recall": 0.5
},
"eval_accuracy": 0.9558339660845355,
"eval_accuracy-all": 0.9667172867628449,
"eval_accuracy-das": 0.9746899519109087,
"eval_accuracy-l1": 0.9619083776259175,
"eval_accuracy-l2": 0.9715261958997722,
"eval_f1": 0.9552411204158244,
"eval_f1-all": 0.9526308118350095,
"eval_f1-das": 0.9595697329376855,
"eval_f1-l1": 0.9531249999999999,
"eval_f1-l2": 0.9520026481297584,
"eval_loss": 0.15443478524684906,
"eval_precision": 0.948938611589214,
"eval_precision-all": 0.9458755426917511,
"eval_precision-das": 0.9556704839305504,
"eval_precision-l1": 0.9457364341085271,
"eval_precision-l2": 0.9460526315789474,
"eval_recall": 0.9616279069767442,
"eval_recall-all": 0.9594832648267763,
"eval_recall-das": 0.9635009310986965,
"eval_recall-l1": 0.9606299212598425,
"eval_recall-l2": 0.9580279813457695,
"eval_runtime": 5.4706,
"eval_samples_per_second": 123.569,
"eval_steps_per_second": 7.86,
"step": 1200
},
{
"epoch": 3.41,
"eval_ACT": {
"f1": 0.9435406698564592,
"number": 519,
"precision": 0.9372623574144486,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9560975609756097,
"number": 503,
"precision": 0.9386973180076629,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.3,
"number": 16,
"precision": 0.75,
"recall": 0.1875
},
"eval_CARDINAL": {
"f1": 0.9882179675994109,
"number": 678,
"precision": 0.986764705882353,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.48,
"number": 30,
"precision": 0.6,
"recall": 0.4
},
"eval_FT": {
"f1": 0.2,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9551656920077972,
"number": 761,
"precision": 0.9447300771208226,
"recall": 0.9658344283837057
},
"eval_PER": {
"f1": 0.9756457564575647,
"number": 676,
"precision": 0.9734904270986745,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9558404558404557,
"number": 694,
"precision": 0.9450704225352112,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8307692307692308,
"number": 33,
"precision": 0.84375,
"recall": 0.8181818181818182
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9607694254619084,
"eval_accuracy-all": 0.9705770690964313,
"eval_accuracy-das": 0.9731713490255631,
"eval_accuracy-l1": 0.9668438370032904,
"eval_accuracy-l2": 0.9743103011895723,
"eval_f1": 0.9611481588866339,
"eval_f1-all": 0.9570175438596491,
"eval_f1-das": 0.9630866258579114,
"eval_f1-l1": 0.9562043795620437,
"eval_f1-l2": 0.9580559254327563,
"eval_loss": 0.17625676095485687,
"eval_precision": 0.9586466165413534,
"eval_precision-all": 0.9531158998252767,
"eval_precision-das": 0.959349593495935,
"eval_precision-l1": 0.949766960124288,
"eval_precision-l2": 0.957418496340652,
"eval_recall": 0.9636627906976745,
"eval_recall-all": 0.96095126247798,
"eval_recall-das": 0.966852886405959,
"eval_recall-l1": 0.9627296587926509,
"eval_recall-l2": 0.9586942038640907,
"eval_runtime": 5.5364,
"eval_samples_per_second": 122.101,
"eval_steps_per_second": 7.767,
"step": 1300
},
{
"epoch": 3.67,
"eval_ACT": {
"f1": 0.9299242424242424,
"number": 519,
"precision": 0.9143389199255121,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9517241379310345,
"number": 503,
"precision": 0.943359375,
"recall": 0.9602385685884692
},
"eval_ACT_L2": {
"f1": 0.39024390243902435,
"number": 16,
"precision": 0.32,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9830757910228108,
"number": 678,
"precision": 0.9809104258443465,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.49315068493150693,
"number": 30,
"precision": 0.4186046511627907,
"recall": 0.6
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9440832249674903,
"number": 761,
"precision": 0.9343629343629344,
"recall": 0.9540078843626807
},
"eval_PER": {
"f1": 0.9756457564575647,
"number": 676,
"precision": 0.9734904270986745,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9613180515759313,
"number": 694,
"precision": 0.9558404558404558,
"recall": 0.9668587896253602
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8484848484848486,
"number": 33,
"precision": 0.8484848484848485,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.5
},
"eval_accuracy": 0.9524171095925082,
"eval_accuracy-all": 0.9641862819539357,
"eval_accuracy-das": 0.9696279422930904,
"eval_accuracy-l1": 0.9610225259427992,
"eval_accuracy-l2": 0.9673500379650721,
"eval_f1": 0.9534112216933507,
"eval_f1-all": 0.9512301645072062,
"eval_f1-das": 0.9583101723179546,
"eval_f1-l1": 0.9544389481905754,
"eval_f1-l2": 0.9471598414795244,
"eval_loss": 0.17374566197395325,
"eval_precision": 0.9461780704265674,
"eval_precision-all": 0.9434016748483973,
"eval_precision-das": 0.9535398230088495,
"eval_precision-l1": 0.9467975206611571,
"eval_precision-l2": 0.9390962671905697,
"eval_recall": 0.9607558139534884,
"eval_recall-all": 0.9591896652965355,
"eval_recall-das": 0.9631284916201117,
"eval_recall-l1": 0.9622047244094488,
"eval_recall-l2": 0.955363091272485,
"eval_runtime": 5.5496,
"eval_samples_per_second": 121.811,
"eval_steps_per_second": 7.748,
"step": 1400
},
{
"epoch": 3.94,
"learning_rate": 7e-05,
"loss": 0.0874,
"step": 1500
},
{
"epoch": 3.94,
"eval_ACT": {
"f1": 0.9458689458689458,
"number": 519,
"precision": 0.9325842696629213,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9647749510763209,
"number": 503,
"precision": 0.9499036608863198,
"recall": 0.9801192842942346
},
"eval_ACT_L2": {
"f1": 0.3225806451612903,
"number": 16,
"precision": 0.3333333333333333,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9823788546255506,
"number": 678,
"precision": 0.9780701754385965,
"recall": 0.9867256637168141
},
"eval_DESC": {
"f1": 0.3225806451612903,
"number": 30,
"precision": 0.3125,
"recall": 0.3333333333333333
},
"eval_FT": {
"f1": 0.25,
"number": 7,
"precision": 0.2222222222222222,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.954367666232073,
"number": 761,
"precision": 0.9469598965071151,
"recall": 0.961892247043364
},
"eval_PER": {
"f1": 0.9764011799410028,
"number": 676,
"precision": 0.9735294117647059,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9601706970128022,
"number": 694,
"precision": 0.9480337078651685,
"recall": 0.9726224783861671
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8358208955223881,
"number": 33,
"precision": 0.8235294117647058,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.28571428571428575,
"number": 6,
"precision": 0.25,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9526702100733991,
"eval_accuracy-all": 0.9644393824348266,
"eval_accuracy-das": 0.9700075930144267,
"eval_accuracy-l1": 0.9602632245001266,
"eval_accuracy-l2": 0.9686155403695267,
"eval_f1": 0.9585320040456581,
"eval_f1-all": 0.9540162980209547,
"eval_f1-das": 0.9615384615384616,
"eval_f1-l1": 0.9563409563409563,
"eval_f1-l2": 0.9510582010582012,
"eval_loss": 0.1944604068994522,
"eval_precision": 0.9528871014076414,
"eval_precision-all": 0.9457587997691864,
"eval_precision-das": 0.9548292324641939,
"eval_precision-l1": 0.9469891919711786,
"eval_precision-l2": 0.9441891004596191,
"eval_recall": 0.9642441860465116,
"eval_recall-all": 0.9624192601291838,
"eval_recall-das": 0.9683426443202979,
"eval_recall-l1": 0.9658792650918635,
"eval_recall-l2": 0.9580279813457695,
"eval_runtime": 5.5418,
"eval_samples_per_second": 121.983,
"eval_steps_per_second": 7.759,
"step": 1500
},
{
"epoch": 4.2,
"eval_ACT": {
"f1": 0.9579349904397705,
"number": 519,
"precision": 0.9506641366223909,
"recall": 0.9653179190751445
},
"eval_ACT_L1": {
"f1": 0.973293768545994,
"number": 503,
"precision": 0.968503937007874,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.5142857142857142,
"number": 16,
"precision": 0.47368421052631576,
"recall": 0.5625
},
"eval_CARDINAL": {
"f1": 0.9801031687546058,
"number": 678,
"precision": 0.979381443298969,
"recall": 0.9808259587020649
},
"eval_DESC": {
"f1": 0.5901639344262295,
"number": 30,
"precision": 0.5806451612903226,
"recall": 0.6
},
"eval_FT": {
"f1": 0.30769230769230765,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9542483660130721,
"number": 761,
"precision": 0.9492847854356307,
"recall": 0.9592641261498029
},
"eval_PER": {
"f1": 0.9793510324483775,
"number": 676,
"precision": 0.9764705882352941,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9649749821300929,
"number": 694,
"precision": 0.9574468085106383,
"recall": 0.9726224783861671
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8064516129032258,
"number": 33,
"precision": 0.8620689655172413,
"recall": 0.7575757575757576
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9616552771450265,
"eval_accuracy-all": 0.9713996456593268,
"eval_accuracy-das": 0.9751961528726905,
"eval_accuracy-l1": 0.9691217413313086,
"eval_accuracy-l2": 0.973677549987345,
"eval_f1": 0.9617391304347827,
"eval_f1-all": 0.9599298040362678,
"eval_f1-das": 0.9646971386101821,
"eval_f1-l1": 0.9657874118568817,
"eval_f1-l2": 0.9524759056164839,
"eval_loss": 0.18698786199092865,
"eval_precision": 0.9589595375722544,
"eval_precision-all": 0.9562937062937062,
"eval_precision-das": 0.9625509825732295,
"eval_precision-l1": 0.9610187110187111,
"eval_precision-l2": 0.9502652519893899,
"eval_recall": 0.9645348837209302,
"eval_recall-all": 0.9635936582501468,
"eval_recall-das": 0.966852886405959,
"eval_recall-l1": 0.9706036745406824,
"eval_recall-l2": 0.9546968687541639,
"eval_runtime": 5.912,
"eval_samples_per_second": 114.344,
"eval_steps_per_second": 7.273,
"step": 1600
},
{
"epoch": 4.46,
"eval_ACT": {
"f1": 0.9420702754036088,
"number": 519,
"precision": 0.9288389513108615,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.9663366336633663,
"number": 503,
"precision": 0.9625246548323472,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.37209302325581395,
"number": 16,
"precision": 0.2962962962962963,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9823269513991163,
"number": 678,
"precision": 0.9808823529411764,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.4927536231884058,
"number": 30,
"precision": 0.4358974358974359,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9489528795811519,
"number": 761,
"precision": 0.9452411994784876,
"recall": 0.9526938239159002
},
"eval_PER": {
"f1": 0.9778434268833086,
"number": 676,
"precision": 0.976401179941003,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9577060931899642,
"number": 694,
"precision": 0.9529243937232525,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8405797101449276,
"number": 33,
"precision": 0.8055555555555556,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.3333333333333333,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9578587699316629,
"eval_accuracy-all": 0.9679827891672994,
"eval_accuracy-das": 0.9738041002277904,
"eval_accuracy-l1": 0.9646924829157175,
"eval_accuracy-l2": 0.9712730954188813,
"eval_f1": 0.9567731675581899,
"eval_f1-all": 0.9541605839416059,
"eval_f1-das": 0.962109955423477,
"eval_f1-l1": 0.9582245430809399,
"eval_f1-l2": 0.9490066225165563,
"eval_loss": 0.1859915405511856,
"eval_precision": 0.9516824849007766,
"eval_precision-all": 0.9488966318234611,
"eval_precision-das": 0.9596146721007781,
"eval_precision-l1": 0.9532467532467532,
"eval_precision-l2": 0.9433838051349572,
"eval_recall": 0.9619186046511627,
"eval_recall-all": 0.9594832648267763,
"eval_recall-das": 0.9646182495344506,
"eval_recall-l1": 0.963254593175853,
"eval_recall-l2": 0.9546968687541639,
"eval_runtime": 5.5062,
"eval_samples_per_second": 122.771,
"eval_steps_per_second": 7.809,
"step": 1700
},
{
"epoch": 4.72,
"eval_ACT": {
"f1": 0.9666348903717827,
"number": 519,
"precision": 0.9566037735849057,
"recall": 0.976878612716763
},
"eval_ACT_L1": {
"f1": 0.9764705882352941,
"number": 503,
"precision": 0.9632495164410058,
"recall": 0.9900596421471173
},
"eval_ACT_L2": {
"f1": 0.6206896551724138,
"number": 16,
"precision": 0.6923076923076923,
"recall": 0.5625
},
"eval_CARDINAL": {
"f1": 0.9852941176470589,
"number": 678,
"precision": 0.9824046920821115,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.5666666666666667,
"number": 30,
"precision": 0.5666666666666667,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.2,
"number": 7,
"precision": 0.3333333333333333,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9542483660130721,
"number": 761,
"precision": 0.9492847854356307,
"recall": 0.9592641261498029
},
"eval_PER": {
"f1": 0.9793205317577548,
"number": 676,
"precision": 0.9778761061946902,
"recall": 0.9807692307692307
},
"eval_SPAT": {
"f1": 0.9547738693467337,
"number": 694,
"precision": 0.9513590844062947,
"recall": 0.9582132564841499
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8823529411764706,
"number": 33,
"precision": 0.8571428571428571,
"recall": 0.9090909090909091
},
"eval_TITREP": {
"f1": 0.4615384615384615,
"number": 6,
"precision": 0.42857142857142855,
"recall": 0.5
},
"eval_accuracy": 0.9643128321943811,
"eval_accuracy-all": 0.974120475828904,
"eval_accuracy-das": 0.9757023538344722,
"eval_accuracy-l1": 0.9711465451784358,
"eval_accuracy-l2": 0.9770944064793723,
"eval_f1": 0.9649580075296842,
"eval_f1-all": 0.9609592045620704,
"eval_f1-das": 0.968651456130588,
"eval_f1-l1": 0.9626534343170541,
"eval_f1-l2": 0.9588039867109635,
"eval_loss": 0.16283993422985077,
"eval_precision": 0.96133871898442,
"eval_precision-all": 0.9571803087678415,
"eval_precision-das": 0.9648928307464892,
"eval_precision-l1": 0.9579002079002079,
"eval_precision-l2": 0.9562624254473161,
"eval_recall": 0.9686046511627907,
"eval_recall-all": 0.9647680563711099,
"eval_recall-das": 0.97243947858473,
"eval_recall-l1": 0.9674540682414698,
"eval_recall-l2": 0.9613590939373751,
"eval_runtime": 5.4991,
"eval_samples_per_second": 122.928,
"eval_steps_per_second": 7.819,
"step": 1800
},
{
"epoch": 4.99,
"eval_ACT": {
"f1": 0.941398865784499,
"number": 519,
"precision": 0.9239332096474954,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9655172413793103,
"number": 503,
"precision": 0.95703125,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.37209302325581395,
"number": 16,
"precision": 0.2962962962962963,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9852507374631269,
"number": 678,
"precision": 0.9852507374631269,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.49315068493150693,
"number": 30,
"precision": 0.4186046511627907,
"recall": 0.6
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9614126880313931,
"number": 761,
"precision": 0.95703125,
"recall": 0.9658344283837057
},
"eval_PER": {
"f1": 0.9815225424981524,
"number": 676,
"precision": 0.9807976366322009,
"recall": 0.9822485207100592
},
"eval_SPAT": {
"f1": 0.9555236728837877,
"number": 694,
"precision": 0.9514285714285714,
"recall": 0.9596541786743515
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.923076923076923,
"number": 33,
"precision": 0.9375,
"recall": 0.9090909090909091
},
"eval_TITREP": {
"f1": 0.28571428571428575,
"number": 6,
"precision": 0.25,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.960389774740572,
"eval_accuracy-all": 0.9701341432548722,
"eval_accuracy-das": 0.9759554543153632,
"eval_accuracy-l1": 0.9659579853201721,
"eval_accuracy-l2": 0.9743103011895723,
"eval_f1": 0.9632523148148149,
"eval_f1-all": 0.9577012835472578,
"eval_f1-das": 0.9673226884515411,
"eval_f1-l1": 0.9580401355225436,
"eval_f1-l2": 0.9572706194104007,
"eval_loss": 0.16160346567630768,
"eval_precision": 0.9588133640552995,
"eval_precision-all": 0.9515942028985507,
"eval_precision-das": 0.9644576082932247,
"eval_precision-l1": 0.9513457556935818,
"eval_precision-l2": 0.9519104084321476,
"eval_recall": 0.9677325581395348,
"eval_recall-all": 0.9638872577803875,
"eval_recall-das": 0.9702048417132216,
"eval_recall-l1": 0.9648293963254593,
"eval_recall-l2": 0.9626915389740173,
"eval_runtime": 5.4066,
"eval_samples_per_second": 125.032,
"eval_steps_per_second": 7.953,
"step": 1900
},
{
"epoch": 5.25,
"learning_rate": 6e-05,
"loss": 0.0496,
"step": 2000
},
{
"epoch": 5.25,
"eval_ACT": {
"f1": 0.9627507163323782,
"number": 519,
"precision": 0.9545454545454546,
"recall": 0.9710982658959537
},
"eval_ACT_L1": {
"f1": 0.9735034347399412,
"number": 503,
"precision": 0.9612403100775194,
"recall": 0.9860834990059643
},
"eval_ACT_L2": {
"f1": 0.5714285714285715,
"number": 16,
"precision": 0.6666666666666666,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9852507374631269,
"number": 678,
"precision": 0.9852507374631269,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.5901639344262295,
"number": 30,
"precision": 0.5806451612903226,
"recall": 0.6
},
"eval_FT": {
"f1": 0.4615384615384615,
"number": 7,
"precision": 0.5,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9574328749181402,
"number": 761,
"precision": 0.9543080939947781,
"recall": 0.9605781865965834
},
"eval_PER": {
"f1": 0.9785344189489268,
"number": 676,
"precision": 0.9792592592592593,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9619526202440775,
"number": 694,
"precision": 0.9585121602288984,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9206349206349207,
"number": 33,
"precision": 0.9666666666666667,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.4615384615384615,
"number": 6,
"precision": 0.42857142857142855,
"recall": 0.5
},
"eval_accuracy": 0.9693748418121995,
"eval_accuracy-all": 0.9779169830422678,
"eval_accuracy-das": 0.9788661098456087,
"eval_accuracy-l1": 0.9744368514300177,
"eval_accuracy-l2": 0.9813971146545178,
"eval_f1": 0.9663670629167874,
"eval_f1-all": 0.9630823322590096,
"eval_f1-das": 0.9693137437232657,
"eval_f1-l1": 0.964453737584945,
"eval_f1-l2": 0.9613333333333334,
"eval_loss": 0.1529596447944641,
"eval_precision": 0.9638519375361481,
"eval_precision-all": 0.9611111111111111,
"eval_precision-das": 0.9680534918276374,
"eval_precision-l1": 0.9604372722540343,
"eval_precision-l2": 0.961974649766511,
"eval_recall": 0.9688953488372093,
"eval_recall-all": 0.9650616559013505,
"eval_recall-das": 0.9705772811918063,
"eval_recall-l1": 0.968503937007874,
"eval_recall-l2": 0.960692871419054,
"eval_runtime": 5.5475,
"eval_samples_per_second": 121.856,
"eval_steps_per_second": 7.751,
"step": 2000
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 813927239246016.0,
"trial_name": null,
"trial_params": null
}