m2_joint_label_ref_cmbert_iob2 / trainer_state.json
nlpso's picture
Load model and tokenizer
e552d5a
{
"best_metric": 0.9712999437253799,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_2/tmp/212-camembert-ner-joint-labelling-iob2/checkpoint-1300",
"epoch": 3.4120734908136483,
"global_step": 1300,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.8496849684968496,
"number": 519,
"precision": 0.7972972972972973,
"recall": 0.9094412331406551
},
"eval_ACT_L1": {
"f1": 0.8621004566210045,
"number": 503,
"precision": 0.7972972972972973,
"recall": 0.9383697813121272
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9751461988304094,
"number": 678,
"precision": 0.9666666666666667,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9186351706036745,
"number": 762,
"precision": 0.9186351706036745,
"recall": 0.9186351706036745
},
"eval_PER": {
"f1": 0.9389256806475349,
"number": 676,
"precision": 0.9341142020497804,
"recall": 0.9437869822485208
},
"eval_SPAT": {
"f1": 0.8896746817538898,
"number": 694,
"precision": 0.8736111111111111,
"recall": 0.9063400576368876
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9276315789473685,
"eval_accuracy-all": 0.9507199602780536,
"eval_accuracy-das": 0.9462512413108243,
"eval_accuracy-l1": 0.9363207547169812,
"eval_accuracy-l1l2": 0.9285004965243296,
"eval_accuracy-l2": 0.9651191658391262,
"eval_f1": 0.9257838935258289,
"eval_f1-all": 0.9063320688648964,
"eval_f1-das": 0.9201930215293245,
"eval_f1-l1": 0.8917948717948718,
"eval_f1-l1l2": 0.9167508296061174,
"eval_f1-l2": 0.92552471225457,
"eval_loss": 0.5488097667694092,
"eval_precision": 0.926201760324983,
"eval_precision-all": 0.9010733971569481,
"eval_precision-das": 0.9167899408284024,
"eval_precision-l1": 0.8716791979949875,
"eval_precision-l1l2": 0.913981588032221,
"eval_precision-l2": 0.9414600550964187,
"eval_recall": 0.9253664036076663,
"eval_recall-all": 0.9116524801878485,
"eval_recall-das": 0.9236214605067065,
"eval_recall-l1": 0.9128608923884515,
"eval_recall-l1l2": 0.9195369030390738,
"eval_recall-l2": 0.9101198402130493,
"eval_runtime": 7.7665,
"eval_samples_per_second": 87.04,
"eval_steps_per_second": 5.537,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.8874538745387454,
"number": 519,
"precision": 0.8513274336283185,
"recall": 0.9267822736030829
},
"eval_ACT_L1": {
"f1": 0.9007490636704119,
"number": 503,
"precision": 0.8513274336283185,
"recall": 0.9562624254473161
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9780058651026392,
"number": 678,
"precision": 0.9723032069970845,
"recall": 0.9837758112094396
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9423076923076922,
"number": 762,
"precision": 0.9210526315789473,
"recall": 0.9645669291338582
},
"eval_PER": {
"f1": 0.9515418502202644,
"number": 676,
"precision": 0.9446064139941691,
"recall": 0.9585798816568047
},
"eval_SPAT": {
"f1": 0.9454287739192062,
"number": 694,
"precision": 0.9302649930264993,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.939051638530288,
"eval_accuracy-all": 0.9588505461767627,
"eval_accuracy-das": 0.9565541211519365,
"eval_accuracy-l1": 0.9492303872889771,
"eval_accuracy-l1l2": 0.9397964250248262,
"eval_accuracy-l2": 0.9684707050645481,
"eval_f1": 0.9397725993470674,
"eval_f1-all": 0.9324974486076687,
"eval_f1-das": 0.9345932925699463,
"eval_f1-l1": 0.9274464239607539,
"eval_f1-l1l2": 0.9324499495895148,
"eval_f1-l2": 0.9390488948425987,
"eval_loss": 0.33518391847610474,
"eval_precision": 0.9383992805755396,
"eval_precision-all": 0.9264194669756662,
"eval_precision-das": 0.9295982307408772,
"eval_precision-l1": 0.9126016260162602,
"eval_precision-l1l2": 0.9280389908256881,
"eval_precision-l2": 0.944743935309973,
"eval_recall": 0.9411499436302142,
"eval_recall-all": 0.938655708834752,
"eval_recall-das": 0.9396423248882265,
"eval_recall-l1": 0.9427821522309712,
"eval_recall-l1l2": 0.9369030390738061,
"eval_recall-l2": 0.933422103861518,
"eval_runtime": 8.3825,
"eval_samples_per_second": 80.645,
"eval_steps_per_second": 5.13,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9334600760456274,
"number": 519,
"precision": 0.9212007504690432,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9478764478764479,
"number": 503,
"precision": 0.9212007504690432,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9919058130978661,
"number": 678,
"precision": 0.9897209985315712,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.20689655172413796,
"number": 30,
"precision": 0.21428571428571427,
"recall": 0.2
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.945736434108527,
"number": 762,
"precision": 0.9312977099236641,
"recall": 0.9606299212598425
},
"eval_PER": {
"f1": 0.9684519442406457,
"number": 676,
"precision": 0.9606986899563319,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9579472558802565,
"number": 694,
"precision": 0.9478138222849083,
"recall": 0.968299711815562
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.4186046511627907,
"number": 33,
"precision": 0.33962264150943394,
"recall": 0.5454545454545454
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9463753723932473,
"eval_accuracy-all": 0.9628848063555114,
"eval_accuracy-das": 0.9671052631578947,
"eval_accuracy-l1": 0.9544438927507448,
"eval_accuracy-l1l2": 0.9468718967229395,
"eval_accuracy-l2": 0.9713257199602781,
"eval_f1": 0.9517800811176207,
"eval_f1-all": 0.9450900639163278,
"eval_f1-das": 0.961645358532518,
"eval_f1-l1": 0.9471776281719316,
"eval_f1-l1l2": 0.9484092863284609,
"eval_f1-l2": 0.942422236929186,
"eval_loss": 0.24298420548439026,
"eval_precision": 0.9511371312767395,
"eval_precision-all": 0.9355766465343687,
"eval_precision-das": 0.9565057132325838,
"eval_precision-l1": 0.9345937659683189,
"eval_precision-l1l2": 0.9392563156400795,
"eval_precision-l2": 0.9368421052631579,
"eval_recall": 0.952423900789177,
"eval_recall-all": 0.9547989433519225,
"eval_recall-das": 0.9668405365126677,
"eval_recall-l1": 0.9601049868766404,
"eval_recall-l1l2": 0.9577424023154848,
"eval_recall-l2": 0.948069241011984,
"eval_runtime": 8.4801,
"eval_samples_per_second": 79.716,
"eval_steps_per_second": 5.071,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9203373945641987,
"number": 519,
"precision": 0.8959854014598541,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9343482397716462,
"number": 503,
"precision": 0.8959854014598541,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9911764705882352,
"number": 678,
"precision": 0.9882697947214076,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9491307147456535,
"number": 762,
"precision": 0.93173198482933,
"recall": 0.9671916010498688
},
"eval_PER": {
"f1": 0.9611151870873074,
"number": 676,
"precision": 0.9534206695778749,
"recall": 0.9689349112426036
},
"eval_SPAT": {
"f1": 0.9446808510638297,
"number": 694,
"precision": 0.9301675977653632,
"recall": 0.9596541786743515
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.4235294117647059,
"number": 33,
"precision": 0.34615384615384615,
"recall": 0.5454545454545454
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9483614697120158,
"eval_accuracy-all": 0.9652432969215492,
"eval_accuracy-das": 0.9685948361469712,
"eval_accuracy-l1": 0.9546921549155909,
"eval_accuracy-l1l2": 0.948982125124131,
"eval_accuracy-l2": 0.9757944389275075,
"eval_f1": 0.9511620074099024,
"eval_f1-all": 0.9386041123660586,
"eval_f1-das": 0.9583333333333334,
"eval_f1-l1": 0.934261407579273,
"eval_f1-l1l2": 0.9454285714285714,
"eval_f1-l2": 0.9441691443673604,
"eval_loss": 0.21430818736553192,
"eval_precision": 0.947227191413238,
"eval_precision-all": 0.9262646470420121,
"eval_precision-das": 0.9485401459854015,
"eval_precision-l1": 0.9179331306990881,
"eval_precision-l1l2": 0.9334273624823696,
"eval_precision-l2": 0.9370491803278689,
"eval_recall": 0.9551296505073281,
"eval_recall-all": 0.9512767830936307,
"eval_recall-das": 0.9683308494783904,
"eval_recall-l1": 0.9511811023622048,
"eval_recall-l1l2": 0.9577424023154848,
"eval_recall-l2": 0.9513981358189081,
"eval_runtime": 7.6902,
"eval_samples_per_second": 87.904,
"eval_steps_per_second": 5.592,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.5127,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9113680154142582,
"number": 519,
"precision": 0.9113680154142582,
"recall": 0.9113680154142582
},
"eval_ACT_L1": {
"f1": 0.9256360078277887,
"number": 503,
"precision": 0.9113680154142582,
"recall": 0.9403578528827038
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9903917220990391,
"number": 678,
"precision": 0.9925925925925926,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.17391304347826086,
"number": 30,
"precision": 0.12903225806451613,
"recall": 0.26666666666666666
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9475728155339805,
"number": 762,
"precision": 0.9348659003831418,
"recall": 0.9606299212598425
},
"eval_PER": {
"f1": 0.9661764705882354,
"number": 676,
"precision": 0.9605263157894737,
"recall": 0.9718934911242604
},
"eval_SPAT": {
"f1": 0.9448818897637796,
"number": 694,
"precision": 0.9388335704125178,
"recall": 0.9510086455331412
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.6000000000000001,
"number": 33,
"precision": 0.5675675675675675,
"recall": 0.6363636363636364
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9419066534260179,
"eval_accuracy-all": 0.9626365441906654,
"eval_accuracy-das": 0.9543197616683218,
"eval_accuracy-l1": 0.9530784508440914,
"eval_accuracy-l1l2": 0.94240317775571,
"eval_accuracy-l2": 0.9721946375372393,
"eval_f1": 0.9503098591549296,
"eval_f1-all": 0.9377001455604075,
"eval_f1-das": 0.9520980319346454,
"eval_f1-l1": 0.9284792150787502,
"eval_f1-l1l2": 0.9436559139784947,
"eval_f1-l2": 0.9496162829496162,
"eval_loss": 0.2053818553686142,
"eval_precision": 0.9497747747747748,
"eval_precision-all": 0.9301183944556742,
"eval_precision-das": 0.9489267209474463,
"eval_precision-l1": 0.9136178861788617,
"eval_precision-l1l2": 0.9349431818181818,
"eval_precision-l2": 0.9518394648829431,
"eval_recall": 0.9508455467869222,
"eval_recall-all": 0.9454065159964778,
"eval_recall-das": 0.9552906110283159,
"eval_recall-l1": 0.9438320209973753,
"eval_recall-l1l2": 0.9525325615050652,
"eval_recall-l2": 0.9474034620505992,
"eval_runtime": 7.6109,
"eval_samples_per_second": 88.82,
"eval_steps_per_second": 5.65,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9271028037383178,
"number": 519,
"precision": 0.9001814882032668,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.9411764705882354,
"number": 503,
"precision": 0.9001814882032668,
"recall": 0.9860834990059643
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9926362297496317,
"number": 678,
"precision": 0.9911764705882353,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9522580645161292,
"number": 762,
"precision": 0.9365482233502538,
"recall": 0.968503937007874
},
"eval_PER": {
"f1": 0.9815770081061165,
"number": 676,
"precision": 0.9779735682819384,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9544159544159543,
"number": 694,
"precision": 0.9436619718309859,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8611111111111112,
"number": 33,
"precision": 0.7948717948717948,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9571747765640516,
"eval_accuracy-all": 0.9683465739821251,
"eval_accuracy-das": 0.9715739821251241,
"eval_accuracy-l1": 0.9617676266137041,
"eval_accuracy-l1l2": 0.9575471698113207,
"eval_accuracy-l2": 0.9749255213505462,
"eval_f1": 0.9623233908948194,
"eval_f1-all": 0.9512053441765902,
"eval_f1-das": 0.9656446250461765,
"eval_f1-l1": 0.9450606138767088,
"eval_f1-l1l2": 0.9576696800114795,
"eval_f1-l2": 0.959122632103689,
"eval_loss": 0.1763894408941269,
"eval_precision": 0.9571715369172429,
"eval_precision-all": 0.9413624604771486,
"eval_precision-das": 0.9575091575091575,
"eval_precision-l1": 0.9290060851926978,
"eval_precision-l1l2": 0.9496300512236767,
"eval_precision-l2": 0.9575315195753152,
"eval_recall": 0.9675310033821871,
"eval_recall-all": 0.9612562371587907,
"eval_recall-das": 0.973919523099851,
"eval_recall-l1": 0.9616797900262467,
"eval_recall-l1l2": 0.9658465991316932,
"eval_recall-l2": 0.9607190412782957,
"eval_runtime": 7.2583,
"eval_samples_per_second": 93.135,
"eval_steps_per_second": 5.924,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9270142180094787,
"number": 519,
"precision": 0.9123134328358209,
"recall": 0.9421965317919075
},
"eval_ACT_L1": {
"f1": 0.9549902152641877,
"number": 503,
"precision": 0.9402697495183044,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.06060606060606061,
"number": 16,
"precision": 0.058823529411764705,
"recall": 0.0625
},
"eval_CARDINAL": {
"f1": 0.9926253687315634,
"number": 678,
"precision": 0.9926253687315634,
"recall": 0.9926253687315634
},
"eval_DESC": {
"f1": 0.2696629213483146,
"number": 30,
"precision": 0.2033898305084746,
"recall": 0.4
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.958169934640523,
"number": 762,
"precision": 0.9544270833333334,
"recall": 0.9619422572178478
},
"eval_PER": {
"f1": 0.9770879526977089,
"number": 676,
"precision": 0.9763663220088626,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.948957584471603,
"number": 694,
"precision": 0.9469153515064562,
"recall": 0.9510086455331412
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.955223880597015,
"number": 33,
"precision": 0.9411764705882353,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9451340615690169,
"eval_accuracy-all": 0.9622641509433962,
"eval_accuracy-das": 0.9667328699106256,
"eval_accuracy-l1": 0.9527060575968223,
"eval_accuracy-l1l2": 0.9458788480635552,
"eval_accuracy-l2": 0.9718222442899702,
"eval_f1": 0.9608019824284748,
"eval_f1-all": 0.9509918319719953,
"eval_f1-das": 0.9679702048417131,
"eval_f1-l1": 0.9442571947109151,
"eval_f1-l1l2": 0.958033917792469,
"eval_f1-l2": 0.9596532177392464,
"eval_loss": 0.19187191128730774,
"eval_precision": 0.9599369795183434,
"eval_precision-all": 0.9452015076833865,
"eval_precision-das": 0.9676098287416233,
"eval_precision-l1": 0.9328893442622951,
"eval_precision-l1l2": 0.9514701684270626,
"eval_precision-l2": 0.9612558450233801,
"eval_recall": 0.9616685456595265,
"eval_recall-all": 0.956853536835926,
"eval_recall-das": 0.9683308494783904,
"eval_recall-l1": 0.9559055118110236,
"eval_recall-l1l2": 0.9646888567293778,
"eval_recall-l2": 0.9580559254327563,
"eval_runtime": 8.1693,
"eval_samples_per_second": 82.748,
"eval_steps_per_second": 5.264,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9318181818181819,
"number": 519,
"precision": 0.9162011173184358,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9618021547502448,
"number": 503,
"precision": 0.9478764478764479,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.05714285714285714,
"number": 16,
"precision": 0.05263157894736842,
"recall": 0.0625
},
"eval_CARDINAL": {
"f1": 0.9926144756277695,
"number": 678,
"precision": 0.9940828402366864,
"recall": 0.9911504424778761
},
"eval_DESC": {
"f1": 0.3055555555555555,
"number": 30,
"precision": 0.2619047619047619,
"recall": 0.36666666666666664
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9559585492227979,
"number": 762,
"precision": 0.9437340153452686,
"recall": 0.968503937007874
},
"eval_PER": {
"f1": 0.9801616458486407,
"number": 676,
"precision": 0.9737226277372263,
"recall": 0.9866863905325444
},
"eval_SPAT": {
"f1": 0.9519713261648747,
"number": 694,
"precision": 0.9472182596291013,
"recall": 0.9567723342939481
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8611111111111112,
"number": 33,
"precision": 0.7948717948717948,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.5,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9492303872889771,
"eval_accuracy-all": 0.9608366434955313,
"eval_accuracy-das": 0.9750496524329693,
"eval_accuracy-l1": 0.95506454816286,
"eval_accuracy-l1l2": 0.9502234359483615,
"eval_accuracy-l2": 0.9666087388282025,
"eval_f1": 0.9611497866606782,
"eval_f1-all": 0.9535864978902954,
"eval_f1-das": 0.9695845697329377,
"eval_f1-l1": 0.951960529732537,
"eval_f1-l1l2": 0.9604017216642754,
"eval_f1-l2": 0.9556585043017869,
"eval_loss": 0.17047062516212463,
"eval_precision": 0.9572802505032432,
"eval_precision-all": 0.9454702827466821,
"eval_precision-das": 0.965288035450517,
"eval_precision-l1": 0.9419321685508736,
"eval_precision-l1l2": 0.9522048364153627,
"eval_precision-l2": 0.95,
"eval_recall": 0.9650507328072153,
"eval_recall-all": 0.961843263868506,
"eval_recall-das": 0.973919523099851,
"eval_recall-l1": 0.9622047244094488,
"eval_recall-l1l2": 0.9687409551374819,
"eval_recall-l2": 0.9613848202396804,
"eval_runtime": 7.4469,
"eval_samples_per_second": 90.776,
"eval_steps_per_second": 5.774,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9367327667610954,
"number": 519,
"precision": 0.9185185185185185,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.9545893719806763,
"number": 503,
"precision": 0.9285714285714286,
"recall": 0.9821073558648111
},
"eval_ACT_L2": {
"f1": 0.16666666666666666,
"number": 16,
"precision": 0.25,
"recall": 0.125
},
"eval_CARDINAL": {
"f1": 0.9926362297496317,
"number": 678,
"precision": 0.9911764705882353,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.29032258064516125,
"number": 30,
"precision": 0.28125,
"recall": 0.3
},
"eval_FT": {
"f1": 0.25,
"number": 7,
"precision": 1.0,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9635416666666666,
"number": 762,
"precision": 0.9560723514211886,
"recall": 0.9711286089238845
},
"eval_PER": {
"f1": 0.9772226304188096,
"number": 676,
"precision": 0.9708029197080292,
"recall": 0.9837278106508875
},
"eval_SPAT": {
"f1": 0.9669540229885057,
"number": 694,
"precision": 0.9641833810888252,
"recall": 0.9697406340057637
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9014084507042254,
"number": 33,
"precision": 0.8421052631578947,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.16666666666666666,
"number": 6,
"precision": 0.16666666666666666,
"recall": 0.16666666666666666
},
"eval_accuracy": 0.9597815292949354,
"eval_accuracy-all": 0.9707050645481629,
"eval_accuracy-das": 0.9769116186693148,
"eval_accuracy-l1": 0.9648709036742801,
"eval_accuracy-l1l2": 0.9607745779543198,
"eval_accuracy-l2": 0.9765392254220456,
"eval_f1": 0.9659359190556492,
"eval_f1-all": 0.9593353738522081,
"eval_f1-das": 0.9703593923675434,
"eval_f1-l1": 0.9558670820353063,
"eval_f1-l1l2": 0.9641984184040259,
"eval_f1-l2": 0.9637753406447326,
"eval_loss": 0.17056229710578918,
"eval_precision": 0.9632286995515695,
"eval_precision-all": 0.9528083381586566,
"eval_precision-das": 0.9649963154016212,
"eval_precision-l1": 0.9455572675911659,
"eval_precision-l1l2": 0.958,
"eval_precision-l2": 0.962176509621765,
"eval_recall": 0.9686583990980834,
"eval_recall-all": 0.965952450836513,
"eval_recall-das": 0.9757824143070045,
"eval_recall-l1": 0.9664041994750656,
"eval_recall-l1l2": 0.9704775687409551,
"eval_recall-l2": 0.9653794940079894,
"eval_runtime": 7.8582,
"eval_samples_per_second": 86.025,
"eval_steps_per_second": 5.472,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.1599,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9449715370018975,
"number": 519,
"precision": 0.930841121495327,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9723865877712031,
"number": 503,
"precision": 0.9647749510763209,
"recall": 0.9801192842942346
},
"eval_ACT_L2": {
"f1": 0.25,
"number": 16,
"precision": 0.20833333333333334,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.4411764705882353,
"number": 30,
"precision": 0.39473684210526316,
"recall": 0.5
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9633986928104575,
"number": 762,
"precision": 0.9596354166666666,
"recall": 0.9671916010498688
},
"eval_PER": {
"f1": 0.9874908020603386,
"number": 676,
"precision": 0.9824304538799414,
"recall": 0.992603550295858
},
"eval_SPAT": {
"f1": 0.9656652360515022,
"number": 694,
"precision": 0.9588068181818182,
"recall": 0.9726224783861671
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8888888888888888,
"number": 33,
"precision": 0.8205128205128205,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.30769230769230765,
"number": 6,
"precision": 0.2857142857142857,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9569265143992055,
"eval_accuracy-all": 0.9661742800397219,
"eval_accuracy-das": 0.977656405163853,
"eval_accuracy-l1": 0.9626365441906654,
"eval_accuracy-l1l2": 0.9570506454816285,
"eval_accuracy-l2": 0.9697120158887785,
"eval_f1": 0.9685987619583567,
"eval_f1-all": 0.9631356549613872,
"eval_f1-das": 0.9743970315398888,
"eval_f1-l1": 0.9653736006248372,
"eval_f1-l1l2": 0.9673240247588887,
"eval_f1-l2": 0.9602911978821972,
"eval_loss": 0.14895667135715485,
"eval_precision": 0.9669662921348314,
"eval_precision-all": 0.9563078703703703,
"eval_precision-das": 0.9704360679970436,
"eval_precision-l1": 0.9576446280991735,
"eval_precision-l1l2": 0.9621993127147767,
"eval_precision-l2": 0.9546052631578947,
"eval_recall": 0.9702367531003382,
"eval_recall-all": 0.9700616378045201,
"eval_recall-das": 0.9783904619970194,
"eval_recall-l1": 0.9732283464566929,
"eval_recall-l1l2": 0.9725036179450073,
"eval_recall-l2": 0.9660452729693741,
"eval_runtime": 7.5407,
"eval_samples_per_second": 89.647,
"eval_steps_per_second": 5.702,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9387370405278038,
"number": 519,
"precision": 0.9188191881918819,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9685039370078741,
"number": 503,
"precision": 0.9590643274853801,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.26666666666666666,
"number": 16,
"precision": 0.20689655172413793,
"recall": 0.375
},
"eval_CARDINAL": {
"f1": 0.9933677229182019,
"number": 678,
"precision": 0.9926362297496318,
"recall": 0.9941002949852508
},
"eval_DESC": {
"f1": 0.3943661971830986,
"number": 30,
"precision": 0.34146341463414637,
"recall": 0.4666666666666667
},
"eval_FT": {
"f1": 0.25,
"number": 7,
"precision": 1.0,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9617627997407647,
"number": 762,
"precision": 0.9500640204865557,
"recall": 0.973753280839895
},
"eval_PER": {
"f1": 0.9874353288987435,
"number": 676,
"precision": 0.9867060561299852,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9611510791366907,
"number": 694,
"precision": 0.9597701149425287,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9117647058823529,
"number": 33,
"precision": 0.8857142857142857,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.30769230769230765,
"number": 6,
"precision": 0.2857142857142857,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9503475670307845,
"eval_accuracy-all": 0.964746772591857,
"eval_accuracy-das": 0.9734359483614697,
"eval_accuracy-l1": 0.9575471698113207,
"eval_accuracy-l1l2": 0.9512164846077458,
"eval_accuracy-l2": 0.9719463753723933,
"eval_f1": 0.9630707251566697,
"eval_f1-all": 0.9606757937663851,
"eval_f1-das": 0.9716719126087763,
"eval_f1-l1": 0.9613778705636743,
"eval_f1-l1l2": 0.963217403749821,
"eval_f1-l2": 0.9597890573500328,
"eval_loss": 0.16148586571216583,
"eval_precision": 0.956009775605421,
"eval_precision-all": 0.9534547557097427,
"eval_precision-das": 0.9657710710342289,
"eval_precision-l1": 0.9558899844317592,
"eval_precision-l1l2": 0.952718006795017,
"eval_precision-l2": 0.9503916449086162,
"eval_recall": 0.9702367531003382,
"eval_recall-all": 0.9680070443205165,
"eval_recall-das": 0.977645305514158,
"eval_recall-l1": 0.9669291338582677,
"eval_recall-l1l2": 0.9739507959479016,
"eval_recall-l2": 0.9693741677762983,
"eval_runtime": 7.3345,
"eval_samples_per_second": 92.167,
"eval_steps_per_second": 5.863,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9393939393939394,
"number": 519,
"precision": 0.9236499068901304,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.9645669291338583,
"number": 503,
"precision": 0.9551656920077972,
"recall": 0.974155069582505
},
"eval_ACT_L2": {
"f1": 0.3,
"number": 16,
"precision": 0.25,
"recall": 0.375
},
"eval_CARDINAL": {
"f1": 0.9941089837997055,
"number": 678,
"precision": 0.9926470588235294,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.5205479452054794,
"number": 30,
"precision": 0.4418604651162791,
"recall": 0.6333333333333333
},
"eval_FT": {
"f1": 0.25,
"number": 7,
"precision": 1.0,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9659685863874344,
"number": 762,
"precision": 0.9634464751958225,
"recall": 0.968503937007874
},
"eval_PER": {
"f1": 0.9881656804733728,
"number": 676,
"precision": 0.9881656804733728,
"recall": 0.9881656804733728
},
"eval_SPAT": {
"f1": 0.9754689754689755,
"number": 694,
"precision": 0.976878612716763,
"recall": 0.9740634005763689
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.927536231884058,
"number": 33,
"precision": 0.8888888888888888,
"recall": 0.9696969696969697
},
"eval_TITREP": {
"f1": 0.6666666666666666,
"number": 6,
"precision": 1.0,
"recall": 0.5
},
"eval_accuracy": 0.958540218470705,
"eval_accuracy-all": 0.9707671300893744,
"eval_accuracy-das": 0.9749255213505462,
"eval_accuracy-l1": 0.9651191658391262,
"eval_accuracy-l1l2": 0.9589126117179742,
"eval_accuracy-l2": 0.9764150943396226,
"eval_f1": 0.9679667303585477,
"eval_f1-all": 0.9671100716269552,
"eval_f1-das": 0.9717367050948309,
"eval_f1-l1": 0.9678767302167668,
"eval_f1-l1l2": 0.9674726540011515,
"eval_f1-l2": 0.9661354581673307,
"eval_loss": 0.15650230646133423,
"eval_precision": 0.9650380995069475,
"eval_precision-all": 0.963308095515434,
"eval_precision-das": 0.9699331848552338,
"eval_precision-l1": 0.9630977130977131,
"eval_precision-l1l2": 0.962210134554824,
"eval_precision-l2": 0.9635761589403974,
"eval_recall": 0.970913190529876,
"eval_recall-all": 0.9709421778690931,
"eval_recall-das": 0.9735469448584203,
"eval_recall-l1": 0.9727034120734908,
"eval_recall-l1l2": 0.9727930535455861,
"eval_recall-l2": 0.9687083888149135,
"eval_runtime": 7.961,
"eval_samples_per_second": 84.913,
"eval_steps_per_second": 5.401,
"step": 1200
},
{
"epoch": 3.41,
"eval_ACT": {
"f1": 0.949667616334283,
"number": 519,
"precision": 0.9363295880149812,
"recall": 0.9633911368015414
},
"eval_ACT_L1": {
"f1": 0.9686888454011742,
"number": 503,
"precision": 0.953757225433526,
"recall": 0.9840954274353877
},
"eval_ACT_L2": {
"f1": 0.3225806451612903,
"number": 16,
"precision": 0.3333333333333333,
"recall": 0.3125
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_DESC": {
"f1": 0.4571428571428572,
"number": 30,
"precision": 0.4,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9724409448818898,
"number": 762,
"precision": 0.9724409448818898,
"recall": 0.9724409448818898
},
"eval_PER": {
"f1": 0.9844789356984479,
"number": 676,
"precision": 0.983751846381093,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9748020158387328,
"number": 694,
"precision": 0.9741007194244604,
"recall": 0.9755043227665706
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.9117647058823529,
"number": 33,
"precision": 0.8857142857142857,
"recall": 0.9393939393939394
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.3333333333333333,
"recall": 0.5
},
"eval_accuracy": 0.9671052631578947,
"eval_accuracy-all": 0.9757323733862959,
"eval_accuracy-das": 0.9817527308838133,
"eval_accuracy-l1": 0.9728152929493545,
"eval_accuracy-l1l2": 0.9674776564051638,
"eval_accuracy-l2": 0.9786494538232373,
"eval_f1": 0.9712999437253799,
"eval_f1-all": 0.967704223293877,
"eval_f1-das": 0.9736255572065379,
"eval_f1-l1": 0.9666319082377476,
"eval_f1-l1l2": 0.9700201787258577,
"eval_f1-l2": 0.9690721649484535,
"eval_loss": 0.13404050469398499,
"eval_precision": 0.9696629213483146,
"eval_precision-all": 0.9636204889406287,
"eval_precision-das": 0.9707407407407408,
"eval_precision-l1": 0.9601242879337131,
"eval_precision-l1l2": 0.9661211599196096,
"eval_precision-l2": 0.9681063122923588,
"eval_recall": 0.9729425028184893,
"eval_recall-all": 0.971822717933666,
"eval_recall-das": 0.9765275707898659,
"eval_recall-l1": 0.9732283464566929,
"eval_recall-l1l2": 0.9739507959479016,
"eval_recall-l2": 0.9700399467376831,
"eval_runtime": 8.2551,
"eval_samples_per_second": 81.889,
"eval_steps_per_second": 5.209,
"step": 1300
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 526580233077360.0,
"trial_name": null,
"trial_params": null
}