m2_joint_label_ocr_cmbert_iob2 / trainer_state.json
nlpso's picture
Load model and tokenizer
cb92a69
{
"best_metric": 0.9663456090651559,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_2/tmp/222-camembert-ner-joint-labelling-iob2/checkpoint-1500",
"epoch": 3.937007874015748,
"global_step": 1500,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.8654019873532068,
"number": 519,
"precision": 0.814625850340136,
"recall": 0.9229287090558767
},
"eval_ACT_L1": {
"f1": 0.8780934922089826,
"number": 503,
"precision": 0.814625850340136,
"recall": 0.952286282306163
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9533381191672649,
"number": 678,
"precision": 0.9286713286713286,
"recall": 0.9793510324483776
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.8918918918918919,
"number": 762,
"precision": 0.875,
"recall": 0.9094488188976378
},
"eval_PER": {
"f1": 0.9017595307917888,
"number": 676,
"precision": 0.8938953488372093,
"recall": 0.9097633136094675
},
"eval_SPAT": {
"f1": 0.8731808731808732,
"number": 694,
"precision": 0.8411214953271028,
"recall": 0.9077809798270894
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9228043533282714,
"eval_accuracy-all": 0.9454568463680081,
"eval_accuracy-das": 0.9444444444444444,
"eval_accuracy-l1": 0.9322956213616805,
"eval_accuracy-l1l2": 0.9238167552518349,
"eval_accuracy-l2": 0.9586180713743356,
"eval_f1": 0.9154295996401259,
"eval_f1-all": 0.8880242109814094,
"eval_f1-das": 0.9100978401329148,
"eval_f1-l1": 0.8773536895674301,
"eval_f1-l1l2": 0.9032258064516129,
"eval_f1-l2": 0.9019607843137254,
"eval_loss": 0.591022253036499,
"eval_precision": 0.9107182814947415,
"eval_precision-all": 0.8723103057757644,
"eval_precision-das": 0.9022693997071742,
"eval_precision-l1": 0.851358024691358,
"eval_precision-l1l2": 0.8913412563667232,
"eval_precision-l2": 0.900464499004645,
"eval_recall": 0.9201899163463713,
"eval_recall-all": 0.9043146463164073,
"eval_recall-das": 0.9180633147113594,
"eval_recall-l1": 0.90498687664042,
"eval_recall-l1l2": 0.9154315605928509,
"eval_recall-l2": 0.903462050599201,
"eval_runtime": 6.4471,
"eval_samples_per_second": 104.854,
"eval_steps_per_second": 6.67,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.8866359447004608,
"number": 519,
"precision": 0.8498233215547704,
"recall": 0.9267822736030829
},
"eval_ACT_L1": {
"f1": 0.8999064546304959,
"number": 503,
"precision": 0.8498233215547704,
"recall": 0.9562624254473161
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9636627906976744,
"number": 678,
"precision": 0.9498567335243553,
"recall": 0.9778761061946902
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9296320206584893,
"number": 762,
"precision": 0.9148665819567979,
"recall": 0.9448818897637795
},
"eval_PER": {
"f1": 0.9425625920471281,
"number": 676,
"precision": 0.9384164222873901,
"recall": 0.9467455621301775
},
"eval_SPAT": {
"f1": 0.9255846917080085,
"number": 694,
"precision": 0.9107391910739191,
"recall": 0.9409221902017291
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.0,
"number": 33,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9325487218425715,
"eval_accuracy-all": 0.9526069349531764,
"eval_accuracy-das": 0.9507719564667173,
"eval_accuracy-l1": 0.942925841559099,
"eval_accuracy-l1l2": 0.9331814730447988,
"eval_accuracy-l2": 0.9622880283472539,
"eval_f1": 0.933272912654356,
"eval_f1-all": 0.9208108502260464,
"eval_f1-das": 0.9271007234279354,
"eval_f1-l1": 0.9167958656330749,
"eval_f1-l1l2": 0.9259901705695288,
"eval_f1-l2": 0.9260127217944426,
"eval_loss": 0.3781684637069702,
"eval_precision": 0.9352861035422343,
"eval_precision-all": 0.9150724637681159,
"eval_precision-das": 0.9235033259423503,
"eval_precision-l1": 0.9027989821882951,
"eval_precision-l1l2": 0.9211964337072188,
"eval_precision-l2": 0.9313131313131313,
"eval_recall": 0.9312683698846936,
"eval_recall-all": 0.9266216612855885,
"eval_recall-das": 0.9307262569832402,
"eval_recall-l1": 0.9312335958005249,
"eval_recall-l1l2": 0.930834059866318,
"eval_recall-l2": 0.9207723035952063,
"eval_runtime": 5.9776,
"eval_samples_per_second": 113.088,
"eval_steps_per_second": 7.193,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9058039961941009,
"number": 519,
"precision": 0.8947368421052632,
"recall": 0.9171483622350675
},
"eval_ACT_L1": {
"f1": 0.9198067632850242,
"number": 503,
"precision": 0.8947368421052632,
"recall": 0.9463220675944334
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9659173313995648,
"number": 678,
"precision": 0.9500713266761769,
"recall": 0.9823008849557522
},
"eval_DESC": {
"f1": 0.14035087719298248,
"number": 30,
"precision": 0.14814814814814814,
"recall": 0.13333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9347826086956521,
"number": 762,
"precision": 0.9114713216957606,
"recall": 0.9593175853018373
},
"eval_PER": {
"f1": 0.9528023598820058,
"number": 676,
"precision": 0.95,
"recall": 0.9556213017751479
},
"eval_SPAT": {
"f1": 0.931545518701482,
"number": 694,
"precision": 0.9128630705394191,
"recall": 0.9510086455331412
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.09523809523809523,
"number": 33,
"precision": 0.2222222222222222,
"recall": 0.06060606060606061
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9405213869906353,
"eval_accuracy-all": 0.9569096431283219,
"eval_accuracy-das": 0.9591242723361174,
"eval_accuracy-l1": 0.9511516071880537,
"eval_accuracy-l1l2": 0.9409010377119716,
"eval_accuracy-l2": 0.9626676790685902,
"eval_f1": 0.9373019465821638,
"eval_f1-all": 0.9257375381485249,
"eval_f1-das": 0.9348189415041782,
"eval_f1-l1": 0.9237134729764676,
"eval_f1-l1l2": 0.9300850511748595,
"eval_f1-l2": 0.9283344392833444,
"eval_loss": 0.2862992286682129,
"eval_precision": 0.9383639247677317,
"eval_precision-all": 0.9168105929763961,
"eval_precision-das": 0.9322222222222222,
"eval_precision-l1": 0.910295616717635,
"eval_precision-l1l2": 0.9227688787185355,
"eval_precision-l2": 0.9252645502645502,
"eval_recall": 0.9362423694325118,
"eval_recall-all": 0.9348400352216025,
"eval_recall-das": 0.9374301675977653,
"eval_recall-l1": 0.9375328083989501,
"eval_recall-l1l2": 0.9375181633246149,
"eval_recall-l2": 0.9314247669773635,
"eval_runtime": 6.3755,
"eval_samples_per_second": 106.031,
"eval_steps_per_second": 6.745,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9381541389153186,
"number": 519,
"precision": 0.9266917293233082,
"recall": 0.9499036608863198
},
"eval_ACT_L1": {
"f1": 0.9526570048309179,
"number": 503,
"precision": 0.9266917293233082,
"recall": 0.9801192842942346
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.976,
"number": 678,
"precision": 0.9626972740315638,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.03571428571428572,
"number": 30,
"precision": 0.038461538461538464,
"recall": 0.03333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9352331606217616,
"number": 762,
"precision": 0.9232736572890026,
"recall": 0.94750656167979
},
"eval_PER": {
"f1": 0.938506588579795,
"number": 676,
"precision": 0.9289855072463769,
"recall": 0.9482248520710059
},
"eval_SPAT": {
"f1": 0.929637526652452,
"number": 694,
"precision": 0.9172510518934082,
"recall": 0.9423631123919308
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.3614457831325301,
"number": 33,
"precision": 0.3,
"recall": 0.45454545454545453
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9454568463680081,
"eval_accuracy-all": 0.9614021766641356,
"eval_accuracy-das": 0.9687420906099722,
"eval_accuracy-l1": 0.9538091622374083,
"eval_accuracy-l1l2": 0.94596304732979,
"eval_accuracy-l2": 0.9689951910908631,
"eval_f1": 0.9435111060998985,
"eval_f1-all": 0.9270697404668696,
"eval_f1-das": 0.9485566247224279,
"eval_f1-l1": 0.925504397309881,
"eval_f1-l1l2": 0.9360481789503872,
"eval_f1-l2": 0.929066314747608,
"eval_loss": 0.2532674968242645,
"eval_precision": 0.9410706252811516,
"eval_precision-all": 0.9160458452722063,
"eval_precision-das": 0.9426259654284663,
"eval_precision-l1": 0.9122896481387047,
"eval_precision-l1l2": 0.9238607415793942,
"eval_precision-l2": 0.920863309352518,
"eval_recall": 0.9459642776396111,
"eval_recall-all": 0.9383621954798943,
"eval_recall-das": 0.954562383612663,
"eval_recall-l1": 0.9391076115485564,
"eval_recall-l1l2": 0.948561464690497,
"eval_recall-l2": 0.9374167776298269,
"eval_runtime": 6.3298,
"eval_samples_per_second": 106.797,
"eval_steps_per_second": 6.793,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.5519,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9220657276995305,
"number": 519,
"precision": 0.8992673992673993,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9379178605539638,
"number": 503,
"precision": 0.9025735294117647,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9831748354059985,
"number": 678,
"precision": 0.9753265602322206,
"recall": 0.9911504424778761
},
"eval_DESC": {
"f1": 0.0,
"number": 30,
"precision": 0.0,
"recall": 0.0
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.938749194068343,
"number": 762,
"precision": 0.9226869455006337,
"recall": 0.9553805774278216
},
"eval_PER": {
"f1": 0.9603524229074889,
"number": 676,
"precision": 0.9533527696793003,
"recall": 0.9674556213017751
},
"eval_SPAT": {
"f1": 0.926657263751763,
"number": 694,
"precision": 0.9074585635359116,
"recall": 0.946685878962536
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.30952380952380953,
"number": 33,
"precision": 0.2549019607843137,
"recall": 0.3939393939393939
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9468488990129081,
"eval_accuracy-all": 0.9627942293090357,
"eval_accuracy-das": 0.9646924829157175,
"eval_accuracy-l1": 0.9558339660845355,
"eval_accuracy-l1l2": 0.9474816502151354,
"eval_accuracy-l2": 0.9697544925335359,
"eval_f1": 0.9470953186689227,
"eval_f1-all": 0.9313441483198146,
"eval_f1-das": 0.9477377654662973,
"eval_f1-l1": 0.9310255747868768,
"eval_f1-l1l2": 0.9406353313209718,
"eval_f1-l2": 0.9317507418397627,
"eval_loss": 0.23691155016422272,
"eval_precision": 0.945069788383611,
"eval_precision-all": 0.919359450957964,
"eval_precision-das": 0.9399267399267399,
"eval_precision-l1": 0.9165818921668362,
"eval_precision-l1l2": 0.9306029579067122,
"eval_precision-l2": 0.9229261920313521,
"eval_recall": 0.9491295500791318,
"eval_recall-all": 0.943645435867332,
"eval_recall-das": 0.9556797020484171,
"eval_recall-l1": 0.9459317585301837,
"eval_recall-l1l2": 0.9508863702412089,
"eval_recall-l2": 0.940745672436751,
"eval_runtime": 6.2943,
"eval_samples_per_second": 107.399,
"eval_steps_per_second": 6.832,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9318181818181819,
"number": 519,
"precision": 0.9162011173184358,
"recall": 0.9479768786127167
},
"eval_ACT_L1": {
"f1": 0.9470644850818095,
"number": 503,
"precision": 0.917910447761194,
"recall": 0.9781312127236581
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9823529411764708,
"number": 678,
"precision": 0.9794721407624634,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.12903225806451615,
"number": 30,
"precision": 0.125,
"recall": 0.13333333333333333
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9453836150845253,
"number": 762,
"precision": 0.9368556701030928,
"recall": 0.9540682414698163
},
"eval_PER": {
"f1": 0.9631811487481591,
"number": 676,
"precision": 0.9589442815249267,
"recall": 0.9674556213017751
},
"eval_SPAT": {
"f1": 0.9571428571428571,
"number": 694,
"precision": 0.9490084985835694,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.29885057471264365,
"number": 33,
"precision": 0.24074074074074073,
"recall": 0.3939393939393939
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9477347506960263,
"eval_accuracy-all": 0.9635535307517085,
"eval_accuracy-das": 0.9658314350797267,
"eval_accuracy-l1": 0.9579853201721084,
"eval_accuracy-l1l2": 0.9481144014173627,
"eval_accuracy-l2": 0.9691217413313086,
"eval_f1": 0.9496841155234658,
"eval_f1-all": 0.9389179755671903,
"eval_f1-das": 0.9519391352755613,
"eval_f1-l1": 0.9427609427609427,
"eval_f1-l1l2": 0.9418202764976958,
"eval_f1-l2": 0.9339966832504146,
"eval_loss": 0.21212993562221527,
"eval_precision": 0.9477595136230579,
"eval_precision-all": 0.93052752954742,
"eval_precision-das": 0.948594674556213,
"eval_precision-l1": 0.9304703476482618,
"eval_precision-l1l2": 0.9334855837853269,
"eval_precision-l2": 0.930601454064772,
"eval_recall": 0.9516165498530409,
"eval_recall-all": 0.9474611094804813,
"eval_recall-das": 0.9553072625698324,
"eval_recall-l1": 0.9553805774278216,
"eval_recall-l1l2": 0.9503051438535309,
"eval_recall-l2": 0.9374167776298269,
"eval_runtime": 6.0489,
"eval_samples_per_second": 111.755,
"eval_steps_per_second": 7.109,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9243856332703214,
"number": 519,
"precision": 0.9072356215213359,
"recall": 0.9421965317919075
},
"eval_ACT_L1": {
"f1": 0.9485935984481086,
"number": 503,
"precision": 0.9261363636363636,
"recall": 0.9721669980119284
},
"eval_ACT_L2": {
"f1": 0.0,
"number": 16,
"precision": 0.0,
"recall": 0.0
},
"eval_CARDINAL": {
"f1": 0.9831254585473221,
"number": 678,
"precision": 0.9781021897810219,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.2535211267605634,
"number": 30,
"precision": 0.21951219512195122,
"recall": 0.3
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9397278029812053,
"number": 762,
"precision": 0.9282970550576184,
"recall": 0.9514435695538058
},
"eval_PER": {
"f1": 0.9742078113485629,
"number": 676,
"precision": 0.9706314243759178,
"recall": 0.977810650887574
},
"eval_SPAT": {
"f1": 0.9484978540772532,
"number": 694,
"precision": 0.9417613636363636,
"recall": 0.9553314121037464
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.6486486486486487,
"number": 33,
"precision": 0.5853658536585366,
"recall": 0.7272727272727273
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9503923057453809,
"eval_accuracy-all": 0.9634902556314857,
"eval_accuracy-das": 0.9702606934953176,
"eval_accuracy-l1": 0.9583649708934447,
"eval_accuracy-l1l2": 0.9508985067071627,
"eval_accuracy-l2": 0.9686155403695267,
"eval_f1": 0.9554728891894939,
"eval_f1-all": 0.9421511627906977,
"eval_f1-das": 0.956747726007054,
"eval_f1-l1": 0.9442860844778439,
"eval_f1-l1l2": 0.948141745894555,
"eval_f1-l2": 0.9394240317775571,
"eval_loss": 0.18599489331245422,
"eval_precision": 0.9527877697841727,
"eval_precision-all": 0.9331989634321912,
"eval_precision-das": 0.9537379718726869,
"eval_precision-l1": 0.932446264073695,
"eval_precision-l1l2": 0.9400171379605827,
"eval_precision-l2": 0.934167215273206,
"eval_recall": 0.9581731856206195,
"eval_recall-all": 0.9512767830936307,
"eval_recall-das": 0.9597765363128492,
"eval_recall-l1": 0.9564304461942257,
"eval_recall-l1l2": 0.95640802092415,
"eval_recall-l2": 0.9447403462050599,
"eval_runtime": 6.6597,
"eval_samples_per_second": 101.506,
"eval_steps_per_second": 6.457,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9190207156308852,
"number": 519,
"precision": 0.8987108655616943,
"recall": 0.9402697495183044
},
"eval_ACT_L1": {
"f1": 0.9472656249999999,
"number": 503,
"precision": 0.9309021113243762,
"recall": 0.9642147117296223
},
"eval_ACT_L2": {
"f1": 0.15789473684210525,
"number": 16,
"precision": 0.13636363636363635,
"recall": 0.1875
},
"eval_CARDINAL": {
"f1": 0.9867841409691629,
"number": 678,
"precision": 0.9824561403508771,
"recall": 0.9911504424778761
},
"eval_DESC": {
"f1": 0.29629629629629634,
"number": 30,
"precision": 0.23529411764705882,
"recall": 0.4
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9518229166666666,
"number": 762,
"precision": 0.9444444444444444,
"recall": 0.9593175853018373
},
"eval_PER": {
"f1": 0.9690721649484536,
"number": 676,
"precision": 0.9648093841642229,
"recall": 0.9733727810650887
},
"eval_SPAT": {
"f1": 0.9548387096774194,
"number": 694,
"precision": 0.9500713266761769,
"recall": 0.9596541786743515
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.823529411764706,
"number": 33,
"precision": 0.8,
"recall": 0.8484848484848485
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9468488990129081,
"eval_accuracy-all": 0.960642875221463,
"eval_accuracy-das": 0.9701341432548722,
"eval_accuracy-l1": 0.9546950139205265,
"eval_accuracy-l1l2": 0.9473550999746899,
"eval_accuracy-l2": 0.9665907365223994,
"eval_f1": 0.9580797836375928,
"eval_f1-all": 0.9464960744402442,
"eval_f1-das": 0.9602378298030472,
"eval_f1-l1": 0.9435233160621762,
"eval_f1-l1l2": 0.9526004898429622,
"eval_f1-l2": 0.9502982107355864,
"eval_loss": 0.182948499917984,
"eval_precision": 0.9550662772410694,
"eval_precision-all": 0.9377700950734659,
"eval_precision-das": 0.9581015943641082,
"eval_precision-l1": 0.931457800511509,
"eval_precision-l1l2": 0.9445714285714286,
"eval_precision-l2": 0.945910290237467,
"eval_recall": 0.961112367171603,
"eval_recall-all": 0.9553859700616378,
"eval_recall-das": 0.9623836126629423,
"eval_recall-l1": 0.9559055118110236,
"eval_recall-l1l2": 0.960767218831735,
"eval_recall-l2": 0.9547270306258322,
"eval_runtime": 6.3516,
"eval_samples_per_second": 106.43,
"eval_steps_per_second": 6.77,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9289099526066352,
"number": 519,
"precision": 0.914179104477612,
"recall": 0.9441233140655106
},
"eval_ACT_L1": {
"f1": 0.9530332681017614,
"number": 503,
"precision": 0.9383429672447013,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.1818181818181818,
"number": 16,
"precision": 0.17647058823529413,
"recall": 0.1875
},
"eval_CARDINAL": {
"f1": 0.9874723655121592,
"number": 678,
"precision": 0.9867452135493373,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.35294117647058826,
"number": 30,
"precision": 0.3157894736842105,
"recall": 0.4
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9505851755526658,
"number": 762,
"precision": 0.9420103092783505,
"recall": 0.9593175853018373
},
"eval_PER": {
"f1": 0.9748892171344165,
"number": 676,
"precision": 0.9734513274336283,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9577060931899642,
"number": 694,
"precision": 0.9529243937232525,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8285714285714285,
"number": 33,
"precision": 0.7837837837837838,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.0,
"number": 6,
"precision": 0.0,
"recall": 0.0
},
"eval_accuracy": 0.9483675018982536,
"eval_accuracy-all": 0.9605163249810175,
"eval_accuracy-das": 0.9707668944570995,
"eval_accuracy-l1": 0.9549481144014174,
"eval_accuracy-l1l2": 0.9495064540622628,
"eval_accuracy-l2": 0.9660845355606176,
"eval_f1": 0.9564628919467629,
"eval_f1-all": 0.9511448155169899,
"eval_f1-das": 0.9598811292719168,
"eval_f1-l1": 0.9513147617807862,
"eval_f1-l1l2": 0.9554655870445344,
"eval_f1-l2": 0.9509283819628648,
"eval_loss": 0.19901591539382935,
"eval_precision": 0.9543101507990097,
"eval_precision-all": 0.9452173913043478,
"eval_precision-das": 0.9573916265283439,
"eval_precision-l1": 0.943698347107438,
"eval_precision-l1l2": 0.9507913669064748,
"eval_precision-l2": 0.9471598414795245,
"eval_recall": 0.9586253673976939,
"eval_recall-all": 0.9571470501907837,
"eval_recall-das": 0.9623836126629423,
"eval_recall-l1": 0.9590551181102362,
"eval_recall-l1l2": 0.960185992444057,
"eval_recall-l2": 0.9547270306258322,
"eval_runtime": 6.3187,
"eval_samples_per_second": 106.983,
"eval_steps_per_second": 6.805,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.1804,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9382716049382717,
"number": 519,
"precision": 0.9250936329588015,
"recall": 0.9518304431599229
},
"eval_ACT_L1": {
"f1": 0.9585798816568047,
"number": 503,
"precision": 0.9510763209393346,
"recall": 0.9662027833001988
},
"eval_ACT_L2": {
"f1": 0.41025641025641024,
"number": 16,
"precision": 0.34782608695652173,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9831748354059985,
"number": 678,
"precision": 0.9753265602322206,
"recall": 0.9911504424778761
},
"eval_DESC": {
"f1": 0.4473684210526315,
"number": 30,
"precision": 0.3695652173913043,
"recall": 0.5666666666666667
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9503916449086163,
"number": 762,
"precision": 0.9454545454545454,
"recall": 0.9553805774278216
},
"eval_PER": {
"f1": 0.9734513274336284,
"number": 676,
"precision": 0.9705882352941176,
"recall": 0.9763313609467456
},
"eval_SPAT": {
"f1": 0.9512893982808024,
"number": 694,
"precision": 0.9458689458689459,
"recall": 0.9567723342939481
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7936507936507938,
"number": 33,
"precision": 0.8333333333333334,
"recall": 0.7575757575757576
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.5,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9555808656036446,
"eval_accuracy-all": 0.967160212604404,
"eval_accuracy-das": 0.9707668944570995,
"eval_accuracy-l1": 0.961781827385472,
"eval_accuracy-l1l2": 0.9558339660845355,
"eval_accuracy-l2": 0.9725385978233358,
"eval_f1": 0.9617733544446958,
"eval_f1-all": 0.9506046918257322,
"eval_f1-das": 0.9622466059140785,
"eval_f1-l1": 0.9505723204994797,
"eval_f1-l1l2": 0.9573267756400984,
"eval_f1-l2": 0.9506459092414706,
"eval_loss": 0.17258137464523315,
"eval_precision": 0.9622086444897036,
"eval_precision-all": 0.9438657407407407,
"eval_precision-das": 0.9609955423476969,
"eval_precision-l1": 0.9422382671480144,
"eval_precision-l1l2": 0.9530529953917051,
"eval_precision-l2": 0.9459459459459459,
"eval_recall": 0.9613384580601402,
"eval_recall-all": 0.9574405635456413,
"eval_recall-das": 0.9635009310986965,
"eval_recall-l1": 0.9590551181102362,
"eval_recall-l1l2": 0.9616390584132519,
"eval_recall-l2": 0.9553928095872171,
"eval_runtime": 6.352,
"eval_samples_per_second": 106.422,
"eval_steps_per_second": 6.769,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9343339587242027,
"number": 519,
"precision": 0.9104204753199269,
"recall": 0.9595375722543352
},
"eval_ACT_L1": {
"f1": 0.9561830574488801,
"number": 503,
"precision": 0.9370229007633588,
"recall": 0.9761431411530815
},
"eval_ACT_L2": {
"f1": 0.358974358974359,
"number": 16,
"precision": 0.30434782608695654,
"recall": 0.4375
},
"eval_CARDINAL": {
"f1": 0.9875091844232182,
"number": 678,
"precision": 0.9838945827232797,
"recall": 0.9911504424778761
},
"eval_DESC": {
"f1": 0.38961038961038963,
"number": 30,
"precision": 0.3191489361702128,
"recall": 0.5
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9499024072869227,
"number": 762,
"precision": 0.9419354838709677,
"recall": 0.958005249343832
},
"eval_PER": {
"f1": 0.9771554900515844,
"number": 676,
"precision": 0.973568281938326,
"recall": 0.9807692307692307
},
"eval_SPAT": {
"f1": 0.9521770164168452,
"number": 694,
"precision": 0.9434229137199435,
"recall": 0.9610951008645533
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8787878787878788,
"number": 33,
"precision": 0.8787878787878788,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.5,
"number": 6,
"precision": 0.4,
"recall": 0.6666666666666666
},
"eval_accuracy": 0.9477347506960263,
"eval_accuracy-all": 0.9626676790685902,
"eval_accuracy-das": 0.9689951910908631,
"eval_accuracy-l1": 0.9562136168058719,
"eval_accuracy-l1l2": 0.9482409516578082,
"eval_accuracy-l2": 0.9691217413313086,
"eval_f1": 0.9593422682734541,
"eval_f1-all": 0.9514140681653372,
"eval_f1-das": 0.9622501850481124,
"eval_f1-l1": 0.9503105590062113,
"eval_f1-l1l2": 0.9570852534562212,
"eval_f1-l2": 0.9528208512042231,
"eval_loss": 0.1915351301431656,
"eval_precision": 0.9557899461400359,
"eval_precision-all": 0.9403669724770642,
"eval_precision-das": 0.9562339095255609,
"eval_precision-l1": 0.9372128637059725,
"eval_precision-l1l2": 0.9486154724521838,
"eval_precision-l2": 0.9444081098757358,
"eval_recall": 0.9629210942799005,
"eval_recall-all": 0.962723803933079,
"eval_recall-das": 0.9683426443202979,
"eval_recall-l1": 0.9637795275590552,
"eval_recall-l1l2": 0.965707643126998,
"eval_recall-l2": 0.9613848202396804,
"eval_runtime": 6.3274,
"eval_samples_per_second": 106.838,
"eval_steps_per_second": 6.796,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9278350515463917,
"number": 519,
"precision": 0.9032846715328468,
"recall": 0.953757225433526
},
"eval_ACT_L1": {
"f1": 0.9502439024390243,
"number": 503,
"precision": 0.9329501915708812,
"recall": 0.9681908548707754
},
"eval_ACT_L2": {
"f1": 0.380952380952381,
"number": 16,
"precision": 0.3076923076923077,
"recall": 0.5
},
"eval_CARDINAL": {
"f1": 0.9831254585473221,
"number": 678,
"precision": 0.9781021897810219,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.4210526315789474,
"number": 30,
"precision": 0.34782608695652173,
"recall": 0.5333333333333333
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9478487614080835,
"number": 762,
"precision": 0.9417098445595855,
"recall": 0.9540682414698163
},
"eval_PER": {
"f1": 0.9785977859778597,
"number": 676,
"precision": 0.9764359351988218,
"recall": 0.9807692307692307
},
"eval_SPAT": {
"f1": 0.9563350035790981,
"number": 694,
"precision": 0.9502133712660028,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8787878787878788,
"number": 33,
"precision": 0.8787878787878788,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.4,
"number": 6,
"precision": 0.5,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9583649708934447,
"eval_accuracy-all": 0.9676664135661858,
"eval_accuracy-das": 0.9773475069602632,
"eval_accuracy-l1": 0.964819033156163,
"eval_accuracy-l1l2": 0.958997722095672,
"eval_accuracy-l2": 0.9705137939762085,
"eval_f1": 0.9606760563380281,
"eval_f1-all": 0.9510103212676261,
"eval_f1-das": 0.9645179268066134,
"eval_f1-l1": 0.9514915693904021,
"eval_f1-l1l2": 0.9574130215100333,
"eval_f1-l2": 0.9503968253968254,
"eval_loss": 0.16211041808128357,
"eval_precision": 0.9575471698113207,
"eval_precision-all": 0.9421082949308756,
"eval_precision-das": 0.9621942179392142,
"eval_precision-l1": 0.9405128205128205,
"eval_precision-l1l2": 0.9512335054503729,
"eval_precision-l2": 0.9441524310118266,
"eval_recall": 0.9638254578340493,
"eval_recall-all": 0.9600821837393602,
"eval_recall-das": 0.966852886405959,
"eval_recall-l1": 0.9627296587926509,
"eval_recall-l1l2": 0.963673350770125,
"eval_recall-l2": 0.9567243675099867,
"eval_runtime": 6.3446,
"eval_samples_per_second": 106.548,
"eval_steps_per_second": 6.777,
"step": 1200
},
{
"epoch": 3.41,
"eval_ACT": {
"f1": 0.926829268292683,
"number": 519,
"precision": 0.903107861060329,
"recall": 0.9518304431599229
},
"eval_ACT_L1": {
"f1": 0.9494163424124514,
"number": 503,
"precision": 0.9295238095238095,
"recall": 0.9701789264413518
},
"eval_ACT_L2": {
"f1": 0.3157894736842105,
"number": 16,
"precision": 0.2727272727272727,
"recall": 0.375
},
"eval_CARDINAL": {
"f1": 0.9845928099779897,
"number": 678,
"precision": 0.9795620437956204,
"recall": 0.9896755162241888
},
"eval_DESC": {
"f1": 0.32608695652173914,
"number": 30,
"precision": 0.24193548387096775,
"recall": 0.5
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9449125081011017,
"number": 762,
"precision": 0.9334186939820742,
"recall": 0.9566929133858267
},
"eval_PER": {
"f1": 0.9704579025110782,
"number": 676,
"precision": 0.9690265486725663,
"recall": 0.9718934911242604
},
"eval_SPAT": {
"f1": 0.9458689458689459,
"number": 694,
"precision": 0.9352112676056338,
"recall": 0.9567723342939481
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.7878787878787878,
"number": 33,
"precision": 0.7878787878787878,
"recall": 0.7878787878787878
},
"eval_TITREP": {
"f1": 0.28571428571428575,
"number": 6,
"precision": 0.25,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9541888129587446,
"eval_accuracy-all": 0.9685522652493039,
"eval_accuracy-das": 0.9691217413313086,
"eval_accuracy-l1": 0.9625411288281448,
"eval_accuracy-l1l2": 0.9549481144014174,
"eval_accuracy-l2": 0.9745634016704632,
"eval_f1": 0.9562970452758117,
"eval_f1-all": 0.9428612758570809,
"eval_f1-das": 0.9577777777777778,
"eval_f1-l1": 0.9402061855670103,
"eval_f1-l1l2": 0.9518608995545338,
"eval_f1-l2": 0.9462578305308275,
"eval_loss": 0.17513133585453033,
"eval_precision": 0.9504242965609647,
"eval_precision-all": 0.9295493439817456,
"eval_precision-das": 0.9524861878453039,
"eval_precision-l1": 0.9235443037974683,
"eval_precision-l1l2": 0.9414440022740194,
"eval_precision-l2": 0.9372958850424559,
"eval_recall": 0.962242821614289,
"eval_recall-all": 0.9565600234810684,
"eval_recall-das": 0.9631284916201117,
"eval_recall-l1": 0.9574803149606299,
"eval_recall-l1l2": 0.962510897994769,
"eval_recall-l2": 0.9553928095872171,
"eval_runtime": 6.5477,
"eval_samples_per_second": 103.242,
"eval_steps_per_second": 6.567,
"step": 1300
},
{
"epoch": 3.67,
"eval_ACT": {
"f1": 0.9325735992402658,
"number": 519,
"precision": 0.9194756554307116,
"recall": 0.9460500963391136
},
"eval_ACT_L1": {
"f1": 0.9603960396039604,
"number": 503,
"precision": 0.9566074950690335,
"recall": 0.9642147117296223
},
"eval_ACT_L2": {
"f1": 0.27906976744186046,
"number": 16,
"precision": 0.2222222222222222,
"recall": 0.375
},
"eval_CARDINAL": {
"f1": 0.9823529411764708,
"number": 678,
"precision": 0.9794721407624634,
"recall": 0.9852507374631269
},
"eval_DESC": {
"f1": 0.3614457831325301,
"number": 30,
"precision": 0.2830188679245283,
"recall": 0.5
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9366925064599483,
"number": 762,
"precision": 0.9223918575063613,
"recall": 0.9514435695538058
},
"eval_PER": {
"f1": 0.9764011799410028,
"number": 676,
"precision": 0.9735294117647059,
"recall": 0.9792899408284024
},
"eval_SPAT": {
"f1": 0.9571428571428571,
"number": 694,
"precision": 0.9490084985835694,
"recall": 0.9654178674351584
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.8656716417910447,
"number": 33,
"precision": 0.8529411764705882,
"recall": 0.8787878787878788
},
"eval_TITREP": {
"f1": 0.25,
"number": 6,
"precision": 0.2,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.945709946848899,
"eval_accuracy-all": 0.9593773728170083,
"eval_accuracy-das": 0.967603138445963,
"eval_accuracy-l1": 0.9546950139205265,
"eval_accuracy-l1l2": 0.9464692482915718,
"eval_accuracy-l2": 0.9640597317134902,
"eval_f1": 0.9548213081591369,
"eval_f1-all": 0.9466202494923122,
"eval_f1-das": 0.9599555061179089,
"eval_f1-l1": 0.9514411841080239,
"eval_f1-l1l2": 0.9515989628349178,
"eval_f1-l2": 0.9405192244495562,
"eval_loss": 0.2079046368598938,
"eval_precision": 0.9492737430167598,
"eval_precision-all": 0.935761399483797,
"eval_precision-das": 0.955703211517165,
"eval_precision-l1": 0.9414182939362795,
"eval_precision-l1l2": 0.9434447300771208,
"eval_precision-l2": 0.9286177806619078,
"eval_recall": 0.9604340945059914,
"eval_recall-all": 0.9577340769004989,
"eval_recall-das": 0.964245810055866,
"eval_recall-l1": 0.9616797900262467,
"eval_recall-l1l2": 0.959895379250218,
"eval_recall-l2": 0.9527296937416777,
"eval_runtime": 6.2012,
"eval_samples_per_second": 109.01,
"eval_steps_per_second": 6.934,
"step": 1400
},
{
"epoch": 3.94,
"learning_rate": 7e-05,
"loss": 0.1142,
"step": 1500
},
{
"epoch": 3.94,
"eval_ACT": {
"f1": 0.9420702754036088,
"number": 519,
"precision": 0.9288389513108615,
"recall": 0.9556840077071291
},
"eval_ACT_L1": {
"f1": 0.9574468085106382,
"number": 503,
"precision": 0.9322033898305084,
"recall": 0.9840954274353877
},
"eval_ACT_L2": {
"f1": 0.10526315789473684,
"number": 16,
"precision": 0.3333333333333333,
"recall": 0.0625
},
"eval_CARDINAL": {
"f1": 0.9874723655121592,
"number": 678,
"precision": 0.9867452135493373,
"recall": 0.9882005899705014
},
"eval_DESC": {
"f1": 0.423076923076923,
"number": 30,
"precision": 0.5,
"recall": 0.36666666666666664
},
"eval_FT": {
"f1": 0.22222222222222224,
"number": 7,
"precision": 0.5,
"recall": 0.14285714285714285
},
"eval_LOC": {
"f1": 0.9548133595284872,
"number": 762,
"precision": 0.9529411764705882,
"recall": 0.9566929133858267
},
"eval_PER": {
"f1": 0.9830258302583026,
"number": 676,
"precision": 0.9808541973490427,
"recall": 0.985207100591716
},
"eval_SPAT": {
"f1": 0.9577060931899642,
"number": 694,
"precision": 0.9529243937232525,
"recall": 0.962536023054755
},
"eval_TITRE": {
"f1": 0.0,
"number": 2,
"precision": 0.0,
"recall": 0.0
},
"eval_TITREH": {
"f1": 0.923076923076923,
"number": 33,
"precision": 0.9375,
"recall": 0.9090909090909091
},
"eval_TITREP": {
"f1": 0.30769230769230765,
"number": 6,
"precision": 0.2857142857142857,
"recall": 0.3333333333333333
},
"eval_accuracy": 0.9608959757023539,
"eval_accuracy-all": 0.9707668944570995,
"eval_accuracy-das": 0.9735509997468995,
"eval_accuracy-l1": 0.9673500379650721,
"eval_accuracy-l1l2": 0.9611490761832447,
"eval_accuracy-l2": 0.9741837509491268,
"eval_f1": 0.9663456090651559,
"eval_f1-all": 0.9586994727592267,
"eval_f1-das": 0.9682215201635384,
"eval_f1-l1": 0.9588327253778008,
"eval_f1-l1l2": 0.9645348837209302,
"eval_f1-l2": 0.9585284280936456,
"eval_loss": 0.18689921498298645,
"eval_precision": 0.9686506133575647,
"eval_precision-all": 0.9567377959660918,
"eval_precision-das": 0.966246290801187,
"eval_precision-l1": 0.9518882565959649,
"eval_precision-l1l2": 0.964815353300378,
"eval_precision-l2": 0.9630376344086021,
"eval_recall": 0.9640515487225865,
"eval_recall-all": 0.9606692104490754,
"eval_recall-das": 0.9702048417132216,
"eval_recall-l1": 0.9658792650918635,
"eval_recall-l1l2": 0.9642545771578029,
"eval_recall-l2": 0.9540612516644474,
"eval_runtime": 6.34,
"eval_samples_per_second": 106.625,
"eval_steps_per_second": 6.782,
"step": 1500
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 611851151350824.0,
"trial_name": null,
"trial_params": null
}