layoutlmv3 / trainer_state.json
MonkeeZhang's picture
new update
06ab5ca
{
"best_metric": null,
"best_model_checkpoint": null,
"epoch": 7.874015748031496,
"global_step": 1000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.16,
"eval_accuracy": 0.8157711500522223,
"eval_f1": 0.5942329873125721,
"eval_loss": 0.4848455488681793,
"eval_precision": 0.5368903709879116,
"eval_recall": 0.6652892561983471,
"eval_runtime": 2.2498,
"eval_samples_per_second": 41.337,
"eval_steps_per_second": 1.333,
"step": 20
},
{
"epoch": 0.31,
"eval_accuracy": 0.8389520714865962,
"eval_f1": 0.7553421368547419,
"eval_loss": 0.39182421565055847,
"eval_precision": 0.705697622252131,
"eval_recall": 0.8125,
"eval_runtime": 2.9557,
"eval_samples_per_second": 31.465,
"eval_steps_per_second": 1.015,
"step": 40
},
{
"epoch": 0.47,
"eval_accuracy": 0.8849947777648833,
"eval_f1": 0.8393364928909953,
"eval_loss": 0.34172168374061584,
"eval_precision": 0.7753940455341506,
"eval_recall": 0.9147727272727273,
"eval_runtime": 2.9806,
"eval_samples_per_second": 31.202,
"eval_steps_per_second": 1.007,
"step": 60
},
{
"epoch": 0.63,
"eval_accuracy": 0.8782929093652083,
"eval_f1": 0.878610002347969,
"eval_loss": 0.3457355201244354,
"eval_precision": 0.8054240206629358,
"eval_recall": 0.9664256198347108,
"eval_runtime": 3.288,
"eval_samples_per_second": 28.285,
"eval_steps_per_second": 0.912,
"step": 80
},
{
"epoch": 0.79,
"eval_accuracy": 0.9183880700940003,
"eval_f1": 0.8993830090175606,
"eval_loss": 0.26329365372657776,
"eval_precision": 0.8318700614574188,
"eval_recall": 0.9788223140495868,
"eval_runtime": 3.262,
"eval_samples_per_second": 28.51,
"eval_steps_per_second": 0.92,
"step": 100
},
{
"epoch": 0.94,
"eval_accuracy": 0.9218695601717535,
"eval_f1": 0.908175497482618,
"eval_loss": 0.27159208059310913,
"eval_precision": 0.847427293064877,
"eval_recall": 0.9783057851239669,
"eval_runtime": 2.2237,
"eval_samples_per_second": 41.822,
"eval_steps_per_second": 1.349,
"step": 120
},
{
"epoch": 1.1,
"eval_accuracy": 0.931965881397238,
"eval_f1": 0.8820210939416238,
"eval_loss": 0.20828573405742645,
"eval_precision": 0.8397944885567492,
"eval_recall": 0.9287190082644629,
"eval_runtime": 2.2685,
"eval_samples_per_second": 40.996,
"eval_steps_per_second": 1.322,
"step": 140
},
{
"epoch": 1.26,
"eval_accuracy": 0.893669490541952,
"eval_f1": 0.8734673859735164,
"eval_loss": 0.33937641978263855,
"eval_precision": 0.8314659197012139,
"eval_recall": 0.9199380165289256,
"eval_runtime": 3.2652,
"eval_samples_per_second": 28.482,
"eval_steps_per_second": 0.919,
"step": 160
},
{
"epoch": 1.42,
"eval_accuracy": 0.883079958222119,
"eval_f1": 0.8970068347867075,
"eval_loss": 0.35709869861602783,
"eval_precision": 0.8248807975726051,
"eval_recall": 0.9829545454545454,
"eval_runtime": 3.2871,
"eval_samples_per_second": 28.292,
"eval_steps_per_second": 0.913,
"step": 180
},
{
"epoch": 1.57,
"eval_accuracy": 0.9112800278519206,
"eval_f1": 0.8886283704572099,
"eval_loss": 0.2868669033050537,
"eval_precision": 0.8136539287247746,
"eval_recall": 0.9788223140495868,
"eval_runtime": 2.9919,
"eval_samples_per_second": 31.084,
"eval_steps_per_second": 1.003,
"step": 200
},
{
"epoch": 1.73,
"eval_accuracy": 0.9393350353951492,
"eval_f1": 0.9247259439707675,
"eval_loss": 0.201907679438591,
"eval_precision": 0.8750576302443522,
"eval_recall": 0.9803719008264463,
"eval_runtime": 2.2839,
"eval_samples_per_second": 40.72,
"eval_steps_per_second": 1.314,
"step": 220
},
{
"epoch": 1.89,
"eval_accuracy": 0.9525937101079262,
"eval_f1": 0.9215399610136452,
"eval_loss": 0.1594531089067459,
"eval_precision": 0.8722324723247232,
"eval_recall": 0.9767561983471075,
"eval_runtime": 2.9584,
"eval_samples_per_second": 31.436,
"eval_steps_per_second": 1.014,
"step": 240
},
{
"epoch": 2.05,
"eval_accuracy": 0.9378263896947894,
"eval_f1": 0.9166058837831268,
"eval_loss": 0.22776451706886292,
"eval_precision": 0.8658704639412035,
"eval_recall": 0.9736570247933884,
"eval_runtime": 3.2621,
"eval_samples_per_second": 28.509,
"eval_steps_per_second": 0.92,
"step": 260
},
{
"epoch": 2.2,
"eval_accuracy": 0.9292677265869792,
"eval_f1": 0.8771048002010556,
"eval_loss": 0.23985013365745544,
"eval_precision": 0.8541360744003916,
"eval_recall": 0.9013429752066116,
"eval_runtime": 2.2706,
"eval_samples_per_second": 40.959,
"eval_steps_per_second": 1.321,
"step": 280
},
{
"epoch": 2.36,
"eval_accuracy": 0.9322850179876987,
"eval_f1": 0.9097725568607848,
"eval_loss": 0.2839757800102234,
"eval_precision": 0.8813559322033898,
"eval_recall": 0.9400826446280992,
"eval_runtime": 3.2602,
"eval_samples_per_second": 28.525,
"eval_steps_per_second": 0.92,
"step": 300
},
{
"epoch": 2.52,
"eval_accuracy": 0.9572356968782639,
"eval_f1": 0.9368919930157147,
"eval_loss": 0.15871362388134003,
"eval_precision": 0.9059334298118669,
"eval_recall": 0.9700413223140496,
"eval_runtime": 2.2505,
"eval_samples_per_second": 41.325,
"eval_steps_per_second": 1.333,
"step": 320
},
{
"epoch": 2.68,
"eval_accuracy": 0.9558431008471626,
"eval_f1": 0.9427135678391959,
"eval_loss": 0.16202741861343384,
"eval_precision": 0.9178082191780822,
"eval_recall": 0.96900826446281,
"eval_runtime": 3.2378,
"eval_samples_per_second": 28.723,
"eval_steps_per_second": 0.927,
"step": 340
},
{
"epoch": 2.83,
"eval_accuracy": 0.9299059997679007,
"eval_f1": 0.9343610144206862,
"eval_loss": 0.27064642310142517,
"eval_precision": 0.9007670182166826,
"eval_recall": 0.9705578512396694,
"eval_runtime": 3.2832,
"eval_samples_per_second": 28.326,
"eval_steps_per_second": 0.914,
"step": 360
},
{
"epoch": 2.99,
"eval_accuracy": 0.9477486364163862,
"eval_f1": 0.9423980222496909,
"eval_loss": 0.18907134234905243,
"eval_precision": 0.9037458511142722,
"eval_recall": 0.984504132231405,
"eval_runtime": 3.2921,
"eval_samples_per_second": 28.25,
"eval_steps_per_second": 0.911,
"step": 380
},
{
"epoch": 3.15,
"eval_accuracy": 0.9234072182894278,
"eval_f1": 0.9175810155651952,
"eval_loss": 0.26186808943748474,
"eval_precision": 0.9067070095814422,
"eval_recall": 0.9287190082644629,
"eval_runtime": 3.296,
"eval_samples_per_second": 28.216,
"eval_steps_per_second": 0.91,
"step": 400
},
{
"epoch": 3.31,
"eval_accuracy": 0.9601949634443542,
"eval_f1": 0.9384654342871613,
"eval_loss": 0.1693572849035263,
"eval_precision": 0.9205166418281172,
"eval_recall": 0.9571280991735537,
"eval_runtime": 2.2486,
"eval_samples_per_second": 41.36,
"eval_steps_per_second": 1.334,
"step": 420
},
{
"epoch": 3.46,
"eval_accuracy": 0.9532900081234769,
"eval_f1": 0.9351432880844646,
"eval_loss": 0.20067894458770752,
"eval_precision": 0.910871694417238,
"eval_recall": 0.9607438016528925,
"eval_runtime": 3.2966,
"eval_samples_per_second": 28.211,
"eval_steps_per_second": 0.91,
"step": 440
},
{
"epoch": 3.62,
"eval_accuracy": 0.9529998839503308,
"eval_f1": 0.9408805031446541,
"eval_loss": 0.2007509469985962,
"eval_precision": 0.9171162334477685,
"eval_recall": 0.9659090909090909,
"eval_runtime": 2.9788,
"eval_samples_per_second": 31.22,
"eval_steps_per_second": 1.007,
"step": 460
},
{
"epoch": 3.78,
"eval_accuracy": 0.9438609724962284,
"eval_f1": 0.9448345035105317,
"eval_loss": 0.2780458927154541,
"eval_precision": 0.9181286549707602,
"eval_recall": 0.9731404958677686,
"eval_runtime": 2.2763,
"eval_samples_per_second": 40.855,
"eval_steps_per_second": 1.318,
"step": 480
},
{
"epoch": 3.94,
"learning_rate": 3.5e-05,
"loss": 0.2747,
"step": 500
},
{
"epoch": 3.94,
"eval_accuracy": 0.9434838110711384,
"eval_f1": 0.9407256004087889,
"eval_loss": 0.22288289666175842,
"eval_precision": 0.9307381193124368,
"eval_recall": 0.9509297520661157,
"eval_runtime": 2.2152,
"eval_samples_per_second": 41.983,
"eval_steps_per_second": 1.354,
"step": 500
},
{
"epoch": 4.09,
"eval_accuracy": 0.9413659046071718,
"eval_f1": 0.9442211055276382,
"eval_loss": 0.2373497188091278,
"eval_precision": 0.9192759295499021,
"eval_recall": 0.9705578512396694,
"eval_runtime": 2.286,
"eval_samples_per_second": 40.682,
"eval_steps_per_second": 1.312,
"step": 520
},
{
"epoch": 4.25,
"eval_accuracy": 0.9290066148311478,
"eval_f1": 0.9232756393696718,
"eval_loss": 0.32156404852867126,
"eval_precision": 0.9235142118863049,
"eval_recall": 0.9230371900826446,
"eval_runtime": 3.2781,
"eval_samples_per_second": 28.371,
"eval_steps_per_second": 0.915,
"step": 540
},
{
"epoch": 4.41,
"eval_accuracy": 0.9621387954044331,
"eval_f1": 0.9501378100726634,
"eval_loss": 0.1727248579263687,
"eval_precision": 0.9226277372262773,
"eval_recall": 0.9793388429752066,
"eval_runtime": 3.2891,
"eval_samples_per_second": 28.275,
"eval_steps_per_second": 0.912,
"step": 560
},
{
"epoch": 4.57,
"eval_accuracy": 0.9612974353023094,
"eval_f1": 0.9563451776649746,
"eval_loss": 0.2031358927488327,
"eval_precision": 0.9401197604790419,
"eval_recall": 0.9731404958677686,
"eval_runtime": 2.9761,
"eval_samples_per_second": 31.249,
"eval_steps_per_second": 1.008,
"step": 580
},
{
"epoch": 4.72,
"eval_accuracy": 0.9507079029824765,
"eval_f1": 0.9494897959183674,
"eval_loss": 0.24843396246433258,
"eval_precision": 0.9380040322580645,
"eval_recall": 0.9612603305785123,
"eval_runtime": 2.242,
"eval_samples_per_second": 41.481,
"eval_steps_per_second": 1.338,
"step": 600
},
{
"epoch": 4.88,
"eval_accuracy": 0.9590054543344552,
"eval_f1": 0.9607390300230947,
"eval_loss": 0.2189687043428421,
"eval_precision": 0.9546149923508415,
"eval_recall": 0.9669421487603306,
"eval_runtime": 3.2795,
"eval_samples_per_second": 28.358,
"eval_steps_per_second": 0.915,
"step": 620
},
{
"epoch": 5.04,
"eval_accuracy": 0.9571486596263201,
"eval_f1": 0.9600409836065573,
"eval_loss": 0.25752872228622437,
"eval_precision": 0.9522357723577236,
"eval_recall": 0.9679752066115702,
"eval_runtime": 2.2527,
"eval_samples_per_second": 41.284,
"eval_steps_per_second": 1.332,
"step": 640
},
{
"epoch": 5.2,
"eval_accuracy": 0.9608622490425902,
"eval_f1": 0.9593869731800767,
"eval_loss": 0.24718773365020752,
"eval_precision": 0.9489641232945932,
"eval_recall": 0.9700413223140496,
"eval_runtime": 2.2796,
"eval_samples_per_second": 40.796,
"eval_steps_per_second": 1.316,
"step": 660
},
{
"epoch": 5.35,
"eval_accuracy": 0.9522165486828362,
"eval_f1": 0.9561671763506625,
"eval_loss": 0.2798936367034912,
"eval_precision": 0.9436619718309859,
"eval_recall": 0.96900826446281,
"eval_runtime": 3.2922,
"eval_samples_per_second": 28.249,
"eval_steps_per_second": 0.911,
"step": 680
},
{
"epoch": 5.51,
"eval_accuracy": 0.9556400139259603,
"eval_f1": 0.9535588086824837,
"eval_loss": 0.26087334752082825,
"eval_precision": 0.9323790720631787,
"eval_recall": 0.9757231404958677,
"eval_runtime": 2.2499,
"eval_samples_per_second": 41.335,
"eval_steps_per_second": 1.333,
"step": 700
},
{
"epoch": 5.67,
"eval_accuracy": 0.9529418591157015,
"eval_f1": 0.9502170028082715,
"eval_loss": 0.23053081333637238,
"eval_precision": 0.939424533064109,
"eval_recall": 0.9612603305785123,
"eval_runtime": 3.2663,
"eval_samples_per_second": 28.473,
"eval_steps_per_second": 0.918,
"step": 720
},
{
"epoch": 5.83,
"eval_accuracy": 0.9524486480213531,
"eval_f1": 0.954763709881223,
"eval_loss": 0.2539260983467102,
"eval_precision": 0.9346857991093518,
"eval_recall": 0.9757231404958677,
"eval_runtime": 3.298,
"eval_samples_per_second": 28.199,
"eval_steps_per_second": 0.91,
"step": 740
},
{
"epoch": 5.98,
"eval_accuracy": 0.9543634675641175,
"eval_f1": 0.9617654606107262,
"eval_loss": 0.28202250599861145,
"eval_precision": 0.9556348801631821,
"eval_recall": 0.9679752066115702,
"eval_runtime": 3.2935,
"eval_samples_per_second": 28.237,
"eval_steps_per_second": 0.911,
"step": 760
},
{
"epoch": 6.14,
"eval_accuracy": 0.9599048392712081,
"eval_f1": 0.9617065021845285,
"eval_loss": 0.23321200907230377,
"eval_precision": 0.9570332480818414,
"eval_recall": 0.9664256198347108,
"eval_runtime": 3.2967,
"eval_samples_per_second": 28.21,
"eval_steps_per_second": 0.91,
"step": 780
},
{
"epoch": 6.3,
"eval_accuracy": 0.9590054543344552,
"eval_f1": 0.961734693877551,
"eval_loss": 0.25181254744529724,
"eval_precision": 0.9501008064516129,
"eval_recall": 0.9736570247933884,
"eval_runtime": 2.9863,
"eval_samples_per_second": 31.142,
"eval_steps_per_second": 1.005,
"step": 800
},
{
"epoch": 6.46,
"eval_accuracy": 0.95752582105141,
"eval_f1": 0.9602258147292788,
"eval_loss": 0.2890544533729553,
"eval_precision": 0.954105048444671,
"eval_recall": 0.9664256198347108,
"eval_runtime": 2.2411,
"eval_samples_per_second": 41.497,
"eval_steps_per_second": 1.339,
"step": 820
},
{
"epoch": 6.61,
"eval_accuracy": 0.9568875478704886,
"eval_f1": 0.9569451563300871,
"eval_loss": 0.29066193103790283,
"eval_precision": 0.9496439471007121,
"eval_recall": 0.9643595041322314,
"eval_runtime": 2.2281,
"eval_samples_per_second": 41.74,
"eval_steps_per_second": 1.346,
"step": 840
},
{
"epoch": 6.77,
"eval_accuracy": 0.9598178020192643,
"eval_f1": 0.9613118114271074,
"eval_loss": 0.26129651069641113,
"eval_precision": 0.9537366548042705,
"eval_recall": 0.96900826446281,
"eval_runtime": 2.2516,
"eval_samples_per_second": 41.305,
"eval_steps_per_second": 1.332,
"step": 860
},
{
"epoch": 6.93,
"eval_accuracy": 0.9592085412556575,
"eval_f1": 0.96229802513465,
"eval_loss": 0.25751829147338867,
"eval_precision": 0.9556800815078961,
"eval_recall": 0.96900826446281,
"eval_runtime": 2.2645,
"eval_samples_per_second": 41.068,
"eval_steps_per_second": 1.325,
"step": 880
},
{
"epoch": 7.09,
"eval_accuracy": 0.9583381687362191,
"eval_f1": 0.9625832906201948,
"eval_loss": 0.26336678862571716,
"eval_precision": 0.9552390640895219,
"eval_recall": 0.9700413223140496,
"eval_runtime": 2.2487,
"eval_samples_per_second": 41.357,
"eval_steps_per_second": 1.334,
"step": 900
},
{
"epoch": 7.24,
"eval_accuracy": 0.9581640942323314,
"eval_f1": 0.9588550983899822,
"eval_loss": 0.2639918923377991,
"eval_precision": 0.9489124936772888,
"eval_recall": 0.96900826446281,
"eval_runtime": 2.996,
"eval_samples_per_second": 31.041,
"eval_steps_per_second": 1.001,
"step": 920
},
{
"epoch": 7.4,
"eval_accuracy": 0.9608622490425902,
"eval_f1": 0.9594284256187804,
"eval_loss": 0.2650795876979828,
"eval_precision": 0.9480584972264247,
"eval_recall": 0.9710743801652892,
"eval_runtime": 3.2719,
"eval_samples_per_second": 28.424,
"eval_steps_per_second": 0.917,
"step": 940
},
{
"epoch": 7.56,
"eval_accuracy": 0.9626900313334107,
"eval_f1": 0.9609992352791231,
"eval_loss": 0.26358404755592346,
"eval_precision": 0.9486663311524912,
"eval_recall": 0.9736570247933884,
"eval_runtime": 3.271,
"eval_samples_per_second": 28.432,
"eval_steps_per_second": 0.917,
"step": 960
},
{
"epoch": 7.72,
"eval_accuracy": 0.9627190437507253,
"eval_f1": 0.9622256253190403,
"eval_loss": 0.2597278356552124,
"eval_precision": 0.9510595358224017,
"eval_recall": 0.9736570247933884,
"eval_runtime": 2.9416,
"eval_samples_per_second": 31.616,
"eval_steps_per_second": 1.02,
"step": 980
},
{
"epoch": 7.87,
"learning_rate": 0.0,
"loss": 0.0555,
"step": 1000
},
{
"epoch": 7.87,
"eval_accuracy": 0.9627190437507253,
"eval_f1": 0.961489415965315,
"eval_loss": 0.25795629620552063,
"eval_precision": 0.9496221662468514,
"eval_recall": 0.9736570247933884,
"eval_runtime": 3.3,
"eval_samples_per_second": 28.182,
"eval_steps_per_second": 0.909,
"step": 1000
},
{
"epoch": 7.87,
"step": 1000,
"total_flos": 2101461798354944.0,
"train_loss": 0.16514424514770507,
"train_runtime": 1048.0167,
"train_samples_per_second": 7.633,
"train_steps_per_second": 0.954
}
],
"max_steps": 1000,
"num_train_epochs": 8,
"total_flos": 2101461798354944.0,
"trial_name": null,
"trial_params": null
}