m0_flat_ner_ocr_ptrn_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
20c292d
{
"best_metric": 0.9717367050948308,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_0/tmp/42-flat-ner-pero-ocr-pretrained_camembert_ner/checkpoint-1400",
"epoch": 3.674540682414698,
"global_step": 1400,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.9256820319849483,
"number": 519,
"precision": 0.9044117647058824,
"recall": 0.9479768786127167
},
"eval_CARDINAL": {
"f1": 0.9780701754385964,
"number": 678,
"precision": 0.9695652173913043,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9407166123778501,
"number": 761,
"precision": 0.9328165374677002,
"recall": 0.9487516425755584
},
"eval_PER": {
"f1": 0.9334308705193856,
"number": 679,
"precision": 0.9273255813953488,
"recall": 0.9396170839469808
},
"eval_TITRE": {
"f1": 0.44776119402985076,
"number": 41,
"precision": 0.5769230769230769,
"recall": 0.36585365853658536
},
"eval_accuracy": 0.9630473297899266,
"eval_f1": 0.9380432772332162,
"eval_loss": 0.22555255889892578,
"eval_precision": 0.9316678912564291,
"eval_recall": 0.9445065176908752,
"eval_runtime": 2.7451,
"eval_samples_per_second": 246.258,
"eval_steps_per_second": 15.664,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.9429657794676807,
"number": 519,
"precision": 0.9305816135084428,
"recall": 0.9556840077071291
},
"eval_CARDINAL": {
"f1": 0.9809104258443465,
"number": 678,
"precision": 0.9766081871345029,
"recall": 0.9852507374631269
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.938961038961039,
"number": 761,
"precision": 0.9281129653401797,
"recall": 0.9500657030223391
},
"eval_PER": {
"f1": 0.9655172413793105,
"number": 679,
"precision": 0.9619883040935673,
"recall": 0.9690721649484536
},
"eval_TITRE": {
"f1": 0.575,
"number": 41,
"precision": 0.5897435897435898,
"recall": 0.5609756097560976
},
"eval_accuracy": 0.9681093394077449,
"eval_f1": 0.9504071058475203,
"eval_loss": 0.14738017320632935,
"eval_precision": 0.9444648767929386,
"eval_recall": 0.9564245810055866,
"eval_runtime": 2.0679,
"eval_samples_per_second": 326.898,
"eval_steps_per_second": 20.794,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9559386973180076,
"number": 519,
"precision": 0.9504761904761905,
"recall": 0.9614643545279383
},
"eval_CARDINAL": {
"f1": 0.9845474613686535,
"number": 678,
"precision": 0.9823788546255506,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.4615384615384615,
"number": 7,
"precision": 0.5,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9639344262295081,
"number": 761,
"precision": 0.9620418848167539,
"recall": 0.9658344283837057
},
"eval_PER": {
"f1": 0.9624724061810155,
"number": 679,
"precision": 0.961764705882353,
"recall": 0.9631811487481591
},
"eval_TITRE": {
"f1": 0.6933333333333332,
"number": 41,
"precision": 0.7647058823529411,
"recall": 0.6341463414634146
},
"eval_accuracy": 0.9758289040749177,
"eval_f1": 0.9622325581395349,
"eval_loss": 0.1064079999923706,
"eval_precision": 0.9613382899628253,
"eval_recall": 0.9631284916201117,
"eval_runtime": 2.071,
"eval_samples_per_second": 326.419,
"eval_steps_per_second": 20.763,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9364928909952606,
"number": 519,
"precision": 0.9216417910447762,
"recall": 0.9518304431599229
},
"eval_CARDINAL": {
"f1": 0.9845246868091377,
"number": 678,
"precision": 0.9837997054491899,
"recall": 0.9852507374631269
},
"eval_FT": {
"f1": 0.5454545454545454,
"number": 7,
"precision": 0.75,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9541884816753926,
"number": 761,
"precision": 0.9504563233376793,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9823529411764705,
"number": 679,
"precision": 0.9809104258443465,
"recall": 0.9837997054491899
},
"eval_TITRE": {
"f1": 0.7654320987654322,
"number": 41,
"precision": 0.775,
"recall": 0.7560975609756098
},
"eval_accuracy": 0.9712730954188813,
"eval_f1": 0.9617952522255193,
"eval_loss": 0.1030876561999321,
"eval_precision": 0.9578869597340229,
"eval_recall": 0.9657355679702049,
"eval_runtime": 2.0342,
"eval_samples_per_second": 332.316,
"eval_steps_per_second": 21.138,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.2317,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.9608404966571156,
"number": 519,
"precision": 0.9526515151515151,
"recall": 0.9691714836223507
},
"eval_CARDINAL": {
"f1": 0.9859985261606484,
"number": 678,
"precision": 0.9852724594992637,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.5454545454545454,
"number": 7,
"precision": 0.75,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9454545454545454,
"number": 761,
"precision": 0.9345314505776636,
"recall": 0.9566360052562418
},
"eval_PER": {
"f1": 0.9685442574981712,
"number": 679,
"precision": 0.9622093023255814,
"recall": 0.9749631811487481
},
"eval_TITRE": {
"f1": 0.6,
"number": 41,
"precision": 0.6153846153846154,
"recall": 0.5853658536585366
},
"eval_accuracy": 0.9719058466211086,
"eval_f1": 0.9585338763420954,
"eval_loss": 0.10161029547452927,
"eval_precision": 0.9528892160471107,
"eval_recall": 0.964245810055866,
"eval_runtime": 2.1114,
"eval_samples_per_second": 320.168,
"eval_steps_per_second": 20.366,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9579349904397705,
"number": 519,
"precision": 0.9506641366223909,
"recall": 0.9653179190751445
},
"eval_CARDINAL": {
"f1": 0.9845474613686535,
"number": 678,
"precision": 0.9823788546255506,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.36363636363636365,
"number": 7,
"precision": 0.5,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9625738673670386,
"number": 761,
"precision": 0.9619422572178478,
"recall": 0.9632063074901446
},
"eval_PER": {
"f1": 0.9742836149889786,
"number": 679,
"precision": 0.9721407624633431,
"recall": 0.9764359351988218
},
"eval_TITRE": {
"f1": 0.7317073170731707,
"number": 41,
"precision": 0.7317073170731707,
"recall": 0.7317073170731707
},
"eval_accuracy": 0.9779802581624905,
"eval_f1": 0.9654403567447045,
"eval_loss": 0.08714007586240768,
"eval_precision": 0.9632925472747497,
"eval_recall": 0.9675977653631285,
"eval_runtime": 4.5111,
"eval_samples_per_second": 149.853,
"eval_steps_per_second": 9.532,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9476688867745005,
"number": 519,
"precision": 0.9360902255639098,
"recall": 0.9595375722543352
},
"eval_CARDINAL": {
"f1": 0.9867452135493373,
"number": 678,
"precision": 0.9852941176470589,
"recall": 0.9882005899705014
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9587965990843689,
"number": 761,
"precision": 0.9544270833333334,
"recall": 0.9632063074901446
},
"eval_PER": {
"f1": 0.969208211143695,
"number": 679,
"precision": 0.964963503649635,
"recall": 0.9734904270986745
},
"eval_TITRE": {
"f1": 0.7804878048780488,
"number": 41,
"precision": 0.7804878048780488,
"recall": 0.7804878048780488
},
"eval_accuracy": 0.9765882055175905,
"eval_f1": 0.9625509825732296,
"eval_loss": 0.08122637122869492,
"eval_precision": 0.9582871908453304,
"eval_recall": 0.966852886405959,
"eval_runtime": 2.7384,
"eval_samples_per_second": 246.857,
"eval_steps_per_second": 15.702,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9514747859181732,
"number": 519,
"precision": 0.9398496240601504,
"recall": 0.9633911368015414
},
"eval_CARDINAL": {
"f1": 0.9874908020603386,
"number": 678,
"precision": 0.9853157121879589,
"recall": 0.9896755162241888
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9652914210870989,
"number": 761,
"precision": 0.9621409921671018,
"recall": 0.9684625492772667
},
"eval_PER": {
"f1": 0.9706314243759177,
"number": 679,
"precision": 0.9677891654465594,
"recall": 0.9734904270986745
},
"eval_TITRE": {
"f1": 0.8311688311688312,
"number": 41,
"precision": 0.8888888888888888,
"recall": 0.7804878048780488
},
"eval_accuracy": 0.9787395596051632,
"eval_f1": 0.9665800222799851,
"eval_loss": 0.07897698879241943,
"eval_precision": 0.9637171417993335,
"eval_recall": 0.9694599627560522,
"eval_runtime": 2.0295,
"eval_samples_per_second": 333.085,
"eval_steps_per_second": 21.187,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9570200573065903,
"number": 519,
"precision": 0.9488636363636364,
"recall": 0.9653179190751445
},
"eval_CARDINAL": {
"f1": 0.9859778597785978,
"number": 678,
"precision": 0.9867060561299852,
"recall": 0.9852507374631269
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.958688524590164,
"number": 761,
"precision": 0.9568062827225131,
"recall": 0.9605781865965834
},
"eval_PER": {
"f1": 0.9816041206769683,
"number": 679,
"precision": 0.9808823529411764,
"recall": 0.9823269513991163
},
"eval_TITRE": {
"f1": 0.8354430379746836,
"number": 41,
"precision": 0.868421052631579,
"recall": 0.8048780487804879
},
"eval_accuracy": 0.9784864591242723,
"eval_f1": 0.968186046511628,
"eval_loss": 0.08038043230772018,
"eval_precision": 0.9672862453531599,
"eval_recall": 0.9690875232774674,
"eval_runtime": 2.0985,
"eval_samples_per_second": 322.128,
"eval_steps_per_second": 20.49,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.0696,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.970334928229665,
"number": 519,
"precision": 0.9638783269961977,
"recall": 0.976878612716763
},
"eval_CARDINAL": {
"f1": 0.9845474613686535,
"number": 678,
"precision": 0.9823788546255506,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.36363636363636365,
"number": 7,
"precision": 0.5,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.962671905697446,
"number": 761,
"precision": 0.9595300261096605,
"recall": 0.9658344283837057
},
"eval_PER": {
"f1": 0.9808823529411764,
"number": 679,
"precision": 0.9794419970631424,
"recall": 0.9823269513991163
},
"eval_TITRE": {
"f1": 0.7594936708860759,
"number": 41,
"precision": 0.7894736842105263,
"recall": 0.7317073170731707
},
"eval_accuracy": 0.982536066818527,
"eval_f1": 0.9700799107972496,
"eval_loss": 0.07389234751462936,
"eval_precision": 0.9681008902077152,
"eval_recall": 0.9720670391061452,
"eval_runtime": 3.1328,
"eval_samples_per_second": 215.784,
"eval_steps_per_second": 13.726,
"step": 1000
},
{
"epoch": 2.89,
"eval_ACT": {
"f1": 0.9571020019065777,
"number": 519,
"precision": 0.9471698113207547,
"recall": 0.9672447013487476
},
"eval_CARDINAL": {
"f1": 0.9889462048636699,
"number": 678,
"precision": 0.9882179675994109,
"recall": 0.9896755162241888
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9625738673670386,
"number": 761,
"precision": 0.9619422572178478,
"recall": 0.9632063074901446
},
"eval_PER": {
"f1": 0.9823529411764705,
"number": 679,
"precision": 0.9809104258443465,
"recall": 0.9837997054491899
},
"eval_TITRE": {
"f1": 0.8433734939759037,
"number": 41,
"precision": 0.8333333333333334,
"recall": 0.8536585365853658
},
"eval_accuracy": 0.9808909136927361,
"eval_f1": 0.9699108469539376,
"eval_loss": 0.07423367351293564,
"eval_precision": 0.9673953316042979,
"eval_recall": 0.97243947858473,
"eval_runtime": 2.3205,
"eval_samples_per_second": 291.313,
"eval_steps_per_second": 18.53,
"step": 1100
},
{
"epoch": 3.15,
"eval_ACT": {
"f1": 0.9578544061302681,
"number": 519,
"precision": 0.9523809523809523,
"recall": 0.9633911368015414
},
"eval_CARDINAL": {
"f1": 0.9852724594992636,
"number": 678,
"precision": 0.9838235294117647,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.3333333333333333,
"number": 7,
"precision": 0.4,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9619921363040629,
"number": 761,
"precision": 0.9594771241830066,
"recall": 0.9645203679369251
},
"eval_PER": {
"f1": 0.9794117647058823,
"number": 679,
"precision": 0.9779735682819384,
"recall": 0.9808541973490427
},
"eval_TITRE": {
"f1": 0.8048780487804877,
"number": 41,
"precision": 0.8048780487804879,
"recall": 0.8048780487804879
},
"eval_accuracy": 0.9803847127309542,
"eval_f1": 0.967670011148272,
"eval_loss": 0.08098369836807251,
"eval_precision": 0.9655172413793104,
"eval_recall": 0.9698324022346368,
"eval_runtime": 2.0371,
"eval_samples_per_second": 331.847,
"eval_steps_per_second": 21.109,
"step": 1200
},
{
"epoch": 3.41,
"eval_ACT": {
"f1": 0.9578544061302681,
"number": 519,
"precision": 0.9523809523809523,
"recall": 0.9633911368015414
},
"eval_CARDINAL": {
"f1": 0.9830508474576272,
"number": 678,
"precision": 0.9823269513991163,
"recall": 0.9837758112094396
},
"eval_FT": {
"f1": 0.5,
"number": 7,
"precision": 0.4444444444444444,
"recall": 0.5714285714285714
},
"eval_LOC": {
"f1": 0.9607329842931938,
"number": 761,
"precision": 0.9569752281616688,
"recall": 0.9645203679369251
},
"eval_PER": {
"f1": 0.9786921381337251,
"number": 679,
"precision": 0.9765395894428153,
"recall": 0.9808541973490427
},
"eval_TITRE": {
"f1": 0.7317073170731707,
"number": 41,
"precision": 0.7317073170731707,
"recall": 0.7317073170731707
},
"eval_accuracy": 0.9816502151354087,
"eval_f1": 0.965478841870824,
"eval_loss": 0.06854782998561859,
"eval_precision": 0.9622641509433962,
"eval_recall": 0.9687150837988827,
"eval_runtime": 2.0277,
"eval_samples_per_second": 333.39,
"eval_steps_per_second": 21.207,
"step": 1300
},
{
"epoch": 3.67,
"eval_ACT": {
"f1": 0.9655172413793104,
"number": 519,
"precision": 0.96,
"recall": 0.9710982658959537
},
"eval_CARDINAL": {
"f1": 0.9845474613686535,
"number": 678,
"precision": 0.9823788546255506,
"recall": 0.9867256637168141
},
"eval_FT": {
"f1": 0.5454545454545454,
"number": 7,
"precision": 0.75,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9665573770491803,
"number": 761,
"precision": 0.9646596858638743,
"recall": 0.9684625492772667
},
"eval_PER": {
"f1": 0.9808541973490427,
"number": 679,
"precision": 0.9808541973490427,
"recall": 0.9808541973490427
},
"eval_TITRE": {
"f1": 0.8395061728395061,
"number": 41,
"precision": 0.85,
"recall": 0.8292682926829268
},
"eval_accuracy": 0.9832953682611997,
"eval_f1": 0.9717367050948308,
"eval_loss": 0.06763775646686554,
"eval_precision": 0.9702933531377645,
"eval_recall": 0.9731843575418995,
"eval_runtime": 2.0487,
"eval_samples_per_second": 329.96,
"eval_steps_per_second": 20.989,
"step": 1400
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 566245460738232.0,
"trial_name": null,
"trial_params": null
}