{ "best_metric": 0.9717367050948308, "best_model_checkpoint": "/work/stual/res_ICDAR/method_0/tmp/42-flat-ner-pero-ocr-pretrained_camembert_ner/checkpoint-1400", "epoch": 3.674540682414698, "global_step": 1400, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.26, "eval_ACT": { "f1": 0.9256820319849483, "number": 519, "precision": 0.9044117647058824, "recall": 0.9479768786127167 }, "eval_CARDINAL": { "f1": 0.9780701754385964, "number": 678, "precision": 0.9695652173913043, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.9407166123778501, "number": 761, "precision": 0.9328165374677002, "recall": 0.9487516425755584 }, "eval_PER": { "f1": 0.9334308705193856, "number": 679, "precision": 0.9273255813953488, "recall": 0.9396170839469808 }, "eval_TITRE": { "f1": 0.44776119402985076, "number": 41, "precision": 0.5769230769230769, "recall": 0.36585365853658536 }, "eval_accuracy": 0.9630473297899266, "eval_f1": 0.9380432772332162, "eval_loss": 0.22555255889892578, "eval_precision": 0.9316678912564291, "eval_recall": 0.9445065176908752, "eval_runtime": 2.7451, "eval_samples_per_second": 246.258, "eval_steps_per_second": 15.664, "step": 100 }, { "epoch": 0.52, "eval_ACT": { "f1": 0.9429657794676807, "number": 519, "precision": 0.9305816135084428, "recall": 0.9556840077071291 }, "eval_CARDINAL": { "f1": 0.9809104258443465, "number": 678, "precision": 0.9766081871345029, "recall": 0.9852507374631269 }, "eval_FT": { "f1": 0.0, "number": 7, "precision": 0.0, "recall": 0.0 }, "eval_LOC": { "f1": 0.938961038961039, "number": 761, "precision": 0.9281129653401797, "recall": 0.9500657030223391 }, "eval_PER": { "f1": 0.9655172413793105, "number": 679, "precision": 0.9619883040935673, "recall": 0.9690721649484536 }, "eval_TITRE": { "f1": 0.575, "number": 41, "precision": 0.5897435897435898, "recall": 0.5609756097560976 }, "eval_accuracy": 0.9681093394077449, "eval_f1": 0.9504071058475203, "eval_loss": 0.14738017320632935, "eval_precision": 0.9444648767929386, "eval_recall": 0.9564245810055866, "eval_runtime": 2.0679, "eval_samples_per_second": 326.898, "eval_steps_per_second": 20.794, "step": 200 }, { "epoch": 0.79, "eval_ACT": { "f1": 0.9559386973180076, "number": 519, "precision": 0.9504761904761905, "recall": 0.9614643545279383 }, "eval_CARDINAL": { "f1": 0.9845474613686535, "number": 678, "precision": 0.9823788546255506, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.4615384615384615, "number": 7, "precision": 0.5, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9639344262295081, "number": 761, "precision": 0.9620418848167539, "recall": 0.9658344283837057 }, "eval_PER": { "f1": 0.9624724061810155, "number": 679, "precision": 0.961764705882353, "recall": 0.9631811487481591 }, "eval_TITRE": { "f1": 0.6933333333333332, "number": 41, "precision": 0.7647058823529411, "recall": 0.6341463414634146 }, "eval_accuracy": 0.9758289040749177, "eval_f1": 0.9622325581395349, "eval_loss": 0.1064079999923706, "eval_precision": 0.9613382899628253, "eval_recall": 0.9631284916201117, "eval_runtime": 2.071, "eval_samples_per_second": 326.419, "eval_steps_per_second": 20.763, "step": 300 }, { "epoch": 1.05, "eval_ACT": { "f1": 0.9364928909952606, "number": 519, "precision": 0.9216417910447762, "recall": 0.9518304431599229 }, "eval_CARDINAL": { "f1": 0.9845246868091377, "number": 678, "precision": 0.9837997054491899, "recall": 0.9852507374631269 }, "eval_FT": { "f1": 0.5454545454545454, "number": 7, "precision": 0.75, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9541884816753926, "number": 761, "precision": 0.9504563233376793, "recall": 0.9579500657030223 }, "eval_PER": { "f1": 0.9823529411764705, "number": 679, "precision": 0.9809104258443465, "recall": 0.9837997054491899 }, "eval_TITRE": { "f1": 0.7654320987654322, "number": 41, "precision": 0.775, "recall": 0.7560975609756098 }, "eval_accuracy": 0.9712730954188813, "eval_f1": 0.9617952522255193, "eval_loss": 0.1030876561999321, "eval_precision": 0.9578869597340229, "eval_recall": 0.9657355679702049, "eval_runtime": 2.0342, "eval_samples_per_second": 332.316, "eval_steps_per_second": 21.138, "step": 400 }, { "epoch": 1.31, "learning_rate": 9e-05, "loss": 0.2317, "step": 500 }, { "epoch": 1.31, "eval_ACT": { "f1": 0.9608404966571156, "number": 519, "precision": 0.9526515151515151, "recall": 0.9691714836223507 }, "eval_CARDINAL": { "f1": 0.9859985261606484, "number": 678, "precision": 0.9852724594992637, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.5454545454545454, "number": 7, "precision": 0.75, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9454545454545454, "number": 761, "precision": 0.9345314505776636, "recall": 0.9566360052562418 }, "eval_PER": { "f1": 0.9685442574981712, "number": 679, "precision": 0.9622093023255814, "recall": 0.9749631811487481 }, "eval_TITRE": { "f1": 0.6, "number": 41, "precision": 0.6153846153846154, "recall": 0.5853658536585366 }, "eval_accuracy": 0.9719058466211086, "eval_f1": 0.9585338763420954, "eval_loss": 0.10161029547452927, "eval_precision": 0.9528892160471107, "eval_recall": 0.964245810055866, "eval_runtime": 2.1114, "eval_samples_per_second": 320.168, "eval_steps_per_second": 20.366, "step": 500 }, { "epoch": 1.57, "eval_ACT": { "f1": 0.9579349904397705, "number": 519, "precision": 0.9506641366223909, "recall": 0.9653179190751445 }, "eval_CARDINAL": { "f1": 0.9845474613686535, "number": 678, "precision": 0.9823788546255506, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.36363636363636365, "number": 7, "precision": 0.5, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9625738673670386, "number": 761, "precision": 0.9619422572178478, "recall": 0.9632063074901446 }, "eval_PER": { "f1": 0.9742836149889786, "number": 679, "precision": 0.9721407624633431, "recall": 0.9764359351988218 }, "eval_TITRE": { "f1": 0.7317073170731707, "number": 41, "precision": 0.7317073170731707, "recall": 0.7317073170731707 }, "eval_accuracy": 0.9779802581624905, "eval_f1": 0.9654403567447045, "eval_loss": 0.08714007586240768, "eval_precision": 0.9632925472747497, "eval_recall": 0.9675977653631285, "eval_runtime": 4.5111, "eval_samples_per_second": 149.853, "eval_steps_per_second": 9.532, "step": 600 }, { "epoch": 1.84, "eval_ACT": { "f1": 0.9476688867745005, "number": 519, "precision": 0.9360902255639098, "recall": 0.9595375722543352 }, "eval_CARDINAL": { "f1": 0.9867452135493373, "number": 678, "precision": 0.9852941176470589, "recall": 0.9882005899705014 }, "eval_FT": { "f1": 0.4, "number": 7, "precision": 0.6666666666666666, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9587965990843689, "number": 761, "precision": 0.9544270833333334, "recall": 0.9632063074901446 }, "eval_PER": { "f1": 0.969208211143695, "number": 679, "precision": 0.964963503649635, "recall": 0.9734904270986745 }, "eval_TITRE": { "f1": 0.7804878048780488, "number": 41, "precision": 0.7804878048780488, "recall": 0.7804878048780488 }, "eval_accuracy": 0.9765882055175905, "eval_f1": 0.9625509825732296, "eval_loss": 0.08122637122869492, "eval_precision": 0.9582871908453304, "eval_recall": 0.966852886405959, "eval_runtime": 2.7384, "eval_samples_per_second": 246.857, "eval_steps_per_second": 15.702, "step": 700 }, { "epoch": 2.1, "eval_ACT": { "f1": 0.9514747859181732, "number": 519, "precision": 0.9398496240601504, "recall": 0.9633911368015414 }, "eval_CARDINAL": { "f1": 0.9874908020603386, "number": 678, "precision": 0.9853157121879589, "recall": 0.9896755162241888 }, "eval_FT": { "f1": 0.4, "number": 7, "precision": 0.6666666666666666, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9652914210870989, "number": 761, "precision": 0.9621409921671018, "recall": 0.9684625492772667 }, "eval_PER": { "f1": 0.9706314243759177, "number": 679, "precision": 0.9677891654465594, "recall": 0.9734904270986745 }, "eval_TITRE": { "f1": 0.8311688311688312, "number": 41, "precision": 0.8888888888888888, "recall": 0.7804878048780488 }, "eval_accuracy": 0.9787395596051632, "eval_f1": 0.9665800222799851, "eval_loss": 0.07897698879241943, "eval_precision": 0.9637171417993335, "eval_recall": 0.9694599627560522, "eval_runtime": 2.0295, "eval_samples_per_second": 333.085, "eval_steps_per_second": 21.187, "step": 800 }, { "epoch": 2.36, "eval_ACT": { "f1": 0.9570200573065903, "number": 519, "precision": 0.9488636363636364, "recall": 0.9653179190751445 }, "eval_CARDINAL": { "f1": 0.9859778597785978, "number": 678, "precision": 0.9867060561299852, "recall": 0.9852507374631269 }, "eval_FT": { "f1": 0.4, "number": 7, "precision": 0.6666666666666666, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.958688524590164, "number": 761, "precision": 0.9568062827225131, "recall": 0.9605781865965834 }, "eval_PER": { "f1": 0.9816041206769683, "number": 679, "precision": 0.9808823529411764, "recall": 0.9823269513991163 }, "eval_TITRE": { "f1": 0.8354430379746836, "number": 41, "precision": 0.868421052631579, "recall": 0.8048780487804879 }, "eval_accuracy": 0.9784864591242723, "eval_f1": 0.968186046511628, "eval_loss": 0.08038043230772018, "eval_precision": 0.9672862453531599, "eval_recall": 0.9690875232774674, "eval_runtime": 2.0985, "eval_samples_per_second": 322.128, "eval_steps_per_second": 20.49, "step": 900 }, { "epoch": 2.62, "learning_rate": 8e-05, "loss": 0.0696, "step": 1000 }, { "epoch": 2.62, "eval_ACT": { "f1": 0.970334928229665, "number": 519, "precision": 0.9638783269961977, "recall": 0.976878612716763 }, "eval_CARDINAL": { "f1": 0.9845474613686535, "number": 678, "precision": 0.9823788546255506, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.36363636363636365, "number": 7, "precision": 0.5, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.962671905697446, "number": 761, "precision": 0.9595300261096605, "recall": 0.9658344283837057 }, "eval_PER": { "f1": 0.9808823529411764, "number": 679, "precision": 0.9794419970631424, "recall": 0.9823269513991163 }, "eval_TITRE": { "f1": 0.7594936708860759, "number": 41, "precision": 0.7894736842105263, "recall": 0.7317073170731707 }, "eval_accuracy": 0.982536066818527, "eval_f1": 0.9700799107972496, "eval_loss": 0.07389234751462936, "eval_precision": 0.9681008902077152, "eval_recall": 0.9720670391061452, "eval_runtime": 3.1328, "eval_samples_per_second": 215.784, "eval_steps_per_second": 13.726, "step": 1000 }, { "epoch": 2.89, "eval_ACT": { "f1": 0.9571020019065777, "number": 519, "precision": 0.9471698113207547, "recall": 0.9672447013487476 }, "eval_CARDINAL": { "f1": 0.9889462048636699, "number": 678, "precision": 0.9882179675994109, "recall": 0.9896755162241888 }, "eval_FT": { "f1": 0.3333333333333333, "number": 7, "precision": 0.4, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9625738673670386, "number": 761, "precision": 0.9619422572178478, "recall": 0.9632063074901446 }, "eval_PER": { "f1": 0.9823529411764705, "number": 679, "precision": 0.9809104258443465, "recall": 0.9837997054491899 }, "eval_TITRE": { "f1": 0.8433734939759037, "number": 41, "precision": 0.8333333333333334, "recall": 0.8536585365853658 }, "eval_accuracy": 0.9808909136927361, "eval_f1": 0.9699108469539376, "eval_loss": 0.07423367351293564, "eval_precision": 0.9673953316042979, "eval_recall": 0.97243947858473, "eval_runtime": 2.3205, "eval_samples_per_second": 291.313, "eval_steps_per_second": 18.53, "step": 1100 }, { "epoch": 3.15, "eval_ACT": { "f1": 0.9578544061302681, "number": 519, "precision": 0.9523809523809523, "recall": 0.9633911368015414 }, "eval_CARDINAL": { "f1": 0.9852724594992636, "number": 678, "precision": 0.9838235294117647, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.3333333333333333, "number": 7, "precision": 0.4, "recall": 0.2857142857142857 }, "eval_LOC": { "f1": 0.9619921363040629, "number": 761, "precision": 0.9594771241830066, "recall": 0.9645203679369251 }, "eval_PER": { "f1": 0.9794117647058823, "number": 679, "precision": 0.9779735682819384, "recall": 0.9808541973490427 }, "eval_TITRE": { "f1": 0.8048780487804877, "number": 41, "precision": 0.8048780487804879, "recall": 0.8048780487804879 }, "eval_accuracy": 0.9803847127309542, "eval_f1": 0.967670011148272, "eval_loss": 0.08098369836807251, "eval_precision": 0.9655172413793104, "eval_recall": 0.9698324022346368, "eval_runtime": 2.0371, "eval_samples_per_second": 331.847, "eval_steps_per_second": 21.109, "step": 1200 }, { "epoch": 3.41, "eval_ACT": { "f1": 0.9578544061302681, "number": 519, "precision": 0.9523809523809523, "recall": 0.9633911368015414 }, "eval_CARDINAL": { "f1": 0.9830508474576272, "number": 678, "precision": 0.9823269513991163, "recall": 0.9837758112094396 }, "eval_FT": { "f1": 0.5, "number": 7, "precision": 0.4444444444444444, "recall": 0.5714285714285714 }, "eval_LOC": { "f1": 0.9607329842931938, "number": 761, "precision": 0.9569752281616688, "recall": 0.9645203679369251 }, "eval_PER": { "f1": 0.9786921381337251, "number": 679, "precision": 0.9765395894428153, "recall": 0.9808541973490427 }, "eval_TITRE": { "f1": 0.7317073170731707, "number": 41, "precision": 0.7317073170731707, "recall": 0.7317073170731707 }, "eval_accuracy": 0.9816502151354087, "eval_f1": 0.965478841870824, "eval_loss": 0.06854782998561859, "eval_precision": 0.9622641509433962, "eval_recall": 0.9687150837988827, "eval_runtime": 2.0277, "eval_samples_per_second": 333.39, "eval_steps_per_second": 21.207, "step": 1300 }, { "epoch": 3.67, "eval_ACT": { "f1": 0.9655172413793104, "number": 519, "precision": 0.96, "recall": 0.9710982658959537 }, "eval_CARDINAL": { "f1": 0.9845474613686535, "number": 678, "precision": 0.9823788546255506, "recall": 0.9867256637168141 }, "eval_FT": { "f1": 0.5454545454545454, "number": 7, "precision": 0.75, "recall": 0.42857142857142855 }, "eval_LOC": { "f1": 0.9665573770491803, "number": 761, "precision": 0.9646596858638743, "recall": 0.9684625492772667 }, "eval_PER": { "f1": 0.9808541973490427, "number": 679, "precision": 0.9808541973490427, "recall": 0.9808541973490427 }, "eval_TITRE": { "f1": 0.8395061728395061, "number": 41, "precision": 0.85, "recall": 0.8292682926829268 }, "eval_accuracy": 0.9832953682611997, "eval_f1": 0.9717367050948308, "eval_loss": 0.06763775646686554, "eval_precision": 0.9702933531377645, "eval_recall": 0.9731843575418995, "eval_runtime": 2.0487, "eval_samples_per_second": 329.96, "eval_steps_per_second": 20.989, "step": 1400 } ], "max_steps": 5000, "num_train_epochs": 14, "total_flos": 566245460738232.0, "trial_name": null, "trial_params": null }