m0_flat_ner_ref_ptrn_cmbert_io / trainer_state.json
nlpso's picture
Load model and tokenizer
481efee
{
"best_metric": 0.9786205614426474,
"best_model_checkpoint": "/work/stual/res_ICDAR/method_0/tmp/22-flat-ner-ref-pretrained_camembert_ner/checkpoint-1000",
"epoch": 2.6246719160104988,
"global_step": 1000,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.26,
"eval_ACT": {
"f1": 0.9162011173184358,
"number": 519,
"precision": 0.8864864864864865,
"recall": 0.9479768786127167
},
"eval_CARDINAL": {
"f1": 0.9919177075679647,
"number": 678,
"precision": 0.9882869692532943,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.944300518134715,
"number": 761,
"precision": 0.9310344827586207,
"recall": 0.9579500657030223
},
"eval_PER": {
"f1": 0.9288334556126192,
"number": 679,
"precision": 0.9254385964912281,
"recall": 0.9322533136966127
},
"eval_TITRE": {
"f1": 0.32000000000000006,
"number": 40,
"precision": 0.8,
"recall": 0.2
},
"eval_accuracy": 0.9653674280039722,
"eval_f1": 0.9398036673458048,
"eval_loss": 0.20965276658535004,
"eval_precision": 0.934438305709024,
"eval_recall": 0.9452309985096871,
"eval_runtime": 2.353,
"eval_samples_per_second": 287.287,
"eval_steps_per_second": 18.274,
"step": 100
},
{
"epoch": 0.52,
"eval_ACT": {
"f1": 0.9487666034155597,
"number": 519,
"precision": 0.9345794392523364,
"recall": 0.9633911368015414
},
"eval_CARDINAL": {
"f1": 0.9919177075679647,
"number": 678,
"precision": 0.9882869692532943,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9441558441558441,
"number": 761,
"precision": 0.9332477535301669,
"recall": 0.9553219448094612
},
"eval_PER": {
"f1": 0.9618768328445747,
"number": 679,
"precision": 0.9576642335766423,
"recall": 0.9661266568483063
},
"eval_TITRE": {
"f1": 0.525,
"number": 40,
"precision": 0.525,
"recall": 0.525
},
"eval_accuracy": 0.9766633565044687,
"eval_f1": 0.9541250462449131,
"eval_loss": 0.12336099147796631,
"eval_precision": 0.9474650991917708,
"eval_recall": 0.9608792846497765,
"eval_runtime": 2.3033,
"eval_samples_per_second": 293.494,
"eval_steps_per_second": 18.669,
"step": 200
},
{
"epoch": 0.79,
"eval_ACT": {
"f1": 0.9493791786055396,
"number": 519,
"precision": 0.9412878787878788,
"recall": 0.9576107899807321
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.5,
"number": 7,
"precision": 0.6,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.973718791064389,
"number": 761,
"precision": 0.973718791064389,
"recall": 0.973718791064389
},
"eval_PER": {
"f1": 0.9778761061946903,
"number": 679,
"precision": 0.9793205317577548,
"recall": 0.9764359351988218
},
"eval_TITRE": {
"f1": 0.7999999999999999,
"number": 40,
"precision": 0.8571428571428571,
"recall": 0.75
},
"eval_accuracy": 0.9800148957298908,
"eval_f1": 0.9715136846024949,
"eval_loss": 0.0935482531785965,
"eval_precision": 0.9709713435057685,
"eval_recall": 0.9720566318926974,
"eval_runtime": 2.0792,
"eval_samples_per_second": 325.122,
"eval_steps_per_second": 20.681,
"step": 300
},
{
"epoch": 1.05,
"eval_ACT": {
"f1": 0.9456625357483317,
"number": 519,
"precision": 0.9358490566037736,
"recall": 0.9556840077071291
},
"eval_CARDINAL": {
"f1": 0.9926470588235294,
"number": 678,
"precision": 0.9897360703812317,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.5454545454545454,
"number": 7,
"precision": 0.75,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9677843523997371,
"number": 761,
"precision": 0.968421052631579,
"recall": 0.9671484888304862
},
"eval_PER": {
"f1": 0.9882352941176471,
"number": 679,
"precision": 0.986784140969163,
"recall": 0.9896907216494846
},
"eval_TITRE": {
"f1": 0.8192771084337349,
"number": 40,
"precision": 0.7906976744186046,
"recall": 0.85
},
"eval_accuracy": 0.9784011916583912,
"eval_f1": 0.9717682020802376,
"eval_loss": 0.08334896713495255,
"eval_precision": 0.9688888888888889,
"eval_recall": 0.9746646795827124,
"eval_runtime": 2.0578,
"eval_samples_per_second": 328.512,
"eval_steps_per_second": 20.896,
"step": 400
},
{
"epoch": 1.31,
"learning_rate": 9e-05,
"loss": 0.2168,
"step": 500
},
{
"epoch": 1.31,
"eval_ACT": {
"f1": 0.954110898661568,
"number": 519,
"precision": 0.9468690702087287,
"recall": 0.9614643545279383
},
"eval_CARDINAL": {
"f1": 0.9889298892988929,
"number": 678,
"precision": 0.9896602658788775,
"recall": 0.9882005899705014
},
"eval_FT": {
"f1": 0.0,
"number": 7,
"precision": 0.0,
"recall": 0.0
},
"eval_LOC": {
"f1": 0.9556135770234986,
"number": 761,
"precision": 0.9494163424124513,
"recall": 0.961892247043364
},
"eval_PER": {
"f1": 0.9772893772893771,
"number": 679,
"precision": 0.9723032069970845,
"recall": 0.9823269513991163
},
"eval_TITRE": {
"f1": 0.85,
"number": 40,
"precision": 0.85,
"recall": 0.85
},
"eval_accuracy": 0.977656405163853,
"eval_f1": 0.9660293298682012,
"eval_loss": 0.08229256421327591,
"eval_precision": 0.9626341102478727,
"eval_recall": 0.9694485842026825,
"eval_runtime": 2.0948,
"eval_samples_per_second": 322.711,
"eval_steps_per_second": 20.527,
"step": 500
},
{
"epoch": 1.57,
"eval_ACT": {
"f1": 0.9524714828897339,
"number": 519,
"precision": 0.9399624765478424,
"recall": 0.9653179190751445
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.5454545454545454,
"number": 7,
"precision": 0.75,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.9652459016393442,
"number": 761,
"precision": 0.9633507853403142,
"recall": 0.9671484888304862
},
"eval_PER": {
"f1": 0.986764705882353,
"number": 679,
"precision": 0.9853157121879589,
"recall": 0.9882179675994109
},
"eval_TITRE": {
"f1": 0.8780487804878048,
"number": 40,
"precision": 0.8571428571428571,
"recall": 0.9
},
"eval_accuracy": 0.9829940417080437,
"eval_f1": 0.9730933382816849,
"eval_loss": 0.07296791672706604,
"eval_precision": 0.9693160813308688,
"eval_recall": 0.9769001490312966,
"eval_runtime": 2.0927,
"eval_samples_per_second": 323.022,
"eval_steps_per_second": 20.547,
"step": 600
},
{
"epoch": 1.84,
"eval_ACT": {
"f1": 0.9654510556621881,
"number": 519,
"precision": 0.9617590822179732,
"recall": 0.9691714836223507
},
"eval_CARDINAL": {
"f1": 0.9919058130978661,
"number": 678,
"precision": 0.9897209985315712,
"recall": 0.9941002949852508
},
"eval_FT": {
"f1": 0.5454545454545454,
"number": 7,
"precision": 0.75,
"recall": 0.42857142857142855
},
"eval_LOC": {
"f1": 0.968586387434555,
"number": 761,
"precision": 0.9647979139504563,
"recall": 0.9724047306176085
},
"eval_PER": {
"f1": 0.986019131714496,
"number": 679,
"precision": 0.9852941176470589,
"recall": 0.9867452135493373
},
"eval_TITRE": {
"f1": 0.9,
"number": 40,
"precision": 0.9,
"recall": 0.9
},
"eval_accuracy": 0.9829940417080437,
"eval_f1": 0.9763896635062279,
"eval_loss": 0.06497417390346527,
"eval_precision": 0.9743970315398887,
"eval_recall": 0.9783904619970194,
"eval_runtime": 2.0484,
"eval_samples_per_second": 330.007,
"eval_steps_per_second": 20.992,
"step": 700
},
{
"epoch": 2.1,
"eval_ACT": {
"f1": 0.9521988527724664,
"number": 519,
"precision": 0.9449715370018975,
"recall": 0.9595375722543352
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9653368214519294,
"number": 761,
"precision": 0.9609375,
"recall": 0.9697766097240473
},
"eval_PER": {
"f1": 0.9867452135493373,
"number": 679,
"precision": 0.9867452135493373,
"recall": 0.9867452135493373
},
"eval_TITRE": {
"f1": 0.925,
"number": 40,
"precision": 0.925,
"recall": 0.925
},
"eval_accuracy": 0.9829940417080437,
"eval_f1": 0.9736157562244518,
"eval_loss": 0.06101168692111969,
"eval_precision": 0.9710896960711638,
"eval_recall": 0.9761549925484352,
"eval_runtime": 2.0382,
"eval_samples_per_second": 331.668,
"eval_steps_per_second": 21.097,
"step": 800
},
{
"epoch": 2.36,
"eval_ACT": {
"f1": 0.9645254074784276,
"number": 519,
"precision": 0.9599236641221374,
"recall": 0.9691714836223507
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9652914210870989,
"number": 761,
"precision": 0.9621409921671018,
"recall": 0.9684625492772667
},
"eval_PER": {
"f1": 0.9852724594992637,
"number": 679,
"precision": 0.9852724594992637,
"recall": 0.9852724594992637
},
"eval_TITRE": {
"f1": 0.925,
"number": 40,
"precision": 0.925,
"recall": 0.925
},
"eval_accuracy": 0.9842353525322741,
"eval_f1": 0.9756369722893807,
"eval_loss": 0.06042904779314995,
"eval_precision": 0.974006683995544,
"eval_recall": 0.9772727272727273,
"eval_runtime": 2.0867,
"eval_samples_per_second": 323.95,
"eval_steps_per_second": 20.606,
"step": 900
},
{
"epoch": 2.62,
"learning_rate": 8e-05,
"loss": 0.0621,
"step": 1000
},
{
"epoch": 2.62,
"eval_ACT": {
"f1": 0.9647283126787417,
"number": 519,
"precision": 0.9547169811320755,
"recall": 0.9749518304431599
},
"eval_CARDINAL": {
"f1": 0.9933774834437086,
"number": 678,
"precision": 0.9911894273127754,
"recall": 0.995575221238938
},
"eval_FT": {
"f1": 0.4,
"number": 7,
"precision": 0.6666666666666666,
"recall": 0.2857142857142857
},
"eval_LOC": {
"f1": 0.9730794484569928,
"number": 761,
"precision": 0.9724409448818898,
"recall": 0.973718791064389
},
"eval_PER": {
"f1": 0.9882179675994109,
"number": 679,
"precision": 0.9882179675994109,
"recall": 0.9882179675994109
},
"eval_TITRE": {
"f1": 0.925,
"number": 40,
"precision": 0.925,
"recall": 0.925
},
"eval_accuracy": 0.9846077457795432,
"eval_f1": 0.9786205614426474,
"eval_loss": 0.06579616665840149,
"eval_precision": 0.9766233766233766,
"eval_recall": 0.9806259314456036,
"eval_runtime": 2.1397,
"eval_samples_per_second": 315.934,
"eval_steps_per_second": 20.096,
"step": 1000
}
],
"max_steps": 5000,
"num_train_epochs": 14,
"total_flos": 406892146317096.0,
"trial_name": null,
"trial_params": null
}