CardioNER.eu_EuroBERT / trainer_state.json
UMCU's picture
Upload 12 files
210060d verified
{
"best_global_step": 264710,
"best_metric": 0.870147919438821,
"best_model_checkpoint": "T:\\laupodteam\\AIOS\\Bram\\language_modeling\\Models\\language_models\\CardioCCC\\EuroBERT\\multilabel_3ldense_20epochs_40splits/fold_0\\checkpoint-264710",
"epoch": 10.0,
"eval_steps": 500,
"global_step": 264710,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.009670960673945073,
"grad_norm": 1.4626084566116333,
"learning_rate": 1.9980733633032377e-05,
"loss": 1.326,
"step": 256
},
{
"epoch": 0.019341921347890145,
"grad_norm": 2.9422495365142822,
"learning_rate": 1.9961391711684486e-05,
"loss": 0.9436,
"step": 512
},
{
"epoch": 0.029012882021835214,
"grad_norm": 3.939150333404541,
"learning_rate": 1.9942049790336598e-05,
"loss": 0.8108,
"step": 768
},
{
"epoch": 0.03868384269578029,
"grad_norm": 3.260474681854248,
"learning_rate": 1.9922707868988706e-05,
"loss": 0.746,
"step": 1024
},
{
"epoch": 0.04835480336972536,
"grad_norm": 2.8487510681152344,
"learning_rate": 1.9903365947640814e-05,
"loss": 0.6876,
"step": 1280
},
{
"epoch": 0.05802576404367043,
"grad_norm": 3.7067031860351562,
"learning_rate": 1.9884024026292926e-05,
"loss": 0.6491,
"step": 1536
},
{
"epoch": 0.06769672471761551,
"grad_norm": 3.1346232891082764,
"learning_rate": 1.9864682104945038e-05,
"loss": 0.6117,
"step": 1792
},
{
"epoch": 0.07736768539156058,
"grad_norm": 3.9794366359710693,
"learning_rate": 1.9845340183597147e-05,
"loss": 0.584,
"step": 2048
},
{
"epoch": 0.08703864606550565,
"grad_norm": 3.7597267627716064,
"learning_rate": 1.9825998262249255e-05,
"loss": 0.5541,
"step": 2304
},
{
"epoch": 0.09670960673945073,
"grad_norm": 3.669264078140259,
"learning_rate": 1.9806656340901363e-05,
"loss": 0.5273,
"step": 2560
},
{
"epoch": 0.10638056741339579,
"grad_norm": 3.203001022338867,
"learning_rate": 1.9787314419553475e-05,
"loss": 0.5148,
"step": 2816
},
{
"epoch": 0.11605152808734086,
"grad_norm": 4.039089202880859,
"learning_rate": 1.9767972498205587e-05,
"loss": 0.4907,
"step": 3072
},
{
"epoch": 0.12572248876128594,
"grad_norm": 3.2784998416900635,
"learning_rate": 1.9748630576857695e-05,
"loss": 0.4825,
"step": 3328
},
{
"epoch": 0.13539344943523102,
"grad_norm": 3.981826066970825,
"learning_rate": 1.9729288655509804e-05,
"loss": 0.4639,
"step": 3584
},
{
"epoch": 0.1450644101091761,
"grad_norm": 4.3725690841674805,
"learning_rate": 1.9709946734161916e-05,
"loss": 0.4522,
"step": 3840
},
{
"epoch": 0.15473537078312116,
"grad_norm": 4.14705753326416,
"learning_rate": 1.969068036719429e-05,
"loss": 0.4452,
"step": 4096
},
{
"epoch": 0.16440633145706623,
"grad_norm": 3.336223840713501,
"learning_rate": 1.96713384458464e-05,
"loss": 0.4292,
"step": 4352
},
{
"epoch": 0.1740772921310113,
"grad_norm": 4.36456823348999,
"learning_rate": 1.9651996524498508e-05,
"loss": 0.4108,
"step": 4608
},
{
"epoch": 0.18374825280495638,
"grad_norm": 3.929685354232788,
"learning_rate": 1.9632654603150617e-05,
"loss": 0.403,
"step": 4864
},
{
"epoch": 0.19341921347890145,
"grad_norm": 4.6235671043396,
"learning_rate": 1.961331268180273e-05,
"loss": 0.3899,
"step": 5120
},
{
"epoch": 0.2030901741528465,
"grad_norm": 4.0524492263793945,
"learning_rate": 1.959397076045484e-05,
"loss": 0.3913,
"step": 5376
},
{
"epoch": 0.21276113482679157,
"grad_norm": 3.8945560455322266,
"learning_rate": 1.957462883910695e-05,
"loss": 0.3781,
"step": 5632
},
{
"epoch": 0.22243209550073664,
"grad_norm": 4.181601047515869,
"learning_rate": 1.9555286917759057e-05,
"loss": 0.3758,
"step": 5888
},
{
"epoch": 0.23210305617468172,
"grad_norm": 5.5385308265686035,
"learning_rate": 1.9536020550791436e-05,
"loss": 0.3646,
"step": 6144
},
{
"epoch": 0.2417740168486268,
"grad_norm": 5.160412311553955,
"learning_rate": 1.9516678629443545e-05,
"loss": 0.3572,
"step": 6400
},
{
"epoch": 0.2514449775225719,
"grad_norm": 6.071929931640625,
"learning_rate": 1.9497336708095653e-05,
"loss": 0.3453,
"step": 6656
},
{
"epoch": 0.26111593819651696,
"grad_norm": 4.409694671630859,
"learning_rate": 1.947799478674776e-05,
"loss": 0.3504,
"step": 6912
},
{
"epoch": 0.27078689887046203,
"grad_norm": 4.06134033203125,
"learning_rate": 1.9458652865399873e-05,
"loss": 0.3404,
"step": 7168
},
{
"epoch": 0.2804578595444071,
"grad_norm": 3.8032515048980713,
"learning_rate": 1.9439310944051982e-05,
"loss": 0.34,
"step": 7424
},
{
"epoch": 0.2901288202183522,
"grad_norm": 4.95781135559082,
"learning_rate": 1.9419969022704094e-05,
"loss": 0.3249,
"step": 7680
},
{
"epoch": 0.29979978089229725,
"grad_norm": 3.898789167404175,
"learning_rate": 1.9400627101356202e-05,
"loss": 0.3218,
"step": 7936
},
{
"epoch": 0.3094707415662423,
"grad_norm": 4.6803717613220215,
"learning_rate": 1.9381285180008314e-05,
"loss": 0.3144,
"step": 8192
},
{
"epoch": 0.3191417022401874,
"grad_norm": 6.2057600021362305,
"learning_rate": 1.936201881304069e-05,
"loss": 0.3056,
"step": 8448
},
{
"epoch": 0.32881266291413247,
"grad_norm": 4.742001056671143,
"learning_rate": 1.9342676891692798e-05,
"loss": 0.3031,
"step": 8704
},
{
"epoch": 0.33848362358807754,
"grad_norm": 5.605335235595703,
"learning_rate": 1.9323334970344906e-05,
"loss": 0.2989,
"step": 8960
},
{
"epoch": 0.3481545842620226,
"grad_norm": 5.512292861938477,
"learning_rate": 1.9303993048997015e-05,
"loss": 0.2838,
"step": 9216
},
{
"epoch": 0.3578255449359677,
"grad_norm": 5.346792697906494,
"learning_rate": 1.9284651127649127e-05,
"loss": 0.2871,
"step": 9472
},
{
"epoch": 0.36749650560991276,
"grad_norm": 3.5019690990448,
"learning_rate": 1.926530920630124e-05,
"loss": 0.2794,
"step": 9728
},
{
"epoch": 0.37716746628385783,
"grad_norm": 4.682333946228027,
"learning_rate": 1.9245967284953347e-05,
"loss": 0.2736,
"step": 9984
},
{
"epoch": 0.3868384269578029,
"grad_norm": 7.038910865783691,
"learning_rate": 1.9226625363605455e-05,
"loss": 0.2786,
"step": 10240
},
{
"epoch": 0.396509387631748,
"grad_norm": 4.099844455718994,
"learning_rate": 1.9207283442257567e-05,
"loss": 0.2721,
"step": 10496
},
{
"epoch": 0.406180348305693,
"grad_norm": 3.918942928314209,
"learning_rate": 1.9187941520909676e-05,
"loss": 0.2704,
"step": 10752
},
{
"epoch": 0.41585130897963807,
"grad_norm": 5.411423683166504,
"learning_rate": 1.9168599599561784e-05,
"loss": 0.2604,
"step": 11008
},
{
"epoch": 0.42552226965358314,
"grad_norm": 7.702000617980957,
"learning_rate": 1.9149257678213896e-05,
"loss": 0.2618,
"step": 11264
},
{
"epoch": 0.4351932303275282,
"grad_norm": 4.103521347045898,
"learning_rate": 1.912999131124627e-05,
"loss": 0.2511,
"step": 11520
},
{
"epoch": 0.4448641910014733,
"grad_norm": 6.066595077514648,
"learning_rate": 1.911064938989838e-05,
"loss": 0.2551,
"step": 11776
},
{
"epoch": 0.45453515167541836,
"grad_norm": 6.25346565246582,
"learning_rate": 1.9091307468550492e-05,
"loss": 0.2499,
"step": 12032
},
{
"epoch": 0.46420611234936343,
"grad_norm": 4.310111045837402,
"learning_rate": 1.90719655472026e-05,
"loss": 0.2403,
"step": 12288
},
{
"epoch": 0.4738770730233085,
"grad_norm": 6.692182540893555,
"learning_rate": 1.9052623625854712e-05,
"loss": 0.24,
"step": 12544
},
{
"epoch": 0.4835480336972536,
"grad_norm": 4.0325751304626465,
"learning_rate": 1.903328170450682e-05,
"loss": 0.2383,
"step": 12800
},
{
"epoch": 0.49321899437119865,
"grad_norm": 4.97512149810791,
"learning_rate": 1.901393978315893e-05,
"loss": 0.2333,
"step": 13056
},
{
"epoch": 0.5028899550451438,
"grad_norm": 4.146473407745361,
"learning_rate": 1.899459786181104e-05,
"loss": 0.2342,
"step": 13312
},
{
"epoch": 0.5125609157190888,
"grad_norm": 6.477240562438965,
"learning_rate": 1.897525594046315e-05,
"loss": 0.23,
"step": 13568
},
{
"epoch": 0.5222318763930339,
"grad_norm": 5.060920715332031,
"learning_rate": 1.895591401911526e-05,
"loss": 0.2317,
"step": 13824
},
{
"epoch": 0.5319028370669789,
"grad_norm": 7.546407222747803,
"learning_rate": 1.893657209776737e-05,
"loss": 0.2235,
"step": 14080
},
{
"epoch": 0.5415737977409241,
"grad_norm": 6.76540994644165,
"learning_rate": 1.8917230176419478e-05,
"loss": 0.2189,
"step": 14336
},
{
"epoch": 0.5512447584148691,
"grad_norm": 6.734369277954102,
"learning_rate": 1.889788825507159e-05,
"loss": 0.2136,
"step": 14592
},
{
"epoch": 0.5609157190888142,
"grad_norm": 4.962408065795898,
"learning_rate": 1.8878546333723698e-05,
"loss": 0.2116,
"step": 14848
},
{
"epoch": 0.5705866797627592,
"grad_norm": 6.1386332511901855,
"learning_rate": 1.8859279966756074e-05,
"loss": 0.212,
"step": 15104
},
{
"epoch": 0.5802576404367044,
"grad_norm": 6.326384544372559,
"learning_rate": 1.8839938045408182e-05,
"loss": 0.2074,
"step": 15360
},
{
"epoch": 0.5899286011106494,
"grad_norm": 6.425912857055664,
"learning_rate": 1.8820596124060294e-05,
"loss": 0.2043,
"step": 15616
},
{
"epoch": 0.5995995617845945,
"grad_norm": 5.6023945808410645,
"learning_rate": 1.8801254202712406e-05,
"loss": 0.205,
"step": 15872
},
{
"epoch": 0.6092705224585395,
"grad_norm": 5.436675071716309,
"learning_rate": 1.8781912281364514e-05,
"loss": 0.2,
"step": 16128
},
{
"epoch": 0.6189414831324846,
"grad_norm": 3.5356578826904297,
"learning_rate": 1.8762570360016623e-05,
"loss": 0.1957,
"step": 16384
},
{
"epoch": 0.6286124438064297,
"grad_norm": 4.914231777191162,
"learning_rate": 1.874322843866873e-05,
"loss": 0.1957,
"step": 16640
},
{
"epoch": 0.6382834044803748,
"grad_norm": 5.829110145568848,
"learning_rate": 1.8723886517320843e-05,
"loss": 0.1936,
"step": 16896
},
{
"epoch": 0.6479543651543198,
"grad_norm": 9.775616645812988,
"learning_rate": 1.8704544595972955e-05,
"loss": 0.194,
"step": 17152
},
{
"epoch": 0.6576253258282649,
"grad_norm": 3.6314735412597656,
"learning_rate": 1.8685202674625063e-05,
"loss": 0.1862,
"step": 17408
},
{
"epoch": 0.66729628650221,
"grad_norm": 4.77644681930542,
"learning_rate": 1.8665860753277172e-05,
"loss": 0.1828,
"step": 17664
},
{
"epoch": 0.6769672471761551,
"grad_norm": 7.319884300231934,
"learning_rate": 1.8646518831929284e-05,
"loss": 0.1879,
"step": 17920
},
{
"epoch": 0.6866382078501001,
"grad_norm": 5.536057949066162,
"learning_rate": 1.8627176910581392e-05,
"loss": 0.1836,
"step": 18176
},
{
"epoch": 0.6963091685240452,
"grad_norm": 5.481319904327393,
"learning_rate": 1.86078349892335e-05,
"loss": 0.1802,
"step": 18432
},
{
"epoch": 0.7059801291979902,
"grad_norm": 6.011005401611328,
"learning_rate": 1.8588493067885612e-05,
"loss": 0.1824,
"step": 18688
},
{
"epoch": 0.7156510898719354,
"grad_norm": 5.187521457672119,
"learning_rate": 1.8569151146537724e-05,
"loss": 0.1763,
"step": 18944
},
{
"epoch": 0.7253220505458804,
"grad_norm": 6.904630661010742,
"learning_rate": 1.8549884779570096e-05,
"loss": 0.1719,
"step": 19200
},
{
"epoch": 0.7349930112198255,
"grad_norm": 7.806436538696289,
"learning_rate": 1.8530542858222208e-05,
"loss": 0.1707,
"step": 19456
},
{
"epoch": 0.7446639718937705,
"grad_norm": 3.597665548324585,
"learning_rate": 1.8511200936874317e-05,
"loss": 0.1706,
"step": 19712
},
{
"epoch": 0.7543349325677157,
"grad_norm": 4.756324291229248,
"learning_rate": 1.849185901552643e-05,
"loss": 0.1689,
"step": 19968
},
{
"epoch": 0.7640058932416607,
"grad_norm": 5.917934894561768,
"learning_rate": 1.8472517094178537e-05,
"loss": 0.1671,
"step": 20224
},
{
"epoch": 0.7736768539156058,
"grad_norm": 7.077094554901123,
"learning_rate": 1.8453175172830645e-05,
"loss": 0.1655,
"step": 20480
},
{
"epoch": 0.7833478145895508,
"grad_norm": 4.210581302642822,
"learning_rate": 1.8433833251482757e-05,
"loss": 0.1576,
"step": 20736
},
{
"epoch": 0.793018775263496,
"grad_norm": 4.523745059967041,
"learning_rate": 1.8414491330134866e-05,
"loss": 0.1601,
"step": 20992
},
{
"epoch": 0.802689735937441,
"grad_norm": 4.547347545623779,
"learning_rate": 1.8395149408786977e-05,
"loss": 0.1583,
"step": 21248
},
{
"epoch": 0.812360696611386,
"grad_norm": 4.029369831085205,
"learning_rate": 1.837588304181935e-05,
"loss": 0.1576,
"step": 21504
},
{
"epoch": 0.8220316572853311,
"grad_norm": 5.123602867126465,
"learning_rate": 1.835654112047146e-05,
"loss": 0.1514,
"step": 21760
},
{
"epoch": 0.8317026179592761,
"grad_norm": 6.265158176422119,
"learning_rate": 1.833719919912357e-05,
"loss": 0.157,
"step": 22016
},
{
"epoch": 0.8413735786332213,
"grad_norm": 8.210796356201172,
"learning_rate": 1.8317857277775682e-05,
"loss": 0.1503,
"step": 22272
},
{
"epoch": 0.8510445393071663,
"grad_norm": 10.078185081481934,
"learning_rate": 1.829851535642779e-05,
"loss": 0.15,
"step": 22528
},
{
"epoch": 0.8607154999811114,
"grad_norm": 6.486992359161377,
"learning_rate": 1.82791734350799e-05,
"loss": 0.1484,
"step": 22784
},
{
"epoch": 0.8703864606550564,
"grad_norm": 6.386577129364014,
"learning_rate": 1.825983151373201e-05,
"loss": 0.1476,
"step": 23040
},
{
"epoch": 0.8800574213290016,
"grad_norm": 7.5579328536987305,
"learning_rate": 1.8240489592384122e-05,
"loss": 0.1458,
"step": 23296
},
{
"epoch": 0.8897283820029466,
"grad_norm": 3.283404588699341,
"learning_rate": 1.8221223225416495e-05,
"loss": 0.144,
"step": 23552
},
{
"epoch": 0.8993993426768917,
"grad_norm": 7.462500095367432,
"learning_rate": 1.8201881304068606e-05,
"loss": 0.1475,
"step": 23808
},
{
"epoch": 0.9090703033508367,
"grad_norm": 4.219975471496582,
"learning_rate": 1.8182539382720715e-05,
"loss": 0.1415,
"step": 24064
},
{
"epoch": 0.9187412640247818,
"grad_norm": 5.009161949157715,
"learning_rate": 1.8163197461372823e-05,
"loss": 0.1395,
"step": 24320
},
{
"epoch": 0.9284122246987269,
"grad_norm": 5.921178340911865,
"learning_rate": 1.8143855540024935e-05,
"loss": 0.1381,
"step": 24576
},
{
"epoch": 0.938083185372672,
"grad_norm": 5.374543190002441,
"learning_rate": 1.8124513618677044e-05,
"loss": 0.1352,
"step": 24832
},
{
"epoch": 0.947754146046617,
"grad_norm": 3.8733317852020264,
"learning_rate": 1.8105171697329152e-05,
"loss": 0.1346,
"step": 25088
},
{
"epoch": 0.9574251067205621,
"grad_norm": 4.049707412719727,
"learning_rate": 1.8085829775981264e-05,
"loss": 0.1319,
"step": 25344
},
{
"epoch": 0.9670960673945072,
"grad_norm": 7.517127990722656,
"learning_rate": 1.806656340901364e-05,
"loss": 0.1271,
"step": 25600
},
{
"epoch": 0.9767670280684523,
"grad_norm": 4.687051773071289,
"learning_rate": 1.8047221487665748e-05,
"loss": 0.1279,
"step": 25856
},
{
"epoch": 0.9864379887423973,
"grad_norm": 4.79626989364624,
"learning_rate": 1.802787956631786e-05,
"loss": 0.1307,
"step": 26112
},
{
"epoch": 0.9961089494163424,
"grad_norm": 4.730831623077393,
"learning_rate": 1.8008537644969968e-05,
"loss": 0.1302,
"step": 26368
},
{
"epoch": 1.0,
"eval_f1_B-DISEASE": 0.7781765393765878,
"eval_f1_B-MEDICATION": 0.9037345902828137,
"eval_f1_B-PROCEDURE": 0.7974038223998922,
"eval_f1_B-SYMPTOM": 0.7777604788347432,
"eval_f1_I-DISEASE": 0.8292819119234635,
"eval_f1_I-MEDICATION": 0.9226245076350295,
"eval_f1_I-PROCEDURE": 0.8287028141772023,
"eval_f1_I-SYMPTOM": 0.7961978076970171,
"eval_f1_O": 0.9184682391128007,
"eval_f1_macro": 0.8391500790488389,
"eval_f1_micro": 0.8767886171279684,
"eval_loss": 0.26655662059783936,
"eval_precision_B-DISEASE": 0.7914206036745407,
"eval_precision_B-MEDICATION": 0.9209310918159985,
"eval_precision_B-PROCEDURE": 0.839345657415725,
"eval_precision_B-SYMPTOM": 0.7863714275719733,
"eval_precision_I-DISEASE": 0.8204249990792915,
"eval_precision_I-MEDICATION": 0.9416267415606586,
"eval_precision_I-PROCEDURE": 0.8691026329930145,
"eval_precision_I-SYMPTOM": 0.7889775161164393,
"eval_precision_O": 0.9252825164715074,
"eval_precision_macro": 0.8537203540776832,
"eval_precision_micro": 0.8833806029697474,
"eval_rauc_macro": 0.9021063420010184,
"eval_rauc_micro": 0.9278253367848399,
"eval_recall_B-DISEASE": 0.7653684461013722,
"eval_recall_B-MEDICATION": 0.8871685353265706,
"eval_recall_B-PROCEDURE": 0.7594541409993155,
"eval_recall_B-SYMPTOM": 0.7693360711841205,
"eval_recall_I-DISEASE": 0.838332141647537,
"eval_recall_I-MEDICATION": 0.9043740413603427,
"eval_recall_I-PROCEDURE": 0.7918920903816495,
"eval_recall_I-SYMPTOM": 0.8035514721684934,
"eval_recall_O": 0.9117535959899989,
"eval_recall_macro": 0.8256922816843777,
"eval_recall_micro": 0.8702942843552489,
"eval_roc_auc_B-DISEASE": 0.8808075963149171,
"eval_roc_auc_B-MEDICATION": 0.9434285957498447,
"eval_roc_auc_B-PROCEDURE": 0.87847497845947,
"eval_roc_auc_B-SYMPTOM": 0.8824080001390723,
"eval_roc_auc_I-DISEASE": 0.9071844217170272,
"eval_roc_auc_I-MEDICATION": 0.9517977149811767,
"eval_roc_auc_I-PROCEDURE": 0.8901357064770181,
"eval_roc_auc_I-SYMPTOM": 0.8850274935590098,
"eval_roc_auc_O": 0.8996925706116287,
"eval_runtime": 61.1466,
"eval_samples_per_second": 177.818,
"eval_steps_per_second": 22.242,
"step": 26471
},
{
"epoch": 1.0057799100902876,
"grad_norm": 3.7280209064483643,
"learning_rate": 1.798919572362208e-05,
"loss": 0.1119,
"step": 26624
},
{
"epoch": 1.0154508707642325,
"grad_norm": 5.684998512268066,
"learning_rate": 1.796985380227419e-05,
"loss": 0.0936,
"step": 26880
},
{
"epoch": 1.0251218314381776,
"grad_norm": 3.695190191268921,
"learning_rate": 1.7950511880926297e-05,
"loss": 0.0955,
"step": 27136
},
{
"epoch": 1.0347927921121227,
"grad_norm": 4.493898868560791,
"learning_rate": 1.793116995957841e-05,
"loss": 0.0922,
"step": 27392
},
{
"epoch": 1.0444637527860678,
"grad_norm": 4.638331413269043,
"learning_rate": 1.7911828038230517e-05,
"loss": 0.0923,
"step": 27648
},
{
"epoch": 1.0541347134600128,
"grad_norm": 4.798746585845947,
"learning_rate": 1.7892561671262893e-05,
"loss": 0.0918,
"step": 27904
},
{
"epoch": 1.0638056741339579,
"grad_norm": 4.274206638336182,
"learning_rate": 1.7873219749915e-05,
"loss": 0.0945,
"step": 28160
},
{
"epoch": 1.073476634807903,
"grad_norm": 3.235424280166626,
"learning_rate": 1.7853877828567113e-05,
"loss": 0.0919,
"step": 28416
},
{
"epoch": 1.0831475954818481,
"grad_norm": 4.507290363311768,
"learning_rate": 1.783453590721922e-05,
"loss": 0.0932,
"step": 28672
},
{
"epoch": 1.092818556155793,
"grad_norm": 10.315567016601562,
"learning_rate": 1.7815193985871333e-05,
"loss": 0.0952,
"step": 28928
},
{
"epoch": 1.1024895168297382,
"grad_norm": 8.936885833740234,
"learning_rate": 1.7795852064523442e-05,
"loss": 0.0899,
"step": 29184
},
{
"epoch": 1.1121604775036833,
"grad_norm": 2.79886531829834,
"learning_rate": 1.777651014317555e-05,
"loss": 0.0901,
"step": 29440
},
{
"epoch": 1.1218314381776284,
"grad_norm": 3.2710986137390137,
"learning_rate": 1.7757168221827662e-05,
"loss": 0.0883,
"step": 29696
},
{
"epoch": 1.1315023988515733,
"grad_norm": 4.917572498321533,
"learning_rate": 1.7737826300479774e-05,
"loss": 0.0896,
"step": 29952
},
{
"epoch": 1.1411733595255185,
"grad_norm": 4.567966938018799,
"learning_rate": 1.7718484379131882e-05,
"loss": 0.0914,
"step": 30208
},
{
"epoch": 1.1508443201994636,
"grad_norm": 3.6949679851531982,
"learning_rate": 1.769914245778399e-05,
"loss": 0.0871,
"step": 30464
},
{
"epoch": 1.1605152808734087,
"grad_norm": 8.372673988342285,
"learning_rate": 1.7679876090816366e-05,
"loss": 0.0909,
"step": 30720
},
{
"epoch": 1.1701862415473536,
"grad_norm": 3.8434600830078125,
"learning_rate": 1.7660534169468478e-05,
"loss": 0.0849,
"step": 30976
},
{
"epoch": 1.1798572022212988,
"grad_norm": 4.115856647491455,
"learning_rate": 1.7641192248120587e-05,
"loss": 0.0904,
"step": 31232
},
{
"epoch": 1.1895281628952439,
"grad_norm": 3.246572971343994,
"learning_rate": 1.7621850326772695e-05,
"loss": 0.0907,
"step": 31488
},
{
"epoch": 1.199199123569189,
"grad_norm": 3.668151617050171,
"learning_rate": 1.7602508405424807e-05,
"loss": 0.0864,
"step": 31744
},
{
"epoch": 1.208870084243134,
"grad_norm": 3.0340752601623535,
"learning_rate": 1.7583166484076915e-05,
"loss": 0.0848,
"step": 32000
},
{
"epoch": 1.218541044917079,
"grad_norm": 4.029708385467529,
"learning_rate": 1.7563824562729027e-05,
"loss": 0.0857,
"step": 32256
},
{
"epoch": 1.2282120055910242,
"grad_norm": 5.181060791015625,
"learning_rate": 1.7544482641381136e-05,
"loss": 0.0863,
"step": 32512
},
{
"epoch": 1.2378829662649693,
"grad_norm": 5.2258124351501465,
"learning_rate": 1.752521627441351e-05,
"loss": 0.0867,
"step": 32768
},
{
"epoch": 1.2475539269389142,
"grad_norm": 10.210968017578125,
"learning_rate": 1.750587435306562e-05,
"loss": 0.0878,
"step": 33024
},
{
"epoch": 1.2572248876128593,
"grad_norm": 3.4898252487182617,
"learning_rate": 1.748653243171773e-05,
"loss": 0.0831,
"step": 33280
},
{
"epoch": 1.2668958482868045,
"grad_norm": 4.27427864074707,
"learning_rate": 1.746719051036984e-05,
"loss": 0.0864,
"step": 33536
},
{
"epoch": 1.2765668089607494,
"grad_norm": 5.286701679229736,
"learning_rate": 1.744784858902195e-05,
"loss": 0.0799,
"step": 33792
},
{
"epoch": 1.2862377696346945,
"grad_norm": 3.2482128143310547,
"learning_rate": 1.742850666767406e-05,
"loss": 0.084,
"step": 34048
},
{
"epoch": 1.2959087303086396,
"grad_norm": 2.9942526817321777,
"learning_rate": 1.7409164746326172e-05,
"loss": 0.0834,
"step": 34304
},
{
"epoch": 1.3055796909825848,
"grad_norm": 9.361547470092773,
"learning_rate": 1.738982282497828e-05,
"loss": 0.0851,
"step": 34560
},
{
"epoch": 1.3152506516565299,
"grad_norm": 5.259056568145752,
"learning_rate": 1.737048090363039e-05,
"loss": 0.0824,
"step": 34816
},
{
"epoch": 1.3249216123304748,
"grad_norm": 4.652898788452148,
"learning_rate": 1.7351138982282497e-05,
"loss": 0.0807,
"step": 35072
},
{
"epoch": 1.33459257300442,
"grad_norm": 3.225607395172119,
"learning_rate": 1.733179706093461e-05,
"loss": 0.0833,
"step": 35328
},
{
"epoch": 1.344263533678365,
"grad_norm": 4.242973804473877,
"learning_rate": 1.7312530693966985e-05,
"loss": 0.0785,
"step": 35584
},
{
"epoch": 1.35393449435231,
"grad_norm": 3.6310012340545654,
"learning_rate": 1.7293188772619093e-05,
"loss": 0.082,
"step": 35840
},
{
"epoch": 1.363605455026255,
"grad_norm": 4.149777412414551,
"learning_rate": 1.72738468512712e-05,
"loss": 0.0788,
"step": 36096
},
{
"epoch": 1.3732764157002002,
"grad_norm": 3.4874989986419678,
"learning_rate": 1.7254504929923313e-05,
"loss": 0.0813,
"step": 36352
},
{
"epoch": 1.3829473763741453,
"grad_norm": 4.847866535186768,
"learning_rate": 1.7235163008575425e-05,
"loss": 0.0762,
"step": 36608
},
{
"epoch": 1.3926183370480905,
"grad_norm": 6.0248332023620605,
"learning_rate": 1.7215821087227534e-05,
"loss": 0.084,
"step": 36864
},
{
"epoch": 1.4022892977220354,
"grad_norm": 12.932506561279297,
"learning_rate": 1.7196479165879642e-05,
"loss": 0.0774,
"step": 37120
},
{
"epoch": 1.4119602583959805,
"grad_norm": 4.421403884887695,
"learning_rate": 1.7177137244531754e-05,
"loss": 0.0745,
"step": 37376
},
{
"epoch": 1.4216312190699256,
"grad_norm": 4.352053165435791,
"learning_rate": 1.7157795323183862e-05,
"loss": 0.0766,
"step": 37632
},
{
"epoch": 1.4313021797438705,
"grad_norm": 3.0803287029266357,
"learning_rate": 1.7138528956216238e-05,
"loss": 0.0786,
"step": 37888
},
{
"epoch": 1.4409731404178157,
"grad_norm": 9.046032905578613,
"learning_rate": 1.7119187034868347e-05,
"loss": 0.0792,
"step": 38144
},
{
"epoch": 1.4506441010917608,
"grad_norm": 5.227222442626953,
"learning_rate": 1.709984511352046e-05,
"loss": 0.0782,
"step": 38400
},
{
"epoch": 1.460315061765706,
"grad_norm": 9.277040481567383,
"learning_rate": 1.7080503192172567e-05,
"loss": 0.0734,
"step": 38656
},
{
"epoch": 1.469986022439651,
"grad_norm": 6.931709289550781,
"learning_rate": 1.706116127082468e-05,
"loss": 0.0745,
"step": 38912
},
{
"epoch": 1.479656983113596,
"grad_norm": 2.403529167175293,
"learning_rate": 1.7041819349476787e-05,
"loss": 0.0713,
"step": 39168
},
{
"epoch": 1.489327943787541,
"grad_norm": 3.0608630180358887,
"learning_rate": 1.7022477428128895e-05,
"loss": 0.0724,
"step": 39424
},
{
"epoch": 1.4989989044614862,
"grad_norm": 2.9378268718719482,
"learning_rate": 1.7003135506781007e-05,
"loss": 0.0719,
"step": 39680
},
{
"epoch": 1.508669865135431,
"grad_norm": 4.745122909545898,
"learning_rate": 1.6983869139813383e-05,
"loss": 0.0755,
"step": 39936
},
{
"epoch": 1.5183408258093762,
"grad_norm": 7.573899745941162,
"learning_rate": 1.696452721846549e-05,
"loss": 0.0731,
"step": 40192
},
{
"epoch": 1.5280117864833214,
"grad_norm": 10.226018905639648,
"learning_rate": 1.69451852971176e-05,
"loss": 0.076,
"step": 40448
},
{
"epoch": 1.5376827471572665,
"grad_norm": 5.051877021789551,
"learning_rate": 1.692584337576971e-05,
"loss": 0.075,
"step": 40704
},
{
"epoch": 1.5473537078312116,
"grad_norm": 4.395775318145752,
"learning_rate": 1.6906501454421823e-05,
"loss": 0.0735,
"step": 40960
},
{
"epoch": 1.5570246685051568,
"grad_norm": 4.498766899108887,
"learning_rate": 1.6887159533073932e-05,
"loss": 0.0729,
"step": 41216
},
{
"epoch": 1.5666956291791017,
"grad_norm": 5.933803558349609,
"learning_rate": 1.686781761172604e-05,
"loss": 0.0748,
"step": 41472
},
{
"epoch": 1.5763665898530468,
"grad_norm": 2.9409236907958984,
"learning_rate": 1.6848475690378152e-05,
"loss": 0.07,
"step": 41728
},
{
"epoch": 1.5860375505269917,
"grad_norm": 8.31312370300293,
"learning_rate": 1.6829209323410528e-05,
"loss": 0.0703,
"step": 41984
},
{
"epoch": 1.5957085112009368,
"grad_norm": 1.95456862449646,
"learning_rate": 1.6809867402062636e-05,
"loss": 0.0709,
"step": 42240
},
{
"epoch": 1.605379471874882,
"grad_norm": 3.6376004219055176,
"learning_rate": 1.6790525480714745e-05,
"loss": 0.0656,
"step": 42496
},
{
"epoch": 1.615050432548827,
"grad_norm": 3.3740224838256836,
"learning_rate": 1.6771183559366853e-05,
"loss": 0.0728,
"step": 42752
},
{
"epoch": 1.6247213932227722,
"grad_norm": 2.608504295349121,
"learning_rate": 1.6751841638018965e-05,
"loss": 0.0723,
"step": 43008
},
{
"epoch": 1.634392353896717,
"grad_norm": 5.380160808563232,
"learning_rate": 1.6732499716671077e-05,
"loss": 0.0686,
"step": 43264
},
{
"epoch": 1.6440633145706622,
"grad_norm": 1.6728038787841797,
"learning_rate": 1.6713157795323185e-05,
"loss": 0.0668,
"step": 43520
},
{
"epoch": 1.6537342752446071,
"grad_norm": 7.20682430267334,
"learning_rate": 1.6693815873975294e-05,
"loss": 0.0689,
"step": 43776
},
{
"epoch": 1.6634052359185523,
"grad_norm": 9.442398071289062,
"learning_rate": 1.667454950700767e-05,
"loss": 0.0669,
"step": 44032
},
{
"epoch": 1.6730761965924974,
"grad_norm": 3.7477312088012695,
"learning_rate": 1.665520758565978e-05,
"loss": 0.0647,
"step": 44288
},
{
"epoch": 1.6827471572664425,
"grad_norm": 4.700344085693359,
"learning_rate": 1.663586566431189e-05,
"loss": 0.0712,
"step": 44544
},
{
"epoch": 1.6924181179403877,
"grad_norm": 3.5288517475128174,
"learning_rate": 1.6616523742963998e-05,
"loss": 0.0678,
"step": 44800
},
{
"epoch": 1.7020890786143328,
"grad_norm": 7.689276695251465,
"learning_rate": 1.659718182161611e-05,
"loss": 0.0668,
"step": 45056
},
{
"epoch": 1.7117600392882777,
"grad_norm": 4.36802339553833,
"learning_rate": 1.657783990026822e-05,
"loss": 0.0625,
"step": 45312
},
{
"epoch": 1.7214309999622228,
"grad_norm": 2.3436222076416016,
"learning_rate": 1.6558573533300594e-05,
"loss": 0.0655,
"step": 45568
},
{
"epoch": 1.7311019606361677,
"grad_norm": 1.5666533708572388,
"learning_rate": 1.6539231611952706e-05,
"loss": 0.0644,
"step": 45824
},
{
"epoch": 1.7407729213101129,
"grad_norm": 4.3904266357421875,
"learning_rate": 1.6519889690604814e-05,
"loss": 0.0634,
"step": 46080
},
{
"epoch": 1.750443881984058,
"grad_norm": 2.4941790103912354,
"learning_rate": 1.6500547769256926e-05,
"loss": 0.0641,
"step": 46336
},
{
"epoch": 1.760114842658003,
"grad_norm": 3.0806963443756104,
"learning_rate": 1.6481205847909034e-05,
"loss": 0.0664,
"step": 46592
},
{
"epoch": 1.7697858033319482,
"grad_norm": 6.179355621337891,
"learning_rate": 1.6461863926561143e-05,
"loss": 0.0626,
"step": 46848
},
{
"epoch": 1.7794567640058934,
"grad_norm": 1.792417287826538,
"learning_rate": 1.644252200521325e-05,
"loss": 0.0623,
"step": 47104
},
{
"epoch": 1.7891277246798383,
"grad_norm": 3.0433876514434814,
"learning_rate": 1.6423180083865363e-05,
"loss": 0.0629,
"step": 47360
},
{
"epoch": 1.7987986853537834,
"grad_norm": 8.955931663513184,
"learning_rate": 1.6403838162517475e-05,
"loss": 0.064,
"step": 47616
},
{
"epoch": 1.8084696460277283,
"grad_norm": 1.9222790002822876,
"learning_rate": 1.6384496241169583e-05,
"loss": 0.062,
"step": 47872
},
{
"epoch": 1.8181406067016734,
"grad_norm": 6.602641582489014,
"learning_rate": 1.6365154319821692e-05,
"loss": 0.0625,
"step": 48128
},
{
"epoch": 1.8278115673756186,
"grad_norm": 3.8623206615448,
"learning_rate": 1.6345812398473804e-05,
"loss": 0.0641,
"step": 48384
},
{
"epoch": 1.8374825280495637,
"grad_norm": 3.5689499378204346,
"learning_rate": 1.6326470477125912e-05,
"loss": 0.061,
"step": 48640
},
{
"epoch": 1.8471534887235088,
"grad_norm": 5.1966705322265625,
"learning_rate": 1.6307128555778024e-05,
"loss": 0.0603,
"step": 48896
},
{
"epoch": 1.856824449397454,
"grad_norm": 8.878084182739258,
"learning_rate": 1.6287862188810396e-05,
"loss": 0.0609,
"step": 49152
},
{
"epoch": 1.8664954100713989,
"grad_norm": 8.031649589538574,
"learning_rate": 1.6268520267462508e-05,
"loss": 0.0609,
"step": 49408
},
{
"epoch": 1.876166370745344,
"grad_norm": 5.966855525970459,
"learning_rate": 1.6249178346114616e-05,
"loss": 0.0603,
"step": 49664
},
{
"epoch": 1.8858373314192889,
"grad_norm": 5.956678867340088,
"learning_rate": 1.622983642476673e-05,
"loss": 0.0571,
"step": 49920
},
{
"epoch": 1.895508292093234,
"grad_norm": 4.6985650062561035,
"learning_rate": 1.6210494503418837e-05,
"loss": 0.0608,
"step": 50176
},
{
"epoch": 1.9051792527671791,
"grad_norm": 2.0274322032928467,
"learning_rate": 1.6191152582070945e-05,
"loss": 0.0601,
"step": 50432
},
{
"epoch": 1.9148502134411243,
"grad_norm": 2.5451152324676514,
"learning_rate": 1.6171810660723057e-05,
"loss": 0.0585,
"step": 50688
},
{
"epoch": 1.9245211741150694,
"grad_norm": 10.576590538024902,
"learning_rate": 1.6152468739375165e-05,
"loss": 0.0604,
"step": 50944
},
{
"epoch": 1.9341921347890145,
"grad_norm": 2.8857650756835938,
"learning_rate": 1.6133126818027277e-05,
"loss": 0.0577,
"step": 51200
},
{
"epoch": 1.9438630954629594,
"grad_norm": 3.5323078632354736,
"learning_rate": 1.6113784896679386e-05,
"loss": 0.0593,
"step": 51456
},
{
"epoch": 1.9535340561369046,
"grad_norm": 1.838157057762146,
"learning_rate": 1.6094442975331498e-05,
"loss": 0.0607,
"step": 51712
},
{
"epoch": 1.9632050168108495,
"grad_norm": 3.0781214237213135,
"learning_rate": 1.6075101053983606e-05,
"loss": 0.0579,
"step": 51968
},
{
"epoch": 1.9728759774847946,
"grad_norm": 3.3382725715637207,
"learning_rate": 1.6055759132635714e-05,
"loss": 0.0583,
"step": 52224
},
{
"epoch": 1.9825469381587397,
"grad_norm": 11.693552017211914,
"learning_rate": 1.6036417211287826e-05,
"loss": 0.06,
"step": 52480
},
{
"epoch": 1.9922178988326849,
"grad_norm": 2.506922960281372,
"learning_rate": 1.6017075289939935e-05,
"loss": 0.0565,
"step": 52736
},
{
"epoch": 2.0,
"eval_f1_B-DISEASE": 0.795667459204617,
"eval_f1_B-MEDICATION": 0.921751878321422,
"eval_f1_B-PROCEDURE": 0.8160781701088163,
"eval_f1_B-SYMPTOM": 0.7897939991838038,
"eval_f1_I-DISEASE": 0.840603319768283,
"eval_f1_I-MEDICATION": 0.9362919771083036,
"eval_f1_I-PROCEDURE": 0.8357941949344769,
"eval_f1_I-SYMPTOM": 0.7996366525364875,
"eval_f1_O": 0.9230678952157123,
"eval_f1_macro": 0.8509650607091025,
"eval_f1_micro": 0.8840404124180135,
"eval_loss": 0.31923601031303406,
"eval_precision_B-DISEASE": 0.8158783079808294,
"eval_precision_B-MEDICATION": 0.9499527856468366,
"eval_precision_B-PROCEDURE": 0.848526831070472,
"eval_precision_B-SYMPTOM": 0.8200744316297579,
"eval_precision_I-DISEASE": 0.8429946510571731,
"eval_precision_I-MEDICATION": 0.9561669515355351,
"eval_precision_I-PROCEDURE": 0.8788058788058788,
"eval_precision_I-SYMPTOM": 0.8278156741398548,
"eval_precision_O": 0.9126516403530364,
"eval_precision_macro": 0.8725407946910416,
"eval_precision_micro": 0.8876748775758254,
"eval_rauc_macro": 0.904220184377927,
"eval_rauc_micro": 0.9331179355327206,
"eval_recall_B-DISEASE": 0.7764337272943602,
"eval_recall_B-MEDICATION": 0.8951770777718455,
"eval_recall_B-PROCEDURE": 0.7860198494182067,
"eval_recall_B-SYMPTOM": 0.7616700889801505,
"eval_recall_I-DISEASE": 0.8382255171289154,
"eval_recall_I-MEDICATION": 0.9172264240757392,
"eval_recall_I-PROCEDURE": 0.7967963312035382,
"eval_recall_I-SYMPTOM": 0.7733129163980228,
"eval_recall_O": 0.9337246601871894,
"eval_recall_macro": 0.8309540658286632,
"eval_recall_micro": 0.8804355875575709,
"eval_roc_auc_B-DISEASE": 0.8865867148232266,
"eval_roc_auc_B-MEDICATION": 0.9474921532385823,
"eval_roc_auc_B-PROCEDURE": 0.8918013132047432,
"eval_roc_auc_B-SYMPTOM": 0.8790279783173326,
"eval_roc_auc_I-DISEASE": 0.9089187734702582,
"eval_roc_auc_I-MEDICATION": 0.9583212327636237,
"eval_roc_auc_I-PROCEDURE": 0.8930449895535946,
"eval_roc_auc_I-SYMPTOM": 0.8741219681493123,
"eval_roc_auc_O": 0.8986665358806698,
"eval_runtime": 61.4999,
"eval_samples_per_second": 176.797,
"eval_steps_per_second": 22.114,
"step": 52942
},
{
"epoch": 2.00188885950663,
"grad_norm": 6.549783706665039,
"learning_rate": 1.5997733368592046e-05,
"loss": 0.0527,
"step": 52992
},
{
"epoch": 2.011559820180575,
"grad_norm": 17.193124771118164,
"learning_rate": 1.597846700162442e-05,
"loss": 0.0401,
"step": 53248
},
{
"epoch": 2.0212307808545202,
"grad_norm": 9.684758186340332,
"learning_rate": 1.595912508027653e-05,
"loss": 0.0405,
"step": 53504
},
{
"epoch": 2.030901741528465,
"grad_norm": 2.453227996826172,
"learning_rate": 1.5939783158928642e-05,
"loss": 0.0412,
"step": 53760
},
{
"epoch": 2.04057270220241,
"grad_norm": 5.099764347076416,
"learning_rate": 1.592044123758075e-05,
"loss": 0.0392,
"step": 54016
},
{
"epoch": 2.050243662876355,
"grad_norm": 2.8053245544433594,
"learning_rate": 1.590109931623286e-05,
"loss": 0.0388,
"step": 54272
},
{
"epoch": 2.0599146235503003,
"grad_norm": 1.1759517192840576,
"learning_rate": 1.5881832949265235e-05,
"loss": 0.0411,
"step": 54528
},
{
"epoch": 2.0695855842242454,
"grad_norm": 5.915517330169678,
"learning_rate": 1.5862491027917343e-05,
"loss": 0.0389,
"step": 54784
},
{
"epoch": 2.0792565448981906,
"grad_norm": 8.0426664352417,
"learning_rate": 1.5843149106569455e-05,
"loss": 0.0382,
"step": 55040
},
{
"epoch": 2.0889275055721357,
"grad_norm": 10.392659187316895,
"learning_rate": 1.5823807185221564e-05,
"loss": 0.0421,
"step": 55296
},
{
"epoch": 2.098598466246081,
"grad_norm": 7.73749303817749,
"learning_rate": 1.5804465263873675e-05,
"loss": 0.0389,
"step": 55552
},
{
"epoch": 2.1082694269200255,
"grad_norm": 5.712843418121338,
"learning_rate": 1.5785123342525784e-05,
"loss": 0.0403,
"step": 55808
},
{
"epoch": 2.1179403875939706,
"grad_norm": 2.4857349395751953,
"learning_rate": 1.5765781421177896e-05,
"loss": 0.0389,
"step": 56064
},
{
"epoch": 2.1276113482679158,
"grad_norm": 2.2378458976745605,
"learning_rate": 1.5746439499830004e-05,
"loss": 0.0395,
"step": 56320
},
{
"epoch": 2.137282308941861,
"grad_norm": 5.0309739112854,
"learning_rate": 1.5727097578482113e-05,
"loss": 0.0407,
"step": 56576
},
{
"epoch": 2.146953269615806,
"grad_norm": 3.6221115589141846,
"learning_rate": 1.570775565713422e-05,
"loss": 0.0413,
"step": 56832
},
{
"epoch": 2.156624230289751,
"grad_norm": 4.810079574584961,
"learning_rate": 1.5688413735786333e-05,
"loss": 0.04,
"step": 57088
},
{
"epoch": 2.1662951909636963,
"grad_norm": 2.51513671875,
"learning_rate": 1.5669071814438445e-05,
"loss": 0.0404,
"step": 57344
},
{
"epoch": 2.1759661516376414,
"grad_norm": 2.1976306438446045,
"learning_rate": 1.5649805447470817e-05,
"loss": 0.0418,
"step": 57600
},
{
"epoch": 2.185637112311586,
"grad_norm": 2.1660706996917725,
"learning_rate": 1.563046352612293e-05,
"loss": 0.0379,
"step": 57856
},
{
"epoch": 2.195308072985531,
"grad_norm": 3.0370383262634277,
"learning_rate": 1.561112160477504e-05,
"loss": 0.0386,
"step": 58112
},
{
"epoch": 2.2049790336594763,
"grad_norm": 2.958423614501953,
"learning_rate": 1.5591855237807413e-05,
"loss": 0.0395,
"step": 58368
},
{
"epoch": 2.2146499943334215,
"grad_norm": 0.8426064848899841,
"learning_rate": 1.5572513316459525e-05,
"loss": 0.0396,
"step": 58624
},
{
"epoch": 2.2243209550073666,
"grad_norm": 2.25600528717041,
"learning_rate": 1.5553171395111633e-05,
"loss": 0.0405,
"step": 58880
},
{
"epoch": 2.2339919156813117,
"grad_norm": 2.133103609085083,
"learning_rate": 1.553382947376374e-05,
"loss": 0.0391,
"step": 59136
},
{
"epoch": 2.243662876355257,
"grad_norm": 27.295085906982422,
"learning_rate": 1.5514487552415853e-05,
"loss": 0.0382,
"step": 59392
},
{
"epoch": 2.253333837029202,
"grad_norm": 3.368842840194702,
"learning_rate": 1.5495145631067962e-05,
"loss": 0.0407,
"step": 59648
},
{
"epoch": 2.2630047977031467,
"grad_norm": 1.4239710569381714,
"learning_rate": 1.5475803709720074e-05,
"loss": 0.0376,
"step": 59904
},
{
"epoch": 2.272675758377092,
"grad_norm": 4.708951473236084,
"learning_rate": 1.5456461788372182e-05,
"loss": 0.0378,
"step": 60160
},
{
"epoch": 2.282346719051037,
"grad_norm": 11.830906867980957,
"learning_rate": 1.5437119867024294e-05,
"loss": 0.0391,
"step": 60416
},
{
"epoch": 2.292017679724982,
"grad_norm": 2.8490591049194336,
"learning_rate": 1.5417777945676402e-05,
"loss": 0.0395,
"step": 60672
},
{
"epoch": 2.301688640398927,
"grad_norm": 3.398808240890503,
"learning_rate": 1.539843602432851e-05,
"loss": 0.0407,
"step": 60928
},
{
"epoch": 2.3113596010728723,
"grad_norm": 4.087090492248535,
"learning_rate": 1.537909410298062e-05,
"loss": 0.0361,
"step": 61184
},
{
"epoch": 2.3210305617468174,
"grad_norm": 2.446629762649536,
"learning_rate": 1.535975218163273e-05,
"loss": 0.0361,
"step": 61440
},
{
"epoch": 2.330701522420762,
"grad_norm": 1.8066984415054321,
"learning_rate": 1.5340410260284843e-05,
"loss": 0.0399,
"step": 61696
},
{
"epoch": 2.3403724830947072,
"grad_norm": 2.6665291786193848,
"learning_rate": 1.532106833893695e-05,
"loss": 0.0396,
"step": 61952
},
{
"epoch": 2.3500434437686524,
"grad_norm": 0.9438909292221069,
"learning_rate": 1.530172641758906e-05,
"loss": 0.0385,
"step": 62208
},
{
"epoch": 2.3597144044425975,
"grad_norm": 1.689215898513794,
"learning_rate": 1.528238449624117e-05,
"loss": 0.0399,
"step": 62464
},
{
"epoch": 2.3693853651165426,
"grad_norm": 2.397761583328247,
"learning_rate": 1.526304257489328e-05,
"loss": 0.0363,
"step": 62720
},
{
"epoch": 2.3790563257904878,
"grad_norm": 17.148651123046875,
"learning_rate": 1.524370065354539e-05,
"loss": 0.0379,
"step": 62976
},
{
"epoch": 2.388727286464433,
"grad_norm": 7.684645652770996,
"learning_rate": 1.52243587321975e-05,
"loss": 0.038,
"step": 63232
},
{
"epoch": 2.398398247138378,
"grad_norm": 2.3121824264526367,
"learning_rate": 1.520501681084961e-05,
"loss": 0.0363,
"step": 63488
},
{
"epoch": 2.408069207812323,
"grad_norm": 4.012951374053955,
"learning_rate": 1.518567488950172e-05,
"loss": 0.0369,
"step": 63744
},
{
"epoch": 2.417740168486268,
"grad_norm": 3.992743730545044,
"learning_rate": 1.5166332968153829e-05,
"loss": 0.037,
"step": 64000
},
{
"epoch": 2.427411129160213,
"grad_norm": 2.0966529846191406,
"learning_rate": 1.5147066601186205e-05,
"loss": 0.0398,
"step": 64256
},
{
"epoch": 2.437082089834158,
"grad_norm": 4.283209800720215,
"learning_rate": 1.5127724679838316e-05,
"loss": 0.0375,
"step": 64512
},
{
"epoch": 2.446753050508103,
"grad_norm": 7.317829608917236,
"learning_rate": 1.5108382758490425e-05,
"loss": 0.0385,
"step": 64768
},
{
"epoch": 2.4564240111820483,
"grad_norm": 2.1492598056793213,
"learning_rate": 1.5089040837142535e-05,
"loss": 0.038,
"step": 65024
},
{
"epoch": 2.4660949718559935,
"grad_norm": 4.824232578277588,
"learning_rate": 1.5069698915794643e-05,
"loss": 0.0404,
"step": 65280
},
{
"epoch": 2.4757659325299386,
"grad_norm": 2.757894992828369,
"learning_rate": 1.5050356994446755e-05,
"loss": 0.0379,
"step": 65536
},
{
"epoch": 2.4854368932038833,
"grad_norm": 3.4582314491271973,
"learning_rate": 1.5031015073098865e-05,
"loss": 0.0352,
"step": 65792
},
{
"epoch": 2.4951078538778284,
"grad_norm": 2.4710917472839355,
"learning_rate": 1.5011673151750974e-05,
"loss": 0.0363,
"step": 66048
},
{
"epoch": 2.5047788145517735,
"grad_norm": 2.776700973510742,
"learning_rate": 1.4992331230403084e-05,
"loss": 0.0358,
"step": 66304
},
{
"epoch": 2.5144497752257187,
"grad_norm": 3.758176326751709,
"learning_rate": 1.4972989309055194e-05,
"loss": 0.0356,
"step": 66560
},
{
"epoch": 2.524120735899664,
"grad_norm": 2.5761642456054688,
"learning_rate": 1.4953647387707304e-05,
"loss": 0.0404,
"step": 66816
},
{
"epoch": 2.533791696573609,
"grad_norm": 1.3668540716171265,
"learning_rate": 1.4934381020739678e-05,
"loss": 0.0366,
"step": 67072
},
{
"epoch": 2.543462657247554,
"grad_norm": 3.8430099487304688,
"learning_rate": 1.4915039099391788e-05,
"loss": 0.0372,
"step": 67328
},
{
"epoch": 2.5531336179214987,
"grad_norm": 5.29500675201416,
"learning_rate": 1.4895697178043897e-05,
"loss": 0.0358,
"step": 67584
},
{
"epoch": 2.5628045785954443,
"grad_norm": 0.8562812805175781,
"learning_rate": 1.4876355256696009e-05,
"loss": 0.0374,
"step": 67840
},
{
"epoch": 2.572475539269389,
"grad_norm": 4.466825008392334,
"learning_rate": 1.4857013335348119e-05,
"loss": 0.0359,
"step": 68096
},
{
"epoch": 2.582146499943334,
"grad_norm": 12.638843536376953,
"learning_rate": 1.4837746968380493e-05,
"loss": 0.0362,
"step": 68352
},
{
"epoch": 2.5918174606172792,
"grad_norm": 4.4277119636535645,
"learning_rate": 1.4818405047032603e-05,
"loss": 0.036,
"step": 68608
},
{
"epoch": 2.6014884212912244,
"grad_norm": 1.1809728145599365,
"learning_rate": 1.4799063125684711e-05,
"loss": 0.035,
"step": 68864
},
{
"epoch": 2.6111593819651695,
"grad_norm": 4.5768327713012695,
"learning_rate": 1.4779721204336823e-05,
"loss": 0.0374,
"step": 69120
},
{
"epoch": 2.6208303426391146,
"grad_norm": 4.537430763244629,
"learning_rate": 1.4760379282988933e-05,
"loss": 0.0344,
"step": 69376
},
{
"epoch": 2.6305013033130598,
"grad_norm": 1.4762442111968994,
"learning_rate": 1.4741037361641042e-05,
"loss": 0.0374,
"step": 69632
},
{
"epoch": 2.6401722639870044,
"grad_norm": 1.5577633380889893,
"learning_rate": 1.4721695440293152e-05,
"loss": 0.0353,
"step": 69888
},
{
"epoch": 2.6498432246609496,
"grad_norm": 4.222722053527832,
"learning_rate": 1.4702353518945262e-05,
"loss": 0.0359,
"step": 70144
},
{
"epoch": 2.6595141853348947,
"grad_norm": 1.9563344717025757,
"learning_rate": 1.4683011597597372e-05,
"loss": 0.0379,
"step": 70400
},
{
"epoch": 2.66918514600884,
"grad_norm": 5.85068416595459,
"learning_rate": 1.466366967624948e-05,
"loss": 0.0344,
"step": 70656
},
{
"epoch": 2.678856106682785,
"grad_norm": 2.2116239070892334,
"learning_rate": 1.464432775490159e-05,
"loss": 0.039,
"step": 70912
},
{
"epoch": 2.68852706735673,
"grad_norm": 4.683871269226074,
"learning_rate": 1.4624985833553702e-05,
"loss": 0.0343,
"step": 71168
},
{
"epoch": 2.698198028030675,
"grad_norm": 1.9998408555984497,
"learning_rate": 1.460564391220581e-05,
"loss": 0.0367,
"step": 71424
},
{
"epoch": 2.70786898870462,
"grad_norm": 1.950804352760315,
"learning_rate": 1.4586301990857921e-05,
"loss": 0.0354,
"step": 71680
},
{
"epoch": 2.7175399493785655,
"grad_norm": 2.9149844646453857,
"learning_rate": 1.456696006951003e-05,
"loss": 0.0339,
"step": 71936
},
{
"epoch": 2.72721091005251,
"grad_norm": 4.158403396606445,
"learning_rate": 1.4547618148162141e-05,
"loss": 0.0358,
"step": 72192
},
{
"epoch": 2.7368818707264553,
"grad_norm": 1.9110437631607056,
"learning_rate": 1.4528351781194517e-05,
"loss": 0.0363,
"step": 72448
},
{
"epoch": 2.7465528314004004,
"grad_norm": 4.942687034606934,
"learning_rate": 1.4509009859846625e-05,
"loss": 0.0331,
"step": 72704
},
{
"epoch": 2.7562237920743455,
"grad_norm": 4.669269561767578,
"learning_rate": 1.4489667938498735e-05,
"loss": 0.0339,
"step": 72960
},
{
"epoch": 2.7658947527482907,
"grad_norm": 2.782804012298584,
"learning_rate": 1.4470326017150846e-05,
"loss": 0.0337,
"step": 73216
},
{
"epoch": 2.775565713422236,
"grad_norm": 0.8589828014373779,
"learning_rate": 1.4450984095802956e-05,
"loss": 0.0348,
"step": 73472
},
{
"epoch": 2.785236674096181,
"grad_norm": 6.355395793914795,
"learning_rate": 1.4431642174455066e-05,
"loss": 0.0347,
"step": 73728
},
{
"epoch": 2.7949076347701256,
"grad_norm": 1.7806596755981445,
"learning_rate": 1.4412300253107174e-05,
"loss": 0.035,
"step": 73984
},
{
"epoch": 2.8045785954440707,
"grad_norm": 5.5398850440979,
"learning_rate": 1.4392958331759286e-05,
"loss": 0.0309,
"step": 74240
},
{
"epoch": 2.814249556118016,
"grad_norm": 1.2205835580825806,
"learning_rate": 1.437369196479166e-05,
"loss": 0.0318,
"step": 74496
},
{
"epoch": 2.823920516791961,
"grad_norm": 4.248105525970459,
"learning_rate": 1.435435004344377e-05,
"loss": 0.0347,
"step": 74752
},
{
"epoch": 2.833591477465906,
"grad_norm": 1.5058479309082031,
"learning_rate": 1.4335083676476144e-05,
"loss": 0.0338,
"step": 75008
},
{
"epoch": 2.8432624381398512,
"grad_norm": 3.8759660720825195,
"learning_rate": 1.4315741755128254e-05,
"loss": 0.0343,
"step": 75264
},
{
"epoch": 2.8529333988137964,
"grad_norm": 16.488771438598633,
"learning_rate": 1.4296399833780366e-05,
"loss": 0.0338,
"step": 75520
},
{
"epoch": 2.862604359487741,
"grad_norm": 6.564029693603516,
"learning_rate": 1.4277057912432475e-05,
"loss": 0.0312,
"step": 75776
},
{
"epoch": 2.8722753201616866,
"grad_norm": 1.345203161239624,
"learning_rate": 1.4257715991084585e-05,
"loss": 0.0332,
"step": 76032
},
{
"epoch": 2.8819462808356313,
"grad_norm": 2.0033822059631348,
"learning_rate": 1.4238374069736693e-05,
"loss": 0.0322,
"step": 76288
},
{
"epoch": 2.8916172415095764,
"grad_norm": 6.844017505645752,
"learning_rate": 1.4219032148388805e-05,
"loss": 0.0319,
"step": 76544
},
{
"epoch": 2.9012882021835216,
"grad_norm": 4.2425150871276855,
"learning_rate": 1.4199690227040915e-05,
"loss": 0.0322,
"step": 76800
},
{
"epoch": 2.9109591628574667,
"grad_norm": 1.8265749216079712,
"learning_rate": 1.4180348305693024e-05,
"loss": 0.0322,
"step": 77056
},
{
"epoch": 2.920630123531412,
"grad_norm": 3.0552210807800293,
"learning_rate": 1.4161006384345134e-05,
"loss": 0.033,
"step": 77312
},
{
"epoch": 2.930301084205357,
"grad_norm": 2.102796792984009,
"learning_rate": 1.4141664462997244e-05,
"loss": 0.0346,
"step": 77568
},
{
"epoch": 2.939972044879302,
"grad_norm": 1.903757929801941,
"learning_rate": 1.4122322541649354e-05,
"loss": 0.0315,
"step": 77824
},
{
"epoch": 2.9496430055532468,
"grad_norm": 9.322936058044434,
"learning_rate": 1.4102980620301462e-05,
"loss": 0.0336,
"step": 78080
},
{
"epoch": 2.959313966227192,
"grad_norm": 1.862209677696228,
"learning_rate": 1.4083714253333838e-05,
"loss": 0.0328,
"step": 78336
},
{
"epoch": 2.968984926901137,
"grad_norm": 3.4806630611419678,
"learning_rate": 1.4064372331985946e-05,
"loss": 0.0321,
"step": 78592
},
{
"epoch": 2.978655887575082,
"grad_norm": 7.490905284881592,
"learning_rate": 1.4045030410638058e-05,
"loss": 0.0321,
"step": 78848
},
{
"epoch": 2.9883268482490273,
"grad_norm": 2.008312940597534,
"learning_rate": 1.4025688489290168e-05,
"loss": 0.032,
"step": 79104
},
{
"epoch": 2.9979978089229724,
"grad_norm": 5.4629645347595215,
"learning_rate": 1.4006346567942277e-05,
"loss": 0.0316,
"step": 79360
},
{
"epoch": 3.0,
"eval_f1_B-DISEASE": 0.8058758050409478,
"eval_f1_B-MEDICATION": 0.9331298806211291,
"eval_f1_B-PROCEDURE": 0.8246479186103336,
"eval_f1_B-SYMPTOM": 0.7958159437899519,
"eval_f1_I-DISEASE": 0.8446797498113607,
"eval_f1_I-MEDICATION": 0.9445428820775924,
"eval_f1_I-PROCEDURE": 0.8431497703012539,
"eval_f1_I-SYMPTOM": 0.8064467139982535,
"eval_f1_O": 0.9242880224344192,
"eval_f1_macro": 0.8580640762983602,
"eval_f1_micro": 0.8867284724320147,
"eval_loss": 0.346194326877594,
"eval_precision_B-DISEASE": 0.8078026619909142,
"eval_precision_B-MEDICATION": 0.9413256066642521,
"eval_precision_B-PROCEDURE": 0.8576841327049256,
"eval_precision_B-SYMPTOM": 0.8196756992055719,
"eval_precision_I-DISEASE": 0.8398561507936508,
"eval_precision_I-MEDICATION": 0.9445678620543743,
"eval_precision_I-PROCEDURE": 0.8685191753683246,
"eval_precision_I-SYMPTOM": 0.8141611818689563,
"eval_precision_O": 0.922143895574372,
"eval_precision_macro": 0.8684151518028158,
"eval_precision_micro": 0.8893727212165927,
"eval_rauc_macro": 0.9135258778318731,
"eval_rauc_micro": 0.9350417116157864,
"eval_recall_B-DISEASE": 0.8039581185055922,
"eval_recall_B-MEDICATION": 0.9250756362342054,
"eval_recall_B-PROCEDURE": 0.7940622861054073,
"eval_recall_B-SYMPTOM": 0.773305954825462,
"eval_recall_I-DISEASE": 0.8495590762553469,
"eval_recall_I-MEDICATION": 0.944517903422013,
"eval_recall_I-PROCEDURE": 0.8192203807518748,
"eval_recall_I-SYMPTOM": 0.7988770685579196,
"eval_recall_O": 0.9264421433839181,
"eval_recall_macro": 0.8483353964490822,
"eval_recall_micro": 0.8840999005950059,
"eval_roc_auc_B-DISEASE": 0.9001994739703317,
"eval_roc_auc_B-MEDICATION": 0.9624199730237505,
"eval_roc_auc_B-PROCEDURE": 0.89589622737178,
"eval_roc_auc_B-SYMPTOM": 0.8848133448211472,
"eval_roc_auc_I-DISEASE": 0.914201809349682,
"eval_roc_auc_I-MEDICATION": 0.9718740532463399,
"eval_roc_auc_I-PROCEDURE": 0.9035684876000457,
"eval_roc_auc_I-SYMPTOM": 0.8852284244551051,
"eval_roc_auc_O": 0.903531106648675,
"eval_runtime": 61.221,
"eval_samples_per_second": 177.602,
"eval_steps_per_second": 22.215,
"step": 79413
},
{
"epoch": 3.0076687695969175,
"grad_norm": 4.327937602996826,
"learning_rate": 1.3987004646594387e-05,
"loss": 0.0237,
"step": 79616
},
{
"epoch": 3.0173397302708627,
"grad_norm": 1.6373872756958008,
"learning_rate": 1.3967662725246499e-05,
"loss": 0.022,
"step": 79872
},
{
"epoch": 3.0270106909448073,
"grad_norm": 3.250305652618408,
"learning_rate": 1.3948320803898607e-05,
"loss": 0.0246,
"step": 80128
},
{
"epoch": 3.0366816516187525,
"grad_norm": 1.6971690654754639,
"learning_rate": 1.3928978882550717e-05,
"loss": 0.0236,
"step": 80384
},
{
"epoch": 3.0463526122926976,
"grad_norm": 5.478879451751709,
"learning_rate": 1.3909636961202826e-05,
"loss": 0.0219,
"step": 80640
},
{
"epoch": 3.0560235729666427,
"grad_norm": 2.4806175231933594,
"learning_rate": 1.3890295039854938e-05,
"loss": 0.0236,
"step": 80896
},
{
"epoch": 3.065694533640588,
"grad_norm": 1.5560436248779297,
"learning_rate": 1.3870953118507046e-05,
"loss": 0.0229,
"step": 81152
},
{
"epoch": 3.075365494314533,
"grad_norm": 10.51571273803711,
"learning_rate": 1.3851611197159156e-05,
"loss": 0.0246,
"step": 81408
},
{
"epoch": 3.085036454988478,
"grad_norm": 4.828140735626221,
"learning_rate": 1.3832269275811265e-05,
"loss": 0.0225,
"step": 81664
},
{
"epoch": 3.0947074156624232,
"grad_norm": 0.9167439937591553,
"learning_rate": 1.3812927354463376e-05,
"loss": 0.0241,
"step": 81920
},
{
"epoch": 3.104378376336368,
"grad_norm": 4.8147454261779785,
"learning_rate": 1.3793585433115487e-05,
"loss": 0.0226,
"step": 82176
},
{
"epoch": 3.114049337010313,
"grad_norm": 5.181445121765137,
"learning_rate": 1.3774243511767595e-05,
"loss": 0.0202,
"step": 82432
},
{
"epoch": 3.123720297684258,
"grad_norm": 1.4374691247940063,
"learning_rate": 1.375497714479997e-05,
"loss": 0.0221,
"step": 82688
},
{
"epoch": 3.1333912583582033,
"grad_norm": 3.805264949798584,
"learning_rate": 1.3735635223452082e-05,
"loss": 0.0241,
"step": 82944
},
{
"epoch": 3.1430622190321484,
"grad_norm": 3.3050577640533447,
"learning_rate": 1.3716368856484456e-05,
"loss": 0.0225,
"step": 83200
},
{
"epoch": 3.1527331797060936,
"grad_norm": 1.6958988904953003,
"learning_rate": 1.3697026935136567e-05,
"loss": 0.0233,
"step": 83456
},
{
"epoch": 3.1624041403800387,
"grad_norm": 2.1749958992004395,
"learning_rate": 1.3677685013788675e-05,
"loss": 0.024,
"step": 83712
},
{
"epoch": 3.1720751010539834,
"grad_norm": 1.0387561321258545,
"learning_rate": 1.3658343092440785e-05,
"loss": 0.0235,
"step": 83968
},
{
"epoch": 3.1817460617279285,
"grad_norm": 4.311033248901367,
"learning_rate": 1.3639001171092895e-05,
"loss": 0.025,
"step": 84224
},
{
"epoch": 3.1914170224018736,
"grad_norm": 1.0629218816757202,
"learning_rate": 1.3619659249745005e-05,
"loss": 0.0242,
"step": 84480
},
{
"epoch": 3.2010879830758188,
"grad_norm": 4.607676029205322,
"learning_rate": 1.3600317328397114e-05,
"loss": 0.0218,
"step": 84736
},
{
"epoch": 3.210758943749764,
"grad_norm": 1.2249504327774048,
"learning_rate": 1.3580975407049224e-05,
"loss": 0.0217,
"step": 84992
},
{
"epoch": 3.220429904423709,
"grad_norm": 3.8173789978027344,
"learning_rate": 1.3561633485701336e-05,
"loss": 0.0212,
"step": 85248
},
{
"epoch": 3.230100865097654,
"grad_norm": 5.286001205444336,
"learning_rate": 1.3542291564353444e-05,
"loss": 0.0234,
"step": 85504
},
{
"epoch": 3.2397718257715993,
"grad_norm": 0.9266921281814575,
"learning_rate": 1.3522949643005554e-05,
"loss": 0.0227,
"step": 85760
},
{
"epoch": 3.2494427864455444,
"grad_norm": 1.9286329746246338,
"learning_rate": 1.3503607721657663e-05,
"loss": 0.0216,
"step": 86016
},
{
"epoch": 3.259113747119489,
"grad_norm": 7.073780536651611,
"learning_rate": 1.3484265800309775e-05,
"loss": 0.0229,
"step": 86272
},
{
"epoch": 3.268784707793434,
"grad_norm": 11.505043983459473,
"learning_rate": 1.3464923878961885e-05,
"loss": 0.0216,
"step": 86528
},
{
"epoch": 3.2784556684673793,
"grad_norm": 2.463899850845337,
"learning_rate": 1.3445581957613993e-05,
"loss": 0.0238,
"step": 86784
},
{
"epoch": 3.2881266291413245,
"grad_norm": 2.2217423915863037,
"learning_rate": 1.3426240036266103e-05,
"loss": 0.0244,
"step": 87040
},
{
"epoch": 3.2977975898152696,
"grad_norm": 2.690162181854248,
"learning_rate": 1.3406898114918213e-05,
"loss": 0.0233,
"step": 87296
},
{
"epoch": 3.3074685504892147,
"grad_norm": 0.6873595118522644,
"learning_rate": 1.3387631747950589e-05,
"loss": 0.0212,
"step": 87552
},
{
"epoch": 3.31713951116316,
"grad_norm": 12.570816040039062,
"learning_rate": 1.3368289826602698e-05,
"loss": 0.021,
"step": 87808
},
{
"epoch": 3.3268104718371045,
"grad_norm": 1.3393861055374146,
"learning_rate": 1.3348947905254808e-05,
"loss": 0.0204,
"step": 88064
},
{
"epoch": 3.3364814325110497,
"grad_norm": 0.6096575856208801,
"learning_rate": 1.332960598390692e-05,
"loss": 0.0218,
"step": 88320
},
{
"epoch": 3.346152393184995,
"grad_norm": 4.549058437347412,
"learning_rate": 1.3310264062559028e-05,
"loss": 0.0232,
"step": 88576
},
{
"epoch": 3.35582335385894,
"grad_norm": 2.827040195465088,
"learning_rate": 1.3290922141211138e-05,
"loss": 0.023,
"step": 88832
},
{
"epoch": 3.365494314532885,
"grad_norm": 4.081531524658203,
"learning_rate": 1.3271580219863246e-05,
"loss": 0.0202,
"step": 89088
},
{
"epoch": 3.37516527520683,
"grad_norm": 16.549381256103516,
"learning_rate": 1.3252238298515358e-05,
"loss": 0.023,
"step": 89344
},
{
"epoch": 3.3848362358807753,
"grad_norm": 1.166902780532837,
"learning_rate": 1.3232896377167468e-05,
"loss": 0.0217,
"step": 89600
},
{
"epoch": 3.3945071965547204,
"grad_norm": 1.8393259048461914,
"learning_rate": 1.3213554455819577e-05,
"loss": 0.0226,
"step": 89856
},
{
"epoch": 3.4041781572286656,
"grad_norm": 3.180155038833618,
"learning_rate": 1.3194288088851953e-05,
"loss": 0.0216,
"step": 90112
},
{
"epoch": 3.4138491179026103,
"grad_norm": 0.5230717658996582,
"learning_rate": 1.3174946167504061e-05,
"loss": 0.022,
"step": 90368
},
{
"epoch": 3.4235200785765554,
"grad_norm": 15.037604331970215,
"learning_rate": 1.3155604246156173e-05,
"loss": 0.0234,
"step": 90624
},
{
"epoch": 3.4331910392505005,
"grad_norm": 11.155952453613281,
"learning_rate": 1.3136262324808283e-05,
"loss": 0.0224,
"step": 90880
},
{
"epoch": 3.4428619999244456,
"grad_norm": 2.1080737113952637,
"learning_rate": 1.3116920403460391e-05,
"loss": 0.023,
"step": 91136
},
{
"epoch": 3.4525329605983908,
"grad_norm": 0.7303668856620789,
"learning_rate": 1.3097578482112501e-05,
"loss": 0.0217,
"step": 91392
},
{
"epoch": 3.462203921272336,
"grad_norm": 0.6222452521324158,
"learning_rate": 1.3078236560764612e-05,
"loss": 0.0219,
"step": 91648
},
{
"epoch": 3.471874881946281,
"grad_norm": 0.8807787299156189,
"learning_rate": 1.3058894639416722e-05,
"loss": 0.0236,
"step": 91904
},
{
"epoch": 3.4815458426202257,
"grad_norm": 0.9494552612304688,
"learning_rate": 1.3039628272449096e-05,
"loss": 0.0208,
"step": 92160
},
{
"epoch": 3.491216803294171,
"grad_norm": 14.498435020446777,
"learning_rate": 1.3020286351101206e-05,
"loss": 0.0241,
"step": 92416
},
{
"epoch": 3.500887763968116,
"grad_norm": 1.3170123100280762,
"learning_rate": 1.3000944429753314e-05,
"loss": 0.0213,
"step": 92672
},
{
"epoch": 3.510558724642061,
"grad_norm": 1.3304574489593506,
"learning_rate": 1.2981602508405426e-05,
"loss": 0.0216,
"step": 92928
},
{
"epoch": 3.520229685316006,
"grad_norm": 0.5469146966934204,
"learning_rate": 1.2962260587057536e-05,
"loss": 0.0198,
"step": 93184
},
{
"epoch": 3.5299006459899513,
"grad_norm": 1.7149643898010254,
"learning_rate": 1.2942918665709645e-05,
"loss": 0.0197,
"step": 93440
},
{
"epoch": 3.5395716066638965,
"grad_norm": 2.092782974243164,
"learning_rate": 1.292365229874202e-05,
"loss": 0.0225,
"step": 93696
},
{
"epoch": 3.549242567337841,
"grad_norm": 1.180370807647705,
"learning_rate": 1.2904310377394132e-05,
"loss": 0.0204,
"step": 93952
},
{
"epoch": 3.5589135280117867,
"grad_norm": 16.842605590820312,
"learning_rate": 1.288496845604624e-05,
"loss": 0.0214,
"step": 94208
},
{
"epoch": 3.5685844886857314,
"grad_norm": 3.62001895904541,
"learning_rate": 1.286562653469835e-05,
"loss": 0.0241,
"step": 94464
},
{
"epoch": 3.5782554493596765,
"grad_norm": 2.4327309131622314,
"learning_rate": 1.284628461335046e-05,
"loss": 0.0192,
"step": 94720
},
{
"epoch": 3.5879264100336217,
"grad_norm": 5.820268154144287,
"learning_rate": 1.2826942692002571e-05,
"loss": 0.0223,
"step": 94976
},
{
"epoch": 3.597597370707567,
"grad_norm": 3.0629537105560303,
"learning_rate": 1.280760077065468e-05,
"loss": 0.02,
"step": 95232
},
{
"epoch": 3.607268331381512,
"grad_norm": 2.9143710136413574,
"learning_rate": 1.278825884930679e-05,
"loss": 0.0198,
"step": 95488
},
{
"epoch": 3.616939292055457,
"grad_norm": 1.7662220001220703,
"learning_rate": 1.2768916927958898e-05,
"loss": 0.0225,
"step": 95744
},
{
"epoch": 3.626610252729402,
"grad_norm": 3.5561130046844482,
"learning_rate": 1.274957500661101e-05,
"loss": 0.0228,
"step": 96000
},
{
"epoch": 3.636281213403347,
"grad_norm": 5.7032470703125,
"learning_rate": 1.273023308526312e-05,
"loss": 0.0208,
"step": 96256
},
{
"epoch": 3.645952174077292,
"grad_norm": 1.8125163316726685,
"learning_rate": 1.2710891163915228e-05,
"loss": 0.0212,
"step": 96512
},
{
"epoch": 3.655623134751237,
"grad_norm": 4.229706764221191,
"learning_rate": 1.2691549242567338e-05,
"loss": 0.0238,
"step": 96768
},
{
"epoch": 3.6652940954251823,
"grad_norm": 1.200060486793518,
"learning_rate": 1.267220732121945e-05,
"loss": 0.0189,
"step": 97024
},
{
"epoch": 3.6749650560991274,
"grad_norm": 3.1629979610443115,
"learning_rate": 1.2652865399871559e-05,
"loss": 0.0207,
"step": 97280
},
{
"epoch": 3.6846360167730725,
"grad_norm": 3.1145436763763428,
"learning_rate": 1.2633523478523669e-05,
"loss": 0.0201,
"step": 97536
},
{
"epoch": 3.6943069774470176,
"grad_norm": 2.600019693374634,
"learning_rate": 1.2614181557175777e-05,
"loss": 0.0208,
"step": 97792
},
{
"epoch": 3.7039779381209623,
"grad_norm": 3.338853120803833,
"learning_rate": 1.2594915190208153e-05,
"loss": 0.0209,
"step": 98048
},
{
"epoch": 3.713648898794908,
"grad_norm": 6.754782676696777,
"learning_rate": 1.2575573268860263e-05,
"loss": 0.0187,
"step": 98304
},
{
"epoch": 3.7233198594688526,
"grad_norm": 3.4177420139312744,
"learning_rate": 1.2556231347512373e-05,
"loss": 0.0216,
"step": 98560
},
{
"epoch": 3.7329908201427977,
"grad_norm": 1.6833980083465576,
"learning_rate": 1.2536889426164482e-05,
"loss": 0.0202,
"step": 98816
},
{
"epoch": 3.742661780816743,
"grad_norm": 2.7053074836730957,
"learning_rate": 1.2517547504816592e-05,
"loss": 0.0191,
"step": 99072
},
{
"epoch": 3.752332741490688,
"grad_norm": 2.020542621612549,
"learning_rate": 1.2498205583468704e-05,
"loss": 0.0195,
"step": 99328
},
{
"epoch": 3.762003702164633,
"grad_norm": 4.648097515106201,
"learning_rate": 1.2478863662120812e-05,
"loss": 0.0208,
"step": 99584
},
{
"epoch": 3.771674662838578,
"grad_norm": 1.1168490648269653,
"learning_rate": 1.2459521740772922e-05,
"loss": 0.0194,
"step": 99840
},
{
"epoch": 3.7813456235125233,
"grad_norm": 0.9811049103736877,
"learning_rate": 1.2440255373805296e-05,
"loss": 0.0207,
"step": 100096
},
{
"epoch": 3.791016584186468,
"grad_norm": 3.2866318225860596,
"learning_rate": 1.2420913452457408e-05,
"loss": 0.0208,
"step": 100352
},
{
"epoch": 3.800687544860413,
"grad_norm": 1.0944135189056396,
"learning_rate": 1.2401571531109518e-05,
"loss": 0.0216,
"step": 100608
},
{
"epoch": 3.8103585055343583,
"grad_norm": 1.5802284479141235,
"learning_rate": 1.2382229609761627e-05,
"loss": 0.0215,
"step": 100864
},
{
"epoch": 3.8200294662083034,
"grad_norm": 15.70626163482666,
"learning_rate": 1.2362887688413737e-05,
"loss": 0.0224,
"step": 101120
},
{
"epoch": 3.8297004268822485,
"grad_norm": 2.241199016571045,
"learning_rate": 1.2343545767065847e-05,
"loss": 0.0203,
"step": 101376
},
{
"epoch": 3.8393713875561937,
"grad_norm": 1.7189942598342896,
"learning_rate": 1.2324203845717957e-05,
"loss": 0.0202,
"step": 101632
},
{
"epoch": 3.849042348230139,
"grad_norm": 3.025250196456909,
"learning_rate": 1.2304861924370065e-05,
"loss": 0.0214,
"step": 101888
},
{
"epoch": 3.8587133089040835,
"grad_norm": 0.44517338275909424,
"learning_rate": 1.2285595557402441e-05,
"loss": 0.0213,
"step": 102144
},
{
"epoch": 3.868384269578029,
"grad_norm": 1.4796372652053833,
"learning_rate": 1.226625363605455e-05,
"loss": 0.0214,
"step": 102400
},
{
"epoch": 3.8780552302519737,
"grad_norm": 3.5950703620910645,
"learning_rate": 1.2246911714706661e-05,
"loss": 0.0195,
"step": 102656
},
{
"epoch": 3.887726190925919,
"grad_norm": 3.87646222114563,
"learning_rate": 1.2227569793358771e-05,
"loss": 0.0194,
"step": 102912
},
{
"epoch": 3.897397151599864,
"grad_norm": 6.18682336807251,
"learning_rate": 1.220822787201088e-05,
"loss": 0.0186,
"step": 103168
},
{
"epoch": 3.907068112273809,
"grad_norm": 4.5957207679748535,
"learning_rate": 1.218888595066299e-05,
"loss": 0.0193,
"step": 103424
},
{
"epoch": 3.9167390729477543,
"grad_norm": 11.035417556762695,
"learning_rate": 1.2169544029315102e-05,
"loss": 0.0193,
"step": 103680
},
{
"epoch": 3.9264100336216994,
"grad_norm": 1.2352112531661987,
"learning_rate": 1.215020210796721e-05,
"loss": 0.0181,
"step": 103936
},
{
"epoch": 3.9360809942956445,
"grad_norm": 0.506557047367096,
"learning_rate": 1.213086018661932e-05,
"loss": 0.0187,
"step": 104192
},
{
"epoch": 3.945751954969589,
"grad_norm": 2.8846030235290527,
"learning_rate": 1.2111593819651694e-05,
"loss": 0.0196,
"step": 104448
},
{
"epoch": 3.9554229156435343,
"grad_norm": 1.4602288007736206,
"learning_rate": 1.2092251898303806e-05,
"loss": 0.0192,
"step": 104704
},
{
"epoch": 3.9650938763174794,
"grad_norm": 13.7206392288208,
"learning_rate": 1.207298553133618e-05,
"loss": 0.0191,
"step": 104960
},
{
"epoch": 3.9747648369914246,
"grad_norm": 1.7238157987594604,
"learning_rate": 1.205364360998829e-05,
"loss": 0.0201,
"step": 105216
},
{
"epoch": 3.9844357976653697,
"grad_norm": 2.0438215732574463,
"learning_rate": 1.20343016886404e-05,
"loss": 0.0182,
"step": 105472
},
{
"epoch": 3.994106758339315,
"grad_norm": 1.2184364795684814,
"learning_rate": 1.2014959767292509e-05,
"loss": 0.019,
"step": 105728
},
{
"epoch": 4.0,
"eval_f1_B-DISEASE": 0.808675320486979,
"eval_f1_B-MEDICATION": 0.9266381766381766,
"eval_f1_B-PROCEDURE": 0.8295174204717594,
"eval_f1_B-SYMPTOM": 0.7980295566502463,
"eval_f1_I-DISEASE": 0.8489476041200179,
"eval_f1_I-MEDICATION": 0.9397869262133368,
"eval_f1_I-PROCEDURE": 0.847453216112688,
"eval_f1_I-SYMPTOM": 0.8079173624618605,
"eval_f1_O": 0.9249064875950979,
"eval_f1_macro": 0.8590968967500181,
"eval_f1_micro": 0.8881361203919136,
"eval_loss": 0.4215824604034424,
"eval_precision_B-DISEASE": 0.8221985408640052,
"eval_precision_B-MEDICATION": 0.927133440228042,
"eval_precision_B-PROCEDURE": 0.8393623543838136,
"eval_precision_B-SYMPTOM": 0.8061812467260345,
"eval_precision_I-DISEASE": 0.8662832447676619,
"eval_precision_I-MEDICATION": 0.9348440443793176,
"eval_precision_I-PROCEDURE": 0.8446231286120726,
"eval_precision_I-SYMPTOM": 0.8113340449395586,
"eval_precision_O": 0.9229153657042629,
"eval_precision_macro": 0.8638750456227521,
"eval_precision_micro": 0.88976580540172,
"eval_rauc_macro": 0.9166627680103409,
"eval_rauc_micro": 0.9362568980657558,
"eval_recall_B-DISEASE": 0.795589751725232,
"eval_recall_B-MEDICATION": 0.9261434418935753,
"eval_recall_B-PROCEDURE": 0.8199007529089665,
"eval_recall_B-SYMPTOM": 0.7900410677618069,
"eval_recall_I-DISEASE": 0.8322921762691454,
"eval_recall_I-MEDICATION": 0.9447823557412599,
"eval_recall_I-PROCEDURE": 0.8503023329824475,
"eval_recall_I-SYMPTOM": 0.8045293359123147,
"eval_recall_O": 0.9269062194588178,
"eval_recall_macro": 0.8544986038503963,
"eval_recall_micro": 0.886512394293185,
"eval_roc_auc_B-DISEASE": 0.8961942453514548,
"eval_roc_auc_B-MEDICATION": 0.9629229597024016,
"eval_roc_auc_B-PROCEDURE": 0.9085987950526558,
"eval_roc_auc_B-SYMPTOM": 0.8929666290562625,
"eval_roc_auc_I-DISEASE": 0.9077573774887775,
"eval_roc_auc_I-MEDICATION": 0.9719339273090749,
"eval_roc_auc_I-PROCEDURE": 0.9175308611542671,
"eval_roc_auc_I-SYMPTOM": 0.8876856873124548,
"eval_roc_auc_O": 0.9043744296657181,
"eval_runtime": 61.4869,
"eval_samples_per_second": 176.835,
"eval_steps_per_second": 22.119,
"step": 105884
},
{
"epoch": 4.00377771901326,
"grad_norm": 0.7948421835899353,
"learning_rate": 1.199561784594462e-05,
"loss": 0.0178,
"step": 105984
},
{
"epoch": 4.013448679687205,
"grad_norm": 0.8098104596138,
"learning_rate": 1.1976275924596729e-05,
"loss": 0.0143,
"step": 106240
},
{
"epoch": 4.02311964036115,
"grad_norm": 3.08135724067688,
"learning_rate": 1.195693400324884e-05,
"loss": 0.0134,
"step": 106496
},
{
"epoch": 4.032790601035095,
"grad_norm": 1.1449787616729736,
"learning_rate": 1.1937592081900948e-05,
"loss": 0.0133,
"step": 106752
},
{
"epoch": 4.0424615617090405,
"grad_norm": 2.6626508235931396,
"learning_rate": 1.1918325714933323e-05,
"loss": 0.0136,
"step": 107008
},
{
"epoch": 4.052132522382985,
"grad_norm": 1.2061920166015625,
"learning_rate": 1.1898983793585435e-05,
"loss": 0.0145,
"step": 107264
},
{
"epoch": 4.06180348305693,
"grad_norm": 0.4288395941257477,
"learning_rate": 1.1879641872237544e-05,
"loss": 0.0127,
"step": 107520
},
{
"epoch": 4.071474443730875,
"grad_norm": 3.4469873905181885,
"learning_rate": 1.1860299950889654e-05,
"loss": 0.0143,
"step": 107776
},
{
"epoch": 4.08114540440482,
"grad_norm": 3.4651808738708496,
"learning_rate": 1.1840958029541762e-05,
"loss": 0.0137,
"step": 108032
},
{
"epoch": 4.090816365078766,
"grad_norm": 4.205618381500244,
"learning_rate": 1.1821616108193874e-05,
"loss": 0.0136,
"step": 108288
},
{
"epoch": 4.10048732575271,
"grad_norm": 0.8337300419807434,
"learning_rate": 1.1802274186845984e-05,
"loss": 0.0126,
"step": 108544
},
{
"epoch": 4.110158286426656,
"grad_norm": 5.309538841247559,
"learning_rate": 1.1782932265498093e-05,
"loss": 0.0137,
"step": 108800
},
{
"epoch": 4.119829247100601,
"grad_norm": 0.6177698969841003,
"learning_rate": 1.1763590344150204e-05,
"loss": 0.0147,
"step": 109056
},
{
"epoch": 4.129500207774546,
"grad_norm": 2.2366254329681396,
"learning_rate": 1.1744248422802313e-05,
"loss": 0.0144,
"step": 109312
},
{
"epoch": 4.139171168448491,
"grad_norm": 1.5923917293548584,
"learning_rate": 1.1724906501454423e-05,
"loss": 0.0124,
"step": 109568
},
{
"epoch": 4.1488421291224356,
"grad_norm": 0.6197337508201599,
"learning_rate": 1.1705564580106531e-05,
"loss": 0.0128,
"step": 109824
},
{
"epoch": 4.158513089796381,
"grad_norm": 1.5513421297073364,
"learning_rate": 1.1686222658758643e-05,
"loss": 0.0133,
"step": 110080
},
{
"epoch": 4.168184050470326,
"grad_norm": 0.4733668863773346,
"learning_rate": 1.1666880737410753e-05,
"loss": 0.013,
"step": 110336
},
{
"epoch": 4.177855011144271,
"grad_norm": 0.9195311069488525,
"learning_rate": 1.1647538816062862e-05,
"loss": 0.0147,
"step": 110592
},
{
"epoch": 4.187525971818216,
"grad_norm": 0.4619844853878021,
"learning_rate": 1.1628272449095237e-05,
"loss": 0.0149,
"step": 110848
},
{
"epoch": 4.197196932492162,
"grad_norm": 0.4427216351032257,
"learning_rate": 1.1608930527747346e-05,
"loss": 0.0146,
"step": 111104
},
{
"epoch": 4.206867893166106,
"grad_norm": 2.1087565422058105,
"learning_rate": 1.1589588606399458e-05,
"loss": 0.0141,
"step": 111360
},
{
"epoch": 4.216538853840051,
"grad_norm": 1.2194585800170898,
"learning_rate": 1.1570246685051568e-05,
"loss": 0.0164,
"step": 111616
},
{
"epoch": 4.226209814513997,
"grad_norm": 1.4488071203231812,
"learning_rate": 1.1550904763703676e-05,
"loss": 0.0158,
"step": 111872
},
{
"epoch": 4.235880775187941,
"grad_norm": 5.222316265106201,
"learning_rate": 1.1531562842355786e-05,
"loss": 0.0144,
"step": 112128
},
{
"epoch": 4.245551735861887,
"grad_norm": 0.9832548499107361,
"learning_rate": 1.1512220921007897e-05,
"loss": 0.0148,
"step": 112384
},
{
"epoch": 4.2552226965358315,
"grad_norm": 3.2491071224212646,
"learning_rate": 1.1492878999660007e-05,
"loss": 0.0141,
"step": 112640
},
{
"epoch": 4.264893657209777,
"grad_norm": 0.40463200211524963,
"learning_rate": 1.1473537078312115e-05,
"loss": 0.0153,
"step": 112896
},
{
"epoch": 4.274564617883722,
"grad_norm": 0.7759467363357544,
"learning_rate": 1.1454195156964225e-05,
"loss": 0.0137,
"step": 113152
},
{
"epoch": 4.2842355785576665,
"grad_norm": 5.856504917144775,
"learning_rate": 1.1434853235616337e-05,
"loss": 0.0154,
"step": 113408
},
{
"epoch": 4.293906539231612,
"grad_norm": 1.3605588674545288,
"learning_rate": 1.1415586868648711e-05,
"loss": 0.0154,
"step": 113664
},
{
"epoch": 4.303577499905557,
"grad_norm": 0.4841889441013336,
"learning_rate": 1.1396244947300821e-05,
"loss": 0.0143,
"step": 113920
},
{
"epoch": 4.313248460579502,
"grad_norm": 2.290330171585083,
"learning_rate": 1.137690302595293e-05,
"loss": 0.0124,
"step": 114176
},
{
"epoch": 4.322919421253447,
"grad_norm": 0.6299089193344116,
"learning_rate": 1.135756110460504e-05,
"loss": 0.015,
"step": 114432
},
{
"epoch": 4.3325903819273925,
"grad_norm": 2.6966304779052734,
"learning_rate": 1.1338219183257152e-05,
"loss": 0.0147,
"step": 114688
},
{
"epoch": 4.342261342601337,
"grad_norm": 3.5934536457061768,
"learning_rate": 1.131887726190926e-05,
"loss": 0.0135,
"step": 114944
},
{
"epoch": 4.351932303275283,
"grad_norm": 2.391207218170166,
"learning_rate": 1.129953534056137e-05,
"loss": 0.0127,
"step": 115200
},
{
"epoch": 4.3616032639492275,
"grad_norm": 7.104966640472412,
"learning_rate": 1.1280193419213479e-05,
"loss": 0.0127,
"step": 115456
},
{
"epoch": 4.371274224623172,
"grad_norm": 4.91796875,
"learning_rate": 1.126085149786559e-05,
"loss": 0.0136,
"step": 115712
},
{
"epoch": 4.380945185297118,
"grad_norm": 0.9888034462928772,
"learning_rate": 1.1241509576517699e-05,
"loss": 0.0143,
"step": 115968
},
{
"epoch": 4.390616145971062,
"grad_norm": 5.1639018058776855,
"learning_rate": 1.1222167655169809e-05,
"loss": 0.0127,
"step": 116224
},
{
"epoch": 4.400287106645008,
"grad_norm": 8.415788650512695,
"learning_rate": 1.1202825733821917e-05,
"loss": 0.0145,
"step": 116480
},
{
"epoch": 4.409958067318953,
"grad_norm": 4.235672950744629,
"learning_rate": 1.118348381247403e-05,
"loss": 0.0154,
"step": 116736
},
{
"epoch": 4.419629027992898,
"grad_norm": 1.2345690727233887,
"learning_rate": 1.116414189112614e-05,
"loss": 0.0143,
"step": 116992
},
{
"epoch": 4.429299988666843,
"grad_norm": 8.792167663574219,
"learning_rate": 1.1144799969778248e-05,
"loss": 0.0162,
"step": 117248
},
{
"epoch": 4.438970949340788,
"grad_norm": 2.2384276390075684,
"learning_rate": 1.1125533602810623e-05,
"loss": 0.0141,
"step": 117504
},
{
"epoch": 4.448641910014733,
"grad_norm": 1.041791558265686,
"learning_rate": 1.1106191681462735e-05,
"loss": 0.0136,
"step": 117760
},
{
"epoch": 4.458312870688678,
"grad_norm": 4.7409515380859375,
"learning_rate": 1.1086849760114844e-05,
"loss": 0.0136,
"step": 118016
},
{
"epoch": 4.4679838313626234,
"grad_norm": 0.2378958761692047,
"learning_rate": 1.1067507838766954e-05,
"loss": 0.0147,
"step": 118272
},
{
"epoch": 4.477654792036568,
"grad_norm": 0.31944742798805237,
"learning_rate": 1.1048165917419062e-05,
"loss": 0.0135,
"step": 118528
},
{
"epoch": 4.487325752710514,
"grad_norm": 1.0051418542861938,
"learning_rate": 1.1028899550451438e-05,
"loss": 0.0137,
"step": 118784
},
{
"epoch": 4.496996713384458,
"grad_norm": 1.6819483041763306,
"learning_rate": 1.1009557629103548e-05,
"loss": 0.0156,
"step": 119040
},
{
"epoch": 4.506667674058404,
"grad_norm": 0.40426477789878845,
"learning_rate": 1.0990215707755658e-05,
"loss": 0.0146,
"step": 119296
},
{
"epoch": 4.516338634732349,
"grad_norm": 3.140392303466797,
"learning_rate": 1.0970873786407768e-05,
"loss": 0.0129,
"step": 119552
},
{
"epoch": 4.526009595406293,
"grad_norm": 4.579553604125977,
"learning_rate": 1.0951531865059877e-05,
"loss": 0.0124,
"step": 119808
},
{
"epoch": 4.535680556080239,
"grad_norm": 5.144607067108154,
"learning_rate": 1.0932189943711989e-05,
"loss": 0.0153,
"step": 120064
},
{
"epoch": 4.545351516754184,
"grad_norm": 0.48044607043266296,
"learning_rate": 1.0912848022364097e-05,
"loss": 0.013,
"step": 120320
},
{
"epoch": 4.555022477428129,
"grad_norm": 42.02862548828125,
"learning_rate": 1.0893506101016207e-05,
"loss": 0.0137,
"step": 120576
},
{
"epoch": 4.564693438102074,
"grad_norm": 6.357956886291504,
"learning_rate": 1.0874239734048581e-05,
"loss": 0.0154,
"step": 120832
},
{
"epoch": 4.574364398776019,
"grad_norm": 1.7824290990829468,
"learning_rate": 1.0854897812700693e-05,
"loss": 0.0127,
"step": 121088
},
{
"epoch": 4.584035359449964,
"grad_norm": 1.5723809003829956,
"learning_rate": 1.0835555891352803e-05,
"loss": 0.0129,
"step": 121344
},
{
"epoch": 4.593706320123909,
"grad_norm": 0.8262581825256348,
"learning_rate": 1.0816213970004911e-05,
"loss": 0.0151,
"step": 121600
},
{
"epoch": 4.603377280797854,
"grad_norm": 0.8032371401786804,
"learning_rate": 1.0796872048657022e-05,
"loss": 0.0158,
"step": 121856
},
{
"epoch": 4.613048241471799,
"grad_norm": 0.9602940082550049,
"learning_rate": 1.0777530127309133e-05,
"loss": 0.0142,
"step": 122112
},
{
"epoch": 4.622719202145745,
"grad_norm": 1.9872223138809204,
"learning_rate": 1.0758188205961242e-05,
"loss": 0.0134,
"step": 122368
},
{
"epoch": 4.632390162819689,
"grad_norm": 5.095240116119385,
"learning_rate": 1.0738846284613352e-05,
"loss": 0.014,
"step": 122624
},
{
"epoch": 4.642061123493635,
"grad_norm": 5.41306209564209,
"learning_rate": 1.071950436326546e-05,
"loss": 0.0124,
"step": 122880
},
{
"epoch": 4.6517320841675796,
"grad_norm": 10.439872741699219,
"learning_rate": 1.0700162441917572e-05,
"loss": 0.0148,
"step": 123136
},
{
"epoch": 4.661403044841524,
"grad_norm": 0.26815417408943176,
"learning_rate": 1.068082052056968e-05,
"loss": 0.0132,
"step": 123392
},
{
"epoch": 4.67107400551547,
"grad_norm": 0.6603275537490845,
"learning_rate": 1.0661554153602056e-05,
"loss": 0.0116,
"step": 123648
},
{
"epoch": 4.6807449661894145,
"grad_norm": 7.041431903839111,
"learning_rate": 1.0642212232254165e-05,
"loss": 0.0129,
"step": 123904
},
{
"epoch": 4.69041592686336,
"grad_norm": 0.7987198233604431,
"learning_rate": 1.0622870310906275e-05,
"loss": 0.0129,
"step": 124160
},
{
"epoch": 4.700086887537305,
"grad_norm": 0.14286652207374573,
"learning_rate": 1.0603528389558387e-05,
"loss": 0.0124,
"step": 124416
},
{
"epoch": 4.70975784821125,
"grad_norm": 0.9553490877151489,
"learning_rate": 1.0584186468210495e-05,
"loss": 0.0124,
"step": 124672
},
{
"epoch": 4.719428808885195,
"grad_norm": 0.6493328809738159,
"learning_rate": 1.0564844546862605e-05,
"loss": 0.012,
"step": 124928
},
{
"epoch": 4.729099769559141,
"grad_norm": 0.2133503556251526,
"learning_rate": 1.0545502625514714e-05,
"loss": 0.014,
"step": 125184
},
{
"epoch": 4.738770730233085,
"grad_norm": 2.6697592735290527,
"learning_rate": 1.0526160704166826e-05,
"loss": 0.013,
"step": 125440
},
{
"epoch": 4.748441690907031,
"grad_norm": 0.8658607602119446,
"learning_rate": 1.0506894337199201e-05,
"loss": 0.0131,
"step": 125696
},
{
"epoch": 4.7581126515809755,
"grad_norm": 1.9833451509475708,
"learning_rate": 1.048755241585131e-05,
"loss": 0.013,
"step": 125952
},
{
"epoch": 4.76778361225492,
"grad_norm": 0.19457457959651947,
"learning_rate": 1.046821049450342e-05,
"loss": 0.0142,
"step": 126208
},
{
"epoch": 4.777454572928866,
"grad_norm": 0.9841840863227844,
"learning_rate": 1.044886857315553e-05,
"loss": 0.0123,
"step": 126464
},
{
"epoch": 4.7871255336028105,
"grad_norm": 1.9175962209701538,
"learning_rate": 1.042952665180764e-05,
"loss": 0.0136,
"step": 126720
},
{
"epoch": 4.796796494276756,
"grad_norm": 1.7247178554534912,
"learning_rate": 1.0410184730459748e-05,
"loss": 0.0136,
"step": 126976
},
{
"epoch": 4.806467454950701,
"grad_norm": 2.0652236938476562,
"learning_rate": 1.0390842809111859e-05,
"loss": 0.0112,
"step": 127232
},
{
"epoch": 4.816138415624646,
"grad_norm": 1.1892759799957275,
"learning_rate": 1.037150088776397e-05,
"loss": 0.0125,
"step": 127488
},
{
"epoch": 4.825809376298591,
"grad_norm": 29.004505157470703,
"learning_rate": 1.0352158966416079e-05,
"loss": 0.0112,
"step": 127744
},
{
"epoch": 4.835480336972536,
"grad_norm": 0.5393902659416199,
"learning_rate": 1.0332817045068189e-05,
"loss": 0.0124,
"step": 128000
},
{
"epoch": 4.845151297646481,
"grad_norm": 0.9426546096801758,
"learning_rate": 1.0313475123720297e-05,
"loss": 0.011,
"step": 128256
},
{
"epoch": 4.854822258320426,
"grad_norm": 1.1209189891815186,
"learning_rate": 1.029413320237241e-05,
"loss": 0.0117,
"step": 128512
},
{
"epoch": 4.8644932189943715,
"grad_norm": 0.8620722889900208,
"learning_rate": 1.027479128102452e-05,
"loss": 0.0121,
"step": 128768
},
{
"epoch": 4.874164179668316,
"grad_norm": 0.14039096236228943,
"learning_rate": 1.0255524914056893e-05,
"loss": 0.0145,
"step": 129024
},
{
"epoch": 4.883835140342262,
"grad_norm": 0.5701342821121216,
"learning_rate": 1.0236182992709003e-05,
"loss": 0.0114,
"step": 129280
},
{
"epoch": 4.893506101016206,
"grad_norm": 0.802097499370575,
"learning_rate": 1.0216841071361112e-05,
"loss": 0.0124,
"step": 129536
},
{
"epoch": 4.903177061690151,
"grad_norm": 0.49824589490890503,
"learning_rate": 1.0197499150013224e-05,
"loss": 0.0133,
"step": 129792
},
{
"epoch": 4.912848022364097,
"grad_norm": 1.2195169925689697,
"learning_rate": 1.0178157228665332e-05,
"loss": 0.0134,
"step": 130048
},
{
"epoch": 4.922518983038041,
"grad_norm": 23.420486450195312,
"learning_rate": 1.0158815307317442e-05,
"loss": 0.0125,
"step": 130304
},
{
"epoch": 4.932189943711987,
"grad_norm": 0.8538005948066711,
"learning_rate": 1.013947338596955e-05,
"loss": 0.0124,
"step": 130560
},
{
"epoch": 4.941860904385932,
"grad_norm": 3.506213903427124,
"learning_rate": 1.0120131464621663e-05,
"loss": 0.0125,
"step": 130816
},
{
"epoch": 4.951531865059877,
"grad_norm": 0.5479403734207153,
"learning_rate": 1.0100789543273773e-05,
"loss": 0.0137,
"step": 131072
},
{
"epoch": 4.961202825733822,
"grad_norm": 0.24773092567920685,
"learning_rate": 1.0081447621925881e-05,
"loss": 0.011,
"step": 131328
},
{
"epoch": 4.970873786407767,
"grad_norm": 0.3392595946788788,
"learning_rate": 1.0062105700577991e-05,
"loss": 0.0113,
"step": 131584
},
{
"epoch": 4.980544747081712,
"grad_norm": 9.13214111328125,
"learning_rate": 1.0042763779230103e-05,
"loss": 0.0103,
"step": 131840
},
{
"epoch": 4.990215707755657,
"grad_norm": 0.6798635721206665,
"learning_rate": 1.0023421857882212e-05,
"loss": 0.0112,
"step": 132096
},
{
"epoch": 4.999886668429602,
"grad_norm": 3.8642024993896484,
"learning_rate": 1.0004155490914587e-05,
"loss": 0.0132,
"step": 132352
},
{
"epoch": 5.0,
"eval_f1_B-DISEASE": 0.8076930929582066,
"eval_f1_B-MEDICATION": 0.9320128479657388,
"eval_f1_B-PROCEDURE": 0.8299265901797881,
"eval_f1_B-SYMPTOM": 0.802206734344465,
"eval_f1_I-DISEASE": 0.8443607103813086,
"eval_f1_I-MEDICATION": 0.9473012496676416,
"eval_f1_I-PROCEDURE": 0.8478063590704366,
"eval_f1_I-SYMPTOM": 0.8098297732572185,
"eval_f1_O": 0.9250181548686375,
"eval_f1_macro": 0.8606839458548268,
"eval_f1_micro": 0.8883442580707792,
"eval_loss": 0.4413922429084778,
"eval_precision_B-DISEASE": 0.83231643172733,
"eval_precision_B-MEDICATION": 0.9345142243692969,
"eval_precision_B-PROCEDURE": 0.8534490552391285,
"eval_precision_B-SYMPTOM": 0.8108590008041114,
"eval_precision_I-DISEASE": 0.8482866891605315,
"eval_precision_I-MEDICATION": 0.952467518579907,
"eval_precision_I-PROCEDURE": 0.8695185973099094,
"eval_precision_I-SYMPTOM": 0.8183803238035672,
"eval_precision_O": 0.9206075463451251,
"eval_precision_macro": 0.8711554874821008,
"eval_precision_micro": 0.8905099095411801,
"eval_rauc_macro": 0.9146732071749695,
"eval_rauc_micro": 0.9361508470284178,
"eval_recall_B-DISEASE": 0.784484810026176,
"eval_recall_B-MEDICATION": 0.9295248264815803,
"eval_recall_B-PROCEDURE": 0.8076659822039699,
"eval_recall_B-SYMPTOM": 0.7937371663244354,
"eval_recall_I-DISEASE": 0.8404709040504773,
"eval_recall_I-MEDICATION": 0.9421907230126408,
"eval_recall_I-PROCEDURE": 0.8271520314654786,
"eval_recall_I-SYMPTOM": 0.8014560498603052,
"eval_recall_O": 0.9294712290821007,
"eval_recall_macro": 0.8506837469452404,
"eval_recall_micro": 0.8861891144410676,
"eval_roc_auc_B-DISEASE": 0.8907720240571226,
"eval_roc_auc_B-MEDICATION": 0.964629291931633,
"eval_roc_auc_B-PROCEDURE": 0.9026383818040776,
"eval_roc_auc_B-SYMPTOM": 0.8948664885493695,
"eval_roc_auc_I-DISEASE": 0.9104202960745905,
"eval_roc_auc_I-MEDICATION": 0.9707688588965032,
"eval_roc_auc_I-PROCEDURE": 0.9075291450310622,
"eval_roc_auc_I-SYMPTOM": 0.8868675259287415,
"eval_roc_auc_O": 0.9035668523016245,
"eval_runtime": 61.1266,
"eval_samples_per_second": 177.877,
"eval_steps_per_second": 22.249,
"step": 132355
},
{
"epoch": 5.009557629103547,
"grad_norm": 0.4311939775943756,
"learning_rate": 9.984813569566696e-06,
"loss": 0.0071,
"step": 132608
},
{
"epoch": 5.019228589777493,
"grad_norm": 1.0362738370895386,
"learning_rate": 9.965471648218806e-06,
"loss": 0.0086,
"step": 132864
},
{
"epoch": 5.028899550451437,
"grad_norm": 1.9174968004226685,
"learning_rate": 9.946129726870916e-06,
"loss": 0.0069,
"step": 133120
},
{
"epoch": 5.038570511125383,
"grad_norm": 0.2945270240306854,
"learning_rate": 9.926787805523026e-06,
"loss": 0.0086,
"step": 133376
},
{
"epoch": 5.048241471799328,
"grad_norm": 0.024452047422528267,
"learning_rate": 9.907445884175136e-06,
"loss": 0.0068,
"step": 133632
},
{
"epoch": 5.057912432473272,
"grad_norm": 0.9929279088973999,
"learning_rate": 9.888179517207512e-06,
"loss": 0.0077,
"step": 133888
},
{
"epoch": 5.067583393147218,
"grad_norm": 3.7908236980438232,
"learning_rate": 9.86883759585962e-06,
"loss": 0.0088,
"step": 134144
},
{
"epoch": 5.0772543538211625,
"grad_norm": 1.9607737064361572,
"learning_rate": 9.84949567451173e-06,
"loss": 0.0077,
"step": 134400
},
{
"epoch": 5.086925314495108,
"grad_norm": 4.287957668304443,
"learning_rate": 9.83015375316384e-06,
"loss": 0.0091,
"step": 134656
},
{
"epoch": 5.096596275169053,
"grad_norm": 0.9552005529403687,
"learning_rate": 9.81081183181595e-06,
"loss": 0.0081,
"step": 134912
},
{
"epoch": 5.106267235842998,
"grad_norm": 3.186450481414795,
"learning_rate": 9.79146991046806e-06,
"loss": 0.0074,
"step": 135168
},
{
"epoch": 5.115938196516943,
"grad_norm": 0.3131207525730133,
"learning_rate": 9.772127989120171e-06,
"loss": 0.0076,
"step": 135424
},
{
"epoch": 5.125609157190888,
"grad_norm": 0.2811489701271057,
"learning_rate": 9.75278606777228e-06,
"loss": 0.009,
"step": 135680
},
{
"epoch": 5.135280117864833,
"grad_norm": 0.3740166127681732,
"learning_rate": 9.73344414642439e-06,
"loss": 0.0078,
"step": 135936
},
{
"epoch": 5.144951078538778,
"grad_norm": 1.3230619430541992,
"learning_rate": 9.7141022250765e-06,
"loss": 0.008,
"step": 136192
},
{
"epoch": 5.1546220392127235,
"grad_norm": 0.6120270490646362,
"learning_rate": 9.694835858108874e-06,
"loss": 0.0073,
"step": 136448
},
{
"epoch": 5.164292999886668,
"grad_norm": 4.456196308135986,
"learning_rate": 9.675493936760985e-06,
"loss": 0.01,
"step": 136704
},
{
"epoch": 5.173963960560614,
"grad_norm": 0.2429385632276535,
"learning_rate": 9.656152015413094e-06,
"loss": 0.0088,
"step": 136960
},
{
"epoch": 5.1836349212345585,
"grad_norm": 1.2598743438720703,
"learning_rate": 9.636810094065204e-06,
"loss": 0.0103,
"step": 137216
},
{
"epoch": 5.193305881908504,
"grad_norm": 1.915220022201538,
"learning_rate": 9.617468172717314e-06,
"loss": 0.0098,
"step": 137472
},
{
"epoch": 5.202976842582449,
"grad_norm": 0.8882638812065125,
"learning_rate": 9.598126251369424e-06,
"loss": 0.0094,
"step": 137728
},
{
"epoch": 5.212647803256393,
"grad_norm": 0.10290802270174026,
"learning_rate": 9.578784330021533e-06,
"loss": 0.0085,
"step": 137984
},
{
"epoch": 5.222318763930339,
"grad_norm": 3.6905243396759033,
"learning_rate": 9.559442408673644e-06,
"loss": 0.0105,
"step": 138240
},
{
"epoch": 5.231989724604284,
"grad_norm": 0.27331113815307617,
"learning_rate": 9.540100487325753e-06,
"loss": 0.0096,
"step": 138496
},
{
"epoch": 5.241660685278229,
"grad_norm": 0.3453868627548218,
"learning_rate": 9.520758565977863e-06,
"loss": 0.0093,
"step": 138752
},
{
"epoch": 5.251331645952174,
"grad_norm": 6.686705589294434,
"learning_rate": 9.501416644629973e-06,
"loss": 0.0103,
"step": 139008
},
{
"epoch": 5.2610026066261195,
"grad_norm": 6.24531364440918,
"learning_rate": 9.482074723282083e-06,
"loss": 0.0089,
"step": 139264
},
{
"epoch": 5.270673567300064,
"grad_norm": 5.73491907119751,
"learning_rate": 9.462732801934192e-06,
"loss": 0.0099,
"step": 139520
},
{
"epoch": 5.280344527974009,
"grad_norm": 3.492011308670044,
"learning_rate": 9.443390880586304e-06,
"loss": 0.0078,
"step": 139776
},
{
"epoch": 5.2900154886479545,
"grad_norm": 0.5170190930366516,
"learning_rate": 9.424048959238412e-06,
"loss": 0.0078,
"step": 140032
},
{
"epoch": 5.299686449321899,
"grad_norm": 0.07176166027784348,
"learning_rate": 9.404707037890522e-06,
"loss": 0.008,
"step": 140288
},
{
"epoch": 5.309357409995845,
"grad_norm": 1.4914041757583618,
"learning_rate": 9.385440670922898e-06,
"loss": 0.009,
"step": 140544
},
{
"epoch": 5.319028370669789,
"grad_norm": 2.964844226837158,
"learning_rate": 9.366098749575008e-06,
"loss": 0.0085,
"step": 140800
},
{
"epoch": 5.328699331343735,
"grad_norm": 0.2556954324245453,
"learning_rate": 9.346756828227116e-06,
"loss": 0.0091,
"step": 141056
},
{
"epoch": 5.33837029201768,
"grad_norm": 3.6987621784210205,
"learning_rate": 9.327414906879228e-06,
"loss": 0.0079,
"step": 141312
},
{
"epoch": 5.348041252691624,
"grad_norm": 4.68747615814209,
"learning_rate": 9.308072985531337e-06,
"loss": 0.0087,
"step": 141568
},
{
"epoch": 5.35771221336557,
"grad_norm": 0.4118718206882477,
"learning_rate": 9.288731064183447e-06,
"loss": 0.0096,
"step": 141824
},
{
"epoch": 5.367383174039515,
"grad_norm": 0.3415529429912567,
"learning_rate": 9.269389142835557e-06,
"loss": 0.0088,
"step": 142080
},
{
"epoch": 5.37705413471346,
"grad_norm": 0.10233204811811447,
"learning_rate": 9.250047221487667e-06,
"loss": 0.0082,
"step": 142336
},
{
"epoch": 5.386725095387405,
"grad_norm": 0.2785378396511078,
"learning_rate": 9.230705300139775e-06,
"loss": 0.0107,
"step": 142592
},
{
"epoch": 5.39639605606135,
"grad_norm": 1.3955039978027344,
"learning_rate": 9.211438933172151e-06,
"loss": 0.0081,
"step": 142848
},
{
"epoch": 5.406067016735295,
"grad_norm": 6.009440898895264,
"learning_rate": 9.192097011824261e-06,
"loss": 0.0078,
"step": 143104
},
{
"epoch": 5.415737977409241,
"grad_norm": 0.10272625833749771,
"learning_rate": 9.172755090476371e-06,
"loss": 0.0097,
"step": 143360
},
{
"epoch": 5.425408938083185,
"grad_norm": 5.104133605957031,
"learning_rate": 9.153413169128481e-06,
"loss": 0.0079,
"step": 143616
},
{
"epoch": 5.43507989875713,
"grad_norm": 0.218174010515213,
"learning_rate": 9.13407124778059e-06,
"loss": 0.0088,
"step": 143872
},
{
"epoch": 5.444750859431076,
"grad_norm": 4.509812355041504,
"learning_rate": 9.1147293264327e-06,
"loss": 0.0088,
"step": 144128
},
{
"epoch": 5.45442182010502,
"grad_norm": 0.9697214961051941,
"learning_rate": 9.09538740508481e-06,
"loss": 0.0088,
"step": 144384
},
{
"epoch": 5.464092780778966,
"grad_norm": 1.000596046447754,
"learning_rate": 9.07604548373692e-06,
"loss": 0.0089,
"step": 144640
},
{
"epoch": 5.473763741452911,
"grad_norm": 0.22552327811717987,
"learning_rate": 9.05670356238903e-06,
"loss": 0.009,
"step": 144896
},
{
"epoch": 5.483434702126856,
"grad_norm": 0.7269870042800903,
"learning_rate": 9.03736164104114e-06,
"loss": 0.0097,
"step": 145152
},
{
"epoch": 5.493105662800801,
"grad_norm": 0.3465439975261688,
"learning_rate": 9.018095274073515e-06,
"loss": 0.0102,
"step": 145408
},
{
"epoch": 5.502776623474746,
"grad_norm": 0.6706210970878601,
"learning_rate": 8.998753352725625e-06,
"loss": 0.009,
"step": 145664
},
{
"epoch": 5.512447584148691,
"grad_norm": 36.635414123535156,
"learning_rate": 8.979411431377735e-06,
"loss": 0.0084,
"step": 145920
},
{
"epoch": 5.522118544822636,
"grad_norm": 1.6504905223846436,
"learning_rate": 8.960069510029845e-06,
"loss": 0.008,
"step": 146176
},
{
"epoch": 5.531789505496581,
"grad_norm": 0.5836831331253052,
"learning_rate": 8.940727588681955e-06,
"loss": 0.0087,
"step": 146432
},
{
"epoch": 5.541460466170526,
"grad_norm": 0.684615433216095,
"learning_rate": 8.921385667334065e-06,
"loss": 0.0076,
"step": 146688
},
{
"epoch": 5.551131426844472,
"grad_norm": 2.892833709716797,
"learning_rate": 8.902043745986174e-06,
"loss": 0.0085,
"step": 146944
},
{
"epoch": 5.560802387518416,
"grad_norm": 20.16980743408203,
"learning_rate": 8.882701824638284e-06,
"loss": 0.0084,
"step": 147200
},
{
"epoch": 5.570473348192362,
"grad_norm": 3.590690851211548,
"learning_rate": 8.86343545767066e-06,
"loss": 0.008,
"step": 147456
},
{
"epoch": 5.5801443088663065,
"grad_norm": 0.8185898661613464,
"learning_rate": 8.844093536322768e-06,
"loss": 0.0074,
"step": 147712
},
{
"epoch": 5.589815269540251,
"grad_norm": 0.3533550202846527,
"learning_rate": 8.82475161497488e-06,
"loss": 0.0079,
"step": 147968
},
{
"epoch": 5.599486230214197,
"grad_norm": 1.9578065872192383,
"learning_rate": 8.805409693626988e-06,
"loss": 0.0077,
"step": 148224
},
{
"epoch": 5.6091571908881415,
"grad_norm": 0.17547504603862762,
"learning_rate": 8.786067772279098e-06,
"loss": 0.0086,
"step": 148480
},
{
"epoch": 5.618828151562087,
"grad_norm": 1.6071051359176636,
"learning_rate": 8.766725850931208e-06,
"loss": 0.0085,
"step": 148736
},
{
"epoch": 5.628499112236032,
"grad_norm": 0.8156256079673767,
"learning_rate": 8.747383929583318e-06,
"loss": 0.007,
"step": 148992
},
{
"epoch": 5.638170072909977,
"grad_norm": 11.689854621887207,
"learning_rate": 8.728042008235429e-06,
"loss": 0.0096,
"step": 149248
},
{
"epoch": 5.647841033583922,
"grad_norm": 0.9380402565002441,
"learning_rate": 8.708700086887539e-06,
"loss": 0.0082,
"step": 149504
},
{
"epoch": 5.657511994257867,
"grad_norm": 0.5615717172622681,
"learning_rate": 8.689433719919913e-06,
"loss": 0.0079,
"step": 149760
},
{
"epoch": 5.667182954931812,
"grad_norm": 1.7645057439804077,
"learning_rate": 8.670091798572023e-06,
"loss": 0.0103,
"step": 150016
},
{
"epoch": 5.676853915605757,
"grad_norm": 4.009266376495361,
"learning_rate": 8.650749877224133e-06,
"loss": 0.0089,
"step": 150272
},
{
"epoch": 5.6865248762797025,
"grad_norm": 0.6033828854560852,
"learning_rate": 8.631407955876243e-06,
"loss": 0.0074,
"step": 150528
},
{
"epoch": 5.696195836953647,
"grad_norm": 5.695953369140625,
"learning_rate": 8.612066034528353e-06,
"loss": 0.0087,
"step": 150784
},
{
"epoch": 5.705866797627593,
"grad_norm": 2.7361793518066406,
"learning_rate": 8.592724113180463e-06,
"loss": 0.0083,
"step": 151040
},
{
"epoch": 5.715537758301537,
"grad_norm": 0.26094111800193787,
"learning_rate": 8.573382191832572e-06,
"loss": 0.0083,
"step": 151296
},
{
"epoch": 5.725208718975482,
"grad_norm": 0.7956266403198242,
"learning_rate": 8.554040270484682e-06,
"loss": 0.0098,
"step": 151552
},
{
"epoch": 5.734879679649428,
"grad_norm": 0.28114378452301025,
"learning_rate": 8.534698349136792e-06,
"loss": 0.0093,
"step": 151808
},
{
"epoch": 5.744550640323372,
"grad_norm": 2.0160458087921143,
"learning_rate": 8.515356427788902e-06,
"loss": 0.0099,
"step": 152064
},
{
"epoch": 5.754221600997318,
"grad_norm": 1.1137139797210693,
"learning_rate": 8.496014506441012e-06,
"loss": 0.0082,
"step": 152320
},
{
"epoch": 5.763892561671263,
"grad_norm": 3.6147210597991943,
"learning_rate": 8.476672585093122e-06,
"loss": 0.0083,
"step": 152576
},
{
"epoch": 5.773563522345208,
"grad_norm": 4.814803123474121,
"learning_rate": 8.457330663745231e-06,
"loss": 0.007,
"step": 152832
},
{
"epoch": 5.783234483019153,
"grad_norm": 0.7147836089134216,
"learning_rate": 8.437988742397341e-06,
"loss": 0.0088,
"step": 153088
},
{
"epoch": 5.7929054436930985,
"grad_norm": 1.4864364862442017,
"learning_rate": 8.418646821049451e-06,
"loss": 0.0063,
"step": 153344
},
{
"epoch": 5.802576404367043,
"grad_norm": 0.7108877301216125,
"learning_rate": 8.399304899701561e-06,
"loss": 0.0076,
"step": 153600
},
{
"epoch": 5.812247365040989,
"grad_norm": 2.6084437370300293,
"learning_rate": 8.379962978353671e-06,
"loss": 0.0086,
"step": 153856
},
{
"epoch": 5.821918325714933,
"grad_norm": 0.09771878272294998,
"learning_rate": 8.360696611386045e-06,
"loss": 0.009,
"step": 154112
},
{
"epoch": 5.831589286388878,
"grad_norm": 0.6635453104972839,
"learning_rate": 8.341354690038155e-06,
"loss": 0.0071,
"step": 154368
},
{
"epoch": 5.841260247062824,
"grad_norm": 1.141113042831421,
"learning_rate": 8.322088323070531e-06,
"loss": 0.0076,
"step": 154624
},
{
"epoch": 5.850931207736768,
"grad_norm": 0.8303898572921753,
"learning_rate": 8.30274640172264e-06,
"loss": 0.0096,
"step": 154880
},
{
"epoch": 5.860602168410714,
"grad_norm": 0.5006212592124939,
"learning_rate": 8.28340448037475e-06,
"loss": 0.0076,
"step": 155136
},
{
"epoch": 5.870273129084659,
"grad_norm": 1.09455406665802,
"learning_rate": 8.26406255902686e-06,
"loss": 0.007,
"step": 155392
},
{
"epoch": 5.879944089758604,
"grad_norm": 0.5454290509223938,
"learning_rate": 8.24472063767897e-06,
"loss": 0.0081,
"step": 155648
},
{
"epoch": 5.889615050432549,
"grad_norm": 14.345696449279785,
"learning_rate": 8.22537871633108e-06,
"loss": 0.0097,
"step": 155904
},
{
"epoch": 5.8992860111064935,
"grad_norm": 2.6186184883117676,
"learning_rate": 8.20603679498319e-06,
"loss": 0.0089,
"step": 156160
},
{
"epoch": 5.908956971780439,
"grad_norm": 1.894392967224121,
"learning_rate": 8.186694873635299e-06,
"loss": 0.0078,
"step": 156416
},
{
"epoch": 5.918627932454384,
"grad_norm": 0.8504657745361328,
"learning_rate": 8.167352952287409e-06,
"loss": 0.0089,
"step": 156672
},
{
"epoch": 5.928298893128329,
"grad_norm": 1.3975979089736938,
"learning_rate": 8.148011030939519e-06,
"loss": 0.0076,
"step": 156928
},
{
"epoch": 5.937969853802274,
"grad_norm": 0.12042956799268723,
"learning_rate": 8.128669109591629e-06,
"loss": 0.0073,
"step": 157184
},
{
"epoch": 5.94764081447622,
"grad_norm": 0.7101040482521057,
"learning_rate": 8.10932718824374e-06,
"loss": 0.0084,
"step": 157440
},
{
"epoch": 5.957311775150164,
"grad_norm": 0.049012139439582825,
"learning_rate": 8.08998526689585e-06,
"loss": 0.0078,
"step": 157696
},
{
"epoch": 5.966982735824109,
"grad_norm": 3.6799347400665283,
"learning_rate": 8.070643345547958e-06,
"loss": 0.0069,
"step": 157952
},
{
"epoch": 5.976653696498055,
"grad_norm": 5.190356731414795,
"learning_rate": 8.051301424200068e-06,
"loss": 0.0083,
"step": 158208
},
{
"epoch": 5.986324657171999,
"grad_norm": 0.405319482088089,
"learning_rate": 8.031959502852178e-06,
"loss": 0.0076,
"step": 158464
},
{
"epoch": 5.995995617845945,
"grad_norm": 7.220467567443848,
"learning_rate": 8.012617581504288e-06,
"loss": 0.0076,
"step": 158720
},
{
"epoch": 6.0,
"eval_f1_B-DISEASE": 0.8137172062733137,
"eval_f1_B-MEDICATION": 0.9366835994194485,
"eval_f1_B-PROCEDURE": 0.8338765045843654,
"eval_f1_B-SYMPTOM": 0.802911592516026,
"eval_f1_I-DISEASE": 0.8454658855143709,
"eval_f1_I-MEDICATION": 0.9528172976448839,
"eval_f1_I-PROCEDURE": 0.8516517120332436,
"eval_f1_I-SYMPTOM": 0.8137056001030496,
"eval_f1_O": 0.9249487903086626,
"eval_f1_macro": 0.8639753542663738,
"eval_f1_micro": 0.8895774266140277,
"eval_loss": 0.4695410430431366,
"eval_precision_B-DISEASE": 0.846968981938307,
"eval_precision_B-MEDICATION": 0.9552266419981499,
"eval_precision_B-PROCEDURE": 0.8472406181015453,
"eval_precision_B-SYMPTOM": 0.8153335920685884,
"eval_precision_I-DISEASE": 0.8649620429239743,
"eval_precision_I-MEDICATION": 0.9655191138140747,
"eval_precision_I-PROCEDURE": 0.8750075317409081,
"eval_precision_I-SYMPTOM": 0.8128417937335135,
"eval_precision_O": 0.9181102771519474,
"eval_precision_macro": 0.8779122881634454,
"eval_precision_micro": 0.8910716505650682,
"eval_rauc_macro": 0.9145927366341076,
"eval_rauc_micro": 0.9371255777552341,
"eval_recall_B-DISEASE": 0.7829777107955898,
"eval_recall_B-MEDICATION": 0.9188467698878804,
"eval_recall_B-PROCEDURE": 0.820927446954141,
"eval_recall_B-SYMPTOM": 0.7908624229979466,
"eval_recall_I-DISEASE": 0.8268292376974121,
"eval_recall_I-MEDICATION": 0.9404453377056117,
"eval_recall_I-PROCEDURE": 0.8295103103299143,
"eval_recall_I-SYMPTOM": 0.8145712443584784,
"eval_recall_O": 0.9318899408213067,
"eval_recall_macro": 0.8507622690609201,
"eval_recall_micro": 0.8880882055547169,
"eval_roc_auc_B-DISEASE": 0.8901727076261692,
"eval_roc_auc_B-MEDICATION": 0.9593353648433499,
"eval_roc_auc_B-PROCEDURE": 0.9091887857316173,
"eval_roc_auc_B-SYMPTOM": 0.8934942497238074,
"eval_roc_auc_I-DISEASE": 0.9049857727909453,
"eval_roc_auc_I-MEDICATION": 0.9699894527029364,
"eval_roc_auc_I-PROCEDURE": 0.9089825820626593,
"eval_roc_auc_I-SYMPTOM": 0.8926697963231113,
"eval_roc_auc_O": 0.9025159179023717,
"eval_runtime": 60.8686,
"eval_samples_per_second": 178.631,
"eval_steps_per_second": 22.343,
"step": 158826
},
{
"epoch": 6.0056665785198895,
"grad_norm": 2.5522048473358154,
"learning_rate": 7.993275660156398e-06,
"loss": 0.0067,
"step": 158976
},
{
"epoch": 6.015337539193835,
"grad_norm": 0.1445242464542389,
"learning_rate": 7.973933738808508e-06,
"loss": 0.0056,
"step": 159232
},
{
"epoch": 6.02500849986778,
"grad_norm": 0.8560025095939636,
"learning_rate": 7.954591817460619e-06,
"loss": 0.004,
"step": 159488
},
{
"epoch": 6.034679460541725,
"grad_norm": 0.5683347582817078,
"learning_rate": 7.935249896112727e-06,
"loss": 0.0048,
"step": 159744
},
{
"epoch": 6.04435042121567,
"grad_norm": 0.10347987711429596,
"learning_rate": 7.916059083525368e-06,
"loss": 0.0048,
"step": 160000
},
{
"epoch": 6.054021381889615,
"grad_norm": 0.765963613986969,
"learning_rate": 7.896717162177477e-06,
"loss": 0.0044,
"step": 160256
},
{
"epoch": 6.06369234256356,
"grad_norm": 0.23950816690921783,
"learning_rate": 7.877375240829588e-06,
"loss": 0.0039,
"step": 160512
},
{
"epoch": 6.073363303237505,
"grad_norm": 1.28322434425354,
"learning_rate": 7.858033319481697e-06,
"loss": 0.0058,
"step": 160768
},
{
"epoch": 6.0830342639114505,
"grad_norm": 0.0957738608121872,
"learning_rate": 7.838691398133807e-06,
"loss": 0.0051,
"step": 161024
},
{
"epoch": 6.092705224585395,
"grad_norm": 0.09481767565011978,
"learning_rate": 7.819349476785917e-06,
"loss": 0.006,
"step": 161280
},
{
"epoch": 6.102376185259341,
"grad_norm": 1.084963321685791,
"learning_rate": 7.800007555438027e-06,
"loss": 0.0052,
"step": 161536
},
{
"epoch": 6.1120471459332855,
"grad_norm": 0.19962504506111145,
"learning_rate": 7.780665634090136e-06,
"loss": 0.0063,
"step": 161792
},
{
"epoch": 6.12171810660723,
"grad_norm": 0.44316428899765015,
"learning_rate": 7.761323712742248e-06,
"loss": 0.0055,
"step": 162048
},
{
"epoch": 6.131389067281176,
"grad_norm": 0.096375972032547,
"learning_rate": 7.741981791394356e-06,
"loss": 0.0046,
"step": 162304
},
{
"epoch": 6.14106002795512,
"grad_norm": 0.06923657655715942,
"learning_rate": 7.722639870046466e-06,
"loss": 0.0065,
"step": 162560
},
{
"epoch": 6.150730988629066,
"grad_norm": 0.05641581490635872,
"learning_rate": 7.703373503078842e-06,
"loss": 0.0053,
"step": 162816
},
{
"epoch": 6.160401949303011,
"grad_norm": 0.10804527252912521,
"learning_rate": 7.684031581730952e-06,
"loss": 0.0049,
"step": 163072
},
{
"epoch": 6.170072909976956,
"grad_norm": 0.3508886694908142,
"learning_rate": 7.664689660383062e-06,
"loss": 0.0057,
"step": 163328
},
{
"epoch": 6.179743870650901,
"grad_norm": 0.19692179560661316,
"learning_rate": 7.645347739035172e-06,
"loss": 0.0051,
"step": 163584
},
{
"epoch": 6.1894148313248465,
"grad_norm": 7.462360382080078,
"learning_rate": 7.6260058176872806e-06,
"loss": 0.0052,
"step": 163840
},
{
"epoch": 6.199085791998791,
"grad_norm": 0.0778375118970871,
"learning_rate": 7.6066638963393915e-06,
"loss": 0.0057,
"step": 164096
},
{
"epoch": 6.208756752672736,
"grad_norm": 3.7269153594970703,
"learning_rate": 7.587321974991501e-06,
"loss": 0.0066,
"step": 164352
},
{
"epoch": 6.218427713346681,
"grad_norm": 0.3314465582370758,
"learning_rate": 7.567980053643611e-06,
"loss": 0.0066,
"step": 164608
},
{
"epoch": 6.228098674020626,
"grad_norm": 0.4546041786670685,
"learning_rate": 7.548713686675986e-06,
"loss": 0.0054,
"step": 164864
},
{
"epoch": 6.237769634694572,
"grad_norm": 0.1140669584274292,
"learning_rate": 7.529371765328095e-06,
"loss": 0.0053,
"step": 165120
},
{
"epoch": 6.247440595368516,
"grad_norm": 0.03010609745979309,
"learning_rate": 7.510029843980205e-06,
"loss": 0.0045,
"step": 165376
},
{
"epoch": 6.257111556042462,
"grad_norm": 0.015513704158365726,
"learning_rate": 7.4906879226323145e-06,
"loss": 0.0056,
"step": 165632
},
{
"epoch": 6.266782516716407,
"grad_norm": 0.09134875982999802,
"learning_rate": 7.4713460012844255e-06,
"loss": 0.0066,
"step": 165888
},
{
"epoch": 6.276453477390351,
"grad_norm": 0.016765909269452095,
"learning_rate": 7.452004079936535e-06,
"loss": 0.0053,
"step": 166144
},
{
"epoch": 6.286124438064297,
"grad_norm": 0.5640433430671692,
"learning_rate": 7.432662158588645e-06,
"loss": 0.0049,
"step": 166400
},
{
"epoch": 6.295795398738242,
"grad_norm": 0.21902374923229218,
"learning_rate": 7.413320237240754e-06,
"loss": 0.0064,
"step": 166656
},
{
"epoch": 6.305466359412187,
"grad_norm": 5.544469833374023,
"learning_rate": 7.393978315892864e-06,
"loss": 0.0052,
"step": 166912
},
{
"epoch": 6.315137320086132,
"grad_norm": 0.7227392792701721,
"learning_rate": 7.3746363945449736e-06,
"loss": 0.0054,
"step": 167168
},
{
"epoch": 6.324808280760077,
"grad_norm": 5.256189346313477,
"learning_rate": 7.3552944731970845e-06,
"loss": 0.0057,
"step": 167424
},
{
"epoch": 6.334479241434022,
"grad_norm": 4.659141540527344,
"learning_rate": 7.335952551849194e-06,
"loss": 0.0048,
"step": 167680
},
{
"epoch": 6.344150202107967,
"grad_norm": 0.9072468876838684,
"learning_rate": 7.316610630501304e-06,
"loss": 0.0046,
"step": 167936
},
{
"epoch": 6.353821162781912,
"grad_norm": 0.14295679330825806,
"learning_rate": 7.297268709153413e-06,
"loss": 0.0052,
"step": 168192
},
{
"epoch": 6.363492123455857,
"grad_norm": 0.07267609983682632,
"learning_rate": 7.277926787805523e-06,
"loss": 0.0044,
"step": 168448
},
{
"epoch": 6.373163084129803,
"grad_norm": 0.5884820818901062,
"learning_rate": 7.258584866457633e-06,
"loss": 0.0059,
"step": 168704
},
{
"epoch": 6.382834044803747,
"grad_norm": 0.9420909881591797,
"learning_rate": 7.239318499490009e-06,
"loss": 0.0063,
"step": 168960
},
{
"epoch": 6.392505005477693,
"grad_norm": 0.13994884490966797,
"learning_rate": 7.2199765781421184e-06,
"loss": 0.0047,
"step": 169216
},
{
"epoch": 6.4021759661516375,
"grad_norm": 0.12359564751386642,
"learning_rate": 7.2006346567942286e-06,
"loss": 0.0052,
"step": 169472
},
{
"epoch": 6.411846926825583,
"grad_norm": 2.2115604877471924,
"learning_rate": 7.181292735446338e-06,
"loss": 0.0057,
"step": 169728
},
{
"epoch": 6.421517887499528,
"grad_norm": 0.019372638314962387,
"learning_rate": 7.162101922858978e-06,
"loss": 0.0058,
"step": 169984
},
{
"epoch": 6.4311888481734725,
"grad_norm": 0.07033487409353256,
"learning_rate": 7.142760001511088e-06,
"loss": 0.007,
"step": 170240
},
{
"epoch": 6.440859808847418,
"grad_norm": 0.0495685413479805,
"learning_rate": 7.123418080163198e-06,
"loss": 0.004,
"step": 170496
},
{
"epoch": 6.450530769521363,
"grad_norm": 5.647730350494385,
"learning_rate": 7.104076158815309e-06,
"loss": 0.0056,
"step": 170752
},
{
"epoch": 6.460201730195308,
"grad_norm": 0.04144500568509102,
"learning_rate": 7.084734237467418e-06,
"loss": 0.0045,
"step": 171008
},
{
"epoch": 6.469872690869253,
"grad_norm": 0.04790091514587402,
"learning_rate": 7.065392316119528e-06,
"loss": 0.005,
"step": 171264
},
{
"epoch": 6.479543651543199,
"grad_norm": 0.5807636976242065,
"learning_rate": 7.046050394771637e-06,
"loss": 0.006,
"step": 171520
},
{
"epoch": 6.489214612217143,
"grad_norm": 0.04957037419080734,
"learning_rate": 7.026708473423747e-06,
"loss": 0.0055,
"step": 171776
},
{
"epoch": 6.498885572891089,
"grad_norm": 0.29678839445114136,
"learning_rate": 7.0073665520758576e-06,
"loss": 0.0055,
"step": 172032
},
{
"epoch": 6.5085565335650335,
"grad_norm": 0.12547393143177032,
"learning_rate": 6.988024630727968e-06,
"loss": 0.004,
"step": 172288
},
{
"epoch": 6.518227494238978,
"grad_norm": 0.032738201320171356,
"learning_rate": 6.9687582637603425e-06,
"loss": 0.0062,
"step": 172544
},
{
"epoch": 6.527898454912924,
"grad_norm": 0.013363759964704514,
"learning_rate": 6.949416342412452e-06,
"loss": 0.0053,
"step": 172800
},
{
"epoch": 6.537569415586868,
"grad_norm": 0.12095487862825394,
"learning_rate": 6.930074421064562e-06,
"loss": 0.0059,
"step": 173056
},
{
"epoch": 6.547240376260814,
"grad_norm": 1.4809820652008057,
"learning_rate": 6.910732499716671e-06,
"loss": 0.0045,
"step": 173312
},
{
"epoch": 6.556911336934759,
"grad_norm": 0.11994415521621704,
"learning_rate": 6.891390578368782e-06,
"loss": 0.0045,
"step": 173568
},
{
"epoch": 6.566582297608704,
"grad_norm": 0.5074435472488403,
"learning_rate": 6.8720486570208915e-06,
"loss": 0.0047,
"step": 173824
},
{
"epoch": 6.576253258282649,
"grad_norm": 1.6332694292068481,
"learning_rate": 6.852706735673002e-06,
"loss": 0.0035,
"step": 174080
},
{
"epoch": 6.585924218956594,
"grad_norm": 0.6540184020996094,
"learning_rate": 6.833364814325111e-06,
"loss": 0.005,
"step": 174336
},
{
"epoch": 6.595595179630539,
"grad_norm": 4.0721588134765625,
"learning_rate": 6.814022892977221e-06,
"loss": 0.0043,
"step": 174592
},
{
"epoch": 6.605266140304484,
"grad_norm": 0.34634193778038025,
"learning_rate": 6.79468097162933e-06,
"loss": 0.0063,
"step": 174848
},
{
"epoch": 6.6149371009784295,
"grad_norm": 0.140211820602417,
"learning_rate": 6.775339050281441e-06,
"loss": 0.0036,
"step": 175104
},
{
"epoch": 6.624608061652374,
"grad_norm": 1.9943935871124268,
"learning_rate": 6.7559971289335505e-06,
"loss": 0.0067,
"step": 175360
},
{
"epoch": 6.63427902232632,
"grad_norm": 10.475574493408203,
"learning_rate": 6.736655207585661e-06,
"loss": 0.0054,
"step": 175616
},
{
"epoch": 6.643949983000264,
"grad_norm": 12.580154418945312,
"learning_rate": 6.71731328623777e-06,
"loss": 0.0065,
"step": 175872
},
{
"epoch": 6.653620943674209,
"grad_norm": 0.5796445608139038,
"learning_rate": 6.69797136488988e-06,
"loss": 0.0047,
"step": 176128
},
{
"epoch": 6.663291904348155,
"grad_norm": 0.03411826118826866,
"learning_rate": 6.678629443541989e-06,
"loss": 0.0038,
"step": 176384
},
{
"epoch": 6.672962865022099,
"grad_norm": 0.3479785621166229,
"learning_rate": 6.6592875221941e-06,
"loss": 0.0059,
"step": 176640
},
{
"epoch": 6.682633825696045,
"grad_norm": 0.37940141558647156,
"learning_rate": 6.63994560084621e-06,
"loss": 0.0053,
"step": 176896
},
{
"epoch": 6.69230478636999,
"grad_norm": 0.2881454527378082,
"learning_rate": 6.62060367949832e-06,
"loss": 0.0043,
"step": 177152
},
{
"epoch": 6.701975747043935,
"grad_norm": 0.32211869955062866,
"learning_rate": 6.601261758150429e-06,
"loss": 0.0071,
"step": 177408
},
{
"epoch": 6.71164670771788,
"grad_norm": 0.0830293819308281,
"learning_rate": 6.581919836802539e-06,
"loss": 0.0047,
"step": 177664
},
{
"epoch": 6.7213176683918245,
"grad_norm": 0.6374879479408264,
"learning_rate": 6.5625779154546484e-06,
"loss": 0.005,
"step": 177920
},
{
"epoch": 6.73098862906577,
"grad_norm": 0.42339634895324707,
"learning_rate": 6.543235994106759e-06,
"loss": 0.0057,
"step": 178176
},
{
"epoch": 6.740659589739715,
"grad_norm": 0.21855546534061432,
"learning_rate": 6.523894072758869e-06,
"loss": 0.0044,
"step": 178432
},
{
"epoch": 6.75033055041366,
"grad_norm": 0.17506131529808044,
"learning_rate": 6.5046277057912435e-06,
"loss": 0.0048,
"step": 178688
},
{
"epoch": 6.760001511087605,
"grad_norm": 0.11796054244041443,
"learning_rate": 6.485285784443354e-06,
"loss": 0.0055,
"step": 178944
},
{
"epoch": 6.769672471761551,
"grad_norm": 0.7898224592208862,
"learning_rate": 6.465943863095463e-06,
"loss": 0.0042,
"step": 179200
},
{
"epoch": 6.779343432435495,
"grad_norm": 0.18970559537410736,
"learning_rate": 6.446677496127839e-06,
"loss": 0.0044,
"step": 179456
},
{
"epoch": 6.789014393109441,
"grad_norm": 1.1956768035888672,
"learning_rate": 6.427335574779948e-06,
"loss": 0.0049,
"step": 179712
},
{
"epoch": 6.798685353783386,
"grad_norm": 0.6470310688018799,
"learning_rate": 6.407993653432059e-06,
"loss": 0.005,
"step": 179968
},
{
"epoch": 6.808356314457331,
"grad_norm": 4.411340236663818,
"learning_rate": 6.388651732084168e-06,
"loss": 0.0043,
"step": 180224
},
{
"epoch": 6.818027275131276,
"grad_norm": 0.09347503632307053,
"learning_rate": 6.369309810736278e-06,
"loss": 0.0043,
"step": 180480
},
{
"epoch": 6.8276982358052205,
"grad_norm": 0.007505136076360941,
"learning_rate": 6.3499678893883875e-06,
"loss": 0.0055,
"step": 180736
},
{
"epoch": 6.837369196479166,
"grad_norm": 0.286432683467865,
"learning_rate": 6.330625968040498e-06,
"loss": 0.0039,
"step": 180992
},
{
"epoch": 6.847040157153111,
"grad_norm": 0.2944409251213074,
"learning_rate": 6.311284046692607e-06,
"loss": 0.004,
"step": 181248
},
{
"epoch": 6.856711117827056,
"grad_norm": 0.32838645577430725,
"learning_rate": 6.291942125344718e-06,
"loss": 0.0046,
"step": 181504
},
{
"epoch": 6.866382078501001,
"grad_norm": 0.04531640559434891,
"learning_rate": 6.272600203996827e-06,
"loss": 0.0048,
"step": 181760
},
{
"epoch": 6.876053039174947,
"grad_norm": 0.060415927320718765,
"learning_rate": 6.253258282648937e-06,
"loss": 0.0038,
"step": 182016
},
{
"epoch": 6.885723999848891,
"grad_norm": 0.0581819973886013,
"learning_rate": 6.233916361301047e-06,
"loss": 0.004,
"step": 182272
},
{
"epoch": 6.895394960522836,
"grad_norm": 0.0427870936691761,
"learning_rate": 6.214574439953157e-06,
"loss": 0.005,
"step": 182528
},
{
"epoch": 6.9050659211967815,
"grad_norm": 1.7197208404541016,
"learning_rate": 6.195232518605266e-06,
"loss": 0.0043,
"step": 182784
},
{
"epoch": 6.914736881870726,
"grad_norm": 0.09247897565364838,
"learning_rate": 6.175890597257377e-06,
"loss": 0.0056,
"step": 183040
},
{
"epoch": 6.924407842544672,
"grad_norm": 0.019822193309664726,
"learning_rate": 6.156548675909486e-06,
"loss": 0.0055,
"step": 183296
},
{
"epoch": 6.9340788032186165,
"grad_norm": 1.541544795036316,
"learning_rate": 6.137282308941861e-06,
"loss": 0.0057,
"step": 183552
},
{
"epoch": 6.943749763892562,
"grad_norm": 1.1010373830795288,
"learning_rate": 6.117940387593971e-06,
"loss": 0.0048,
"step": 183808
},
{
"epoch": 6.953420724566507,
"grad_norm": 0.32369253039360046,
"learning_rate": 6.0985984662460805e-06,
"loss": 0.0044,
"step": 184064
},
{
"epoch": 6.963091685240451,
"grad_norm": 0.36643514037132263,
"learning_rate": 6.079332099278456e-06,
"loss": 0.0052,
"step": 184320
},
{
"epoch": 6.972762645914397,
"grad_norm": 4.76845645904541,
"learning_rate": 6.0599901779305655e-06,
"loss": 0.0055,
"step": 184576
},
{
"epoch": 6.982433606588342,
"grad_norm": 0.9248315095901489,
"learning_rate": 6.0406482565826765e-06,
"loss": 0.0057,
"step": 184832
},
{
"epoch": 6.992104567262287,
"grad_norm": 7.52930212020874,
"learning_rate": 6.021306335234786e-06,
"loss": 0.0057,
"step": 185088
},
{
"epoch": 7.0,
"eval_f1_B-DISEASE": 0.8170322475036831,
"eval_f1_B-MEDICATION": 0.9388233174159835,
"eval_f1_B-PROCEDURE": 0.839606661240293,
"eval_f1_B-SYMPTOM": 0.8083601954871582,
"eval_f1_I-DISEASE": 0.8508488239606706,
"eval_f1_I-MEDICATION": 0.9480509127627348,
"eval_f1_I-PROCEDURE": 0.8557830786803291,
"eval_f1_I-SYMPTOM": 0.8172193160347818,
"eval_f1_O": 0.9271939022229883,
"eval_f1_macro": 0.8669909394787357,
"eval_f1_micro": 0.8922796408524778,
"eval_loss": 0.4217996597290039,
"eval_precision_B-DISEASE": 0.8439005833121989,
"eval_precision_B-MEDICATION": 0.9507299270072993,
"eval_precision_B-PROCEDURE": 0.8642271636248359,
"eval_precision_B-SYMPTOM": 0.8188329471244997,
"eval_precision_I-DISEASE": 0.8612162292396158,
"eval_precision_I-MEDICATION": 0.9526327031934209,
"eval_precision_I-PROCEDURE": 0.8682078109649086,
"eval_precision_I-SYMPTOM": 0.8107099237044831,
"eval_precision_O": 0.9254912549627295,
"eval_precision_macro": 0.8773276159037767,
"eval_precision_micro": 0.8938970887232961,
"eval_rauc_macro": 0.9183518246652276,
"eval_rauc_micro": 0.9385967353145594,
"eval_recall_B-DISEASE": 0.7918220036487665,
"eval_recall_B-MEDICATION": 0.9272112475529454,
"eval_recall_B-PROCEDURE": 0.8163501026694046,
"eval_recall_B-SYMPTOM": 0.7981519507186858,
"eval_recall_I-DISEASE": 0.8407280573012708,
"eval_recall_I-MEDICATION": 0.943512984608875,
"eval_recall_I-PROCEDURE": 0.8437089443234025,
"eval_recall_I-SYMPTOM": 0.8238340855362132,
"eval_recall_O": 0.9289028258275723,
"eval_recall_macro": 0.8571358002430152,
"eval_recall_micro": 0.8906680357402255,
"eval_roc_auc_B-DISEASE": 0.8945483627101096,
"eval_roc_auc_B-MEDICATION": 0.9635074195320126,
"eval_roc_auc_B-PROCEDURE": 0.9070703509413875,
"eval_roc_auc_B-SYMPTOM": 0.897166398981839,
"eval_roc_auc_I-DISEASE": 0.9115174466724183,
"eval_roc_auc_I-MEDICATION": 0.9714307242336749,
"eval_roc_auc_I-PROCEDURE": 0.9156151956077059,
"eval_roc_auc_I-SYMPTOM": 0.896927321744982,
"eval_roc_auc_O": 0.9073832015629196,
"eval_runtime": 61.0949,
"eval_samples_per_second": 177.969,
"eval_steps_per_second": 22.26,
"step": 185297
},
{
"epoch": 7.001775527936232,
"grad_norm": 0.7092540860176086,
"learning_rate": 6.001964413886896e-06,
"loss": 0.0041,
"step": 185344
},
{
"epoch": 7.0114464886101775,
"grad_norm": 0.18654197454452515,
"learning_rate": 5.982622492539005e-06,
"loss": 0.0024,
"step": 185600
},
{
"epoch": 7.021117449284122,
"grad_norm": 0.8840870261192322,
"learning_rate": 5.963280571191115e-06,
"loss": 0.0023,
"step": 185856
},
{
"epoch": 7.030788409958068,
"grad_norm": 0.08226889371871948,
"learning_rate": 5.943938649843225e-06,
"loss": 0.0041,
"step": 186112
},
{
"epoch": 7.040459370632012,
"grad_norm": 0.1381804347038269,
"learning_rate": 5.9245967284953355e-06,
"loss": 0.0031,
"step": 186368
},
{
"epoch": 7.050130331305957,
"grad_norm": 2.1430623531341553,
"learning_rate": 5.905254807147445e-06,
"loss": 0.0022,
"step": 186624
},
{
"epoch": 7.059801291979903,
"grad_norm": 0.060144223272800446,
"learning_rate": 5.885912885799555e-06,
"loss": 0.0022,
"step": 186880
},
{
"epoch": 7.069472252653847,
"grad_norm": 0.06146460771560669,
"learning_rate": 5.866570964451664e-06,
"loss": 0.0035,
"step": 187136
},
{
"epoch": 7.079143213327793,
"grad_norm": 1.6876006126403809,
"learning_rate": 5.847229043103775e-06,
"loss": 0.0034,
"step": 187392
},
{
"epoch": 7.088814174001738,
"grad_norm": 2.21935772895813,
"learning_rate": 5.8278871217558845e-06,
"loss": 0.0045,
"step": 187648
},
{
"epoch": 7.098485134675683,
"grad_norm": 0.2139071524143219,
"learning_rate": 5.808545200407995e-06,
"loss": 0.0028,
"step": 187904
},
{
"epoch": 7.108156095349628,
"grad_norm": 0.2530527710914612,
"learning_rate": 5.789203279060104e-06,
"loss": 0.0029,
"step": 188160
},
{
"epoch": 7.117827056023573,
"grad_norm": 0.06350823491811752,
"learning_rate": 5.769861357712214e-06,
"loss": 0.0028,
"step": 188416
},
{
"epoch": 7.127498016697518,
"grad_norm": 0.3266438841819763,
"learning_rate": 5.750519436364323e-06,
"loss": 0.0057,
"step": 188672
},
{
"epoch": 7.137168977371463,
"grad_norm": 0.02727964147925377,
"learning_rate": 5.731253069396698e-06,
"loss": 0.0042,
"step": 188928
},
{
"epoch": 7.146839938045408,
"grad_norm": 0.007432880811393261,
"learning_rate": 5.711911148048809e-06,
"loss": 0.0035,
"step": 189184
},
{
"epoch": 7.156510898719353,
"grad_norm": 0.09012371301651001,
"learning_rate": 5.692569226700918e-06,
"loss": 0.0039,
"step": 189440
},
{
"epoch": 7.166181859393299,
"grad_norm": 0.19539253413677216,
"learning_rate": 5.6732273053530285e-06,
"loss": 0.0039,
"step": 189696
},
{
"epoch": 7.175852820067243,
"grad_norm": 3.682310104370117,
"learning_rate": 5.653885384005138e-06,
"loss": 0.0031,
"step": 189952
},
{
"epoch": 7.185523780741189,
"grad_norm": 0.4140027165412903,
"learning_rate": 5.634543462657248e-06,
"loss": 0.0044,
"step": 190208
},
{
"epoch": 7.195194741415134,
"grad_norm": 0.047425903379917145,
"learning_rate": 5.615201541309357e-06,
"loss": 0.0032,
"step": 190464
},
{
"epoch": 7.204865702089078,
"grad_norm": 0.08099602907896042,
"learning_rate": 5.595859619961468e-06,
"loss": 0.0027,
"step": 190720
},
{
"epoch": 7.214536662763024,
"grad_norm": 2.0335052013397217,
"learning_rate": 5.5765176986135775e-06,
"loss": 0.0038,
"step": 190976
},
{
"epoch": 7.2242076234369685,
"grad_norm": 0.7074165940284729,
"learning_rate": 5.557251331645953e-06,
"loss": 0.0033,
"step": 191232
},
{
"epoch": 7.233878584110914,
"grad_norm": 0.00729184877127409,
"learning_rate": 5.537909410298062e-06,
"loss": 0.0033,
"step": 191488
},
{
"epoch": 7.243549544784859,
"grad_norm": 0.2962284982204437,
"learning_rate": 5.518643043330437e-06,
"loss": 0.0033,
"step": 191744
},
{
"epoch": 7.253220505458804,
"grad_norm": 0.03666882589459419,
"learning_rate": 5.499301121982547e-06,
"loss": 0.0032,
"step": 192000
},
{
"epoch": 7.262891466132749,
"grad_norm": 2.278210163116455,
"learning_rate": 5.479959200634657e-06,
"loss": 0.0026,
"step": 192256
},
{
"epoch": 7.272562426806694,
"grad_norm": 0.6450464129447937,
"learning_rate": 5.460617279286768e-06,
"loss": 0.0031,
"step": 192512
},
{
"epoch": 7.282233387480639,
"grad_norm": 0.011020343750715256,
"learning_rate": 5.441275357938877e-06,
"loss": 0.0026,
"step": 192768
},
{
"epoch": 7.291904348154584,
"grad_norm": 0.848145604133606,
"learning_rate": 5.421933436590987e-06,
"loss": 0.0031,
"step": 193024
},
{
"epoch": 7.30157530882853,
"grad_norm": 0.47598353028297424,
"learning_rate": 5.402591515243096e-06,
"loss": 0.0035,
"step": 193280
},
{
"epoch": 7.311246269502474,
"grad_norm": 0.08850053697824478,
"learning_rate": 5.3832495938952064e-06,
"loss": 0.0028,
"step": 193536
},
{
"epoch": 7.32091723017642,
"grad_norm": 0.14100511372089386,
"learning_rate": 5.363907672547316e-06,
"loss": 0.0028,
"step": 193792
},
{
"epoch": 7.3305881908503645,
"grad_norm": 0.0643409714102745,
"learning_rate": 5.344565751199427e-06,
"loss": 0.0034,
"step": 194048
},
{
"epoch": 7.340259151524309,
"grad_norm": 0.02023415081202984,
"learning_rate": 5.325223829851536e-06,
"loss": 0.0034,
"step": 194304
},
{
"epoch": 7.349930112198255,
"grad_norm": 0.2690616846084595,
"learning_rate": 5.305881908503646e-06,
"loss": 0.0036,
"step": 194560
},
{
"epoch": 7.3596010728721994,
"grad_norm": 1.2020032405853271,
"learning_rate": 5.286539987155755e-06,
"loss": 0.0021,
"step": 194816
},
{
"epoch": 7.369272033546145,
"grad_norm": 0.49315980076789856,
"learning_rate": 5.2671980658078655e-06,
"loss": 0.0033,
"step": 195072
},
{
"epoch": 7.37894299422009,
"grad_norm": 0.03424458205699921,
"learning_rate": 5.247856144459975e-06,
"loss": 0.0034,
"step": 195328
},
{
"epoch": 7.388613954894035,
"grad_norm": 0.5558503270149231,
"learning_rate": 5.228514223112086e-06,
"loss": 0.0039,
"step": 195584
},
{
"epoch": 7.39828491556798,
"grad_norm": 0.1527431756258011,
"learning_rate": 5.209172301764195e-06,
"loss": 0.0025,
"step": 195840
},
{
"epoch": 7.4079558762419255,
"grad_norm": 0.03023804910480976,
"learning_rate": 5.189830380416305e-06,
"loss": 0.0029,
"step": 196096
},
{
"epoch": 7.41762683691587,
"grad_norm": 0.006813144311308861,
"learning_rate": 5.1704884590684145e-06,
"loss": 0.002,
"step": 196352
},
{
"epoch": 7.427297797589815,
"grad_norm": 0.06950301676988602,
"learning_rate": 5.151146537720525e-06,
"loss": 0.0035,
"step": 196608
},
{
"epoch": 7.4369687582637605,
"grad_norm": 0.12590453028678894,
"learning_rate": 5.131804616372634e-06,
"loss": 0.0027,
"step": 196864
},
{
"epoch": 7.446639718937705,
"grad_norm": 1.1601083278656006,
"learning_rate": 5.112462695024745e-06,
"loss": 0.0025,
"step": 197120
},
{
"epoch": 7.456310679611651,
"grad_norm": 1.2641323804855347,
"learning_rate": 5.093120773676854e-06,
"loss": 0.0031,
"step": 197376
},
{
"epoch": 7.465981640285595,
"grad_norm": 0.9254095554351807,
"learning_rate": 5.073778852328964e-06,
"loss": 0.003,
"step": 197632
},
{
"epoch": 7.475652600959541,
"grad_norm": 0.05598944053053856,
"learning_rate": 5.0544369309810736e-06,
"loss": 0.003,
"step": 197888
},
{
"epoch": 7.485323561633486,
"grad_norm": 0.040579646825790405,
"learning_rate": 5.035170564013449e-06,
"loss": 0.0028,
"step": 198144
},
{
"epoch": 7.494994522307431,
"grad_norm": 8.562992095947266,
"learning_rate": 5.0158286426655585e-06,
"loss": 0.0043,
"step": 198400
},
{
"epoch": 7.504665482981376,
"grad_norm": 0.09161358326673508,
"learning_rate": 4.996562275697933e-06,
"loss": 0.0028,
"step": 198656
},
{
"epoch": 7.514336443655321,
"grad_norm": 0.06476159393787384,
"learning_rate": 4.9772203543500435e-06,
"loss": 0.0029,
"step": 198912
},
{
"epoch": 7.524007404329266,
"grad_norm": 0.025177879258990288,
"learning_rate": 4.957878433002154e-06,
"loss": 0.0041,
"step": 199168
},
{
"epoch": 7.533678365003211,
"grad_norm": 0.06914424151182175,
"learning_rate": 4.938536511654263e-06,
"loss": 0.0036,
"step": 199424
},
{
"epoch": 7.543349325677156,
"grad_norm": 0.007711977697908878,
"learning_rate": 4.919194590306373e-06,
"loss": 0.0037,
"step": 199680
},
{
"epoch": 7.553020286351101,
"grad_norm": 0.5741889476776123,
"learning_rate": 4.899852668958483e-06,
"loss": 0.0021,
"step": 199936
},
{
"epoch": 7.562691247025047,
"grad_norm": 0.017532778903841972,
"learning_rate": 4.880510747610593e-06,
"loss": 0.0039,
"step": 200192
},
{
"epoch": 7.572362207698991,
"grad_norm": 0.013444333337247372,
"learning_rate": 4.8611688262627025e-06,
"loss": 0.0032,
"step": 200448
},
{
"epoch": 7.582033168372936,
"grad_norm": 0.1252066045999527,
"learning_rate": 4.8418269049148135e-06,
"loss": 0.0026,
"step": 200704
},
{
"epoch": 7.591704129046882,
"grad_norm": 0.16216708719730377,
"learning_rate": 4.822560537947188e-06,
"loss": 0.0028,
"step": 200960
},
{
"epoch": 7.601375089720826,
"grad_norm": 0.20117320120334625,
"learning_rate": 4.803218616599298e-06,
"loss": 0.0026,
"step": 201216
},
{
"epoch": 7.611046050394772,
"grad_norm": 0.4220730662345886,
"learning_rate": 4.783876695251408e-06,
"loss": 0.0033,
"step": 201472
},
{
"epoch": 7.620717011068717,
"grad_norm": 0.04324984550476074,
"learning_rate": 4.764534773903518e-06,
"loss": 0.0032,
"step": 201728
},
{
"epoch": 7.630387971742662,
"grad_norm": 0.24287299811840057,
"learning_rate": 4.745192852555627e-06,
"loss": 0.0029,
"step": 201984
},
{
"epoch": 7.640058932416607,
"grad_norm": 0.01797611638903618,
"learning_rate": 4.725850931207737e-06,
"loss": 0.0023,
"step": 202240
},
{
"epoch": 7.6497298930905515,
"grad_norm": 0.027291102334856987,
"learning_rate": 4.706509009859847e-06,
"loss": 0.0037,
"step": 202496
},
{
"epoch": 7.659400853764497,
"grad_norm": 0.015763144940137863,
"learning_rate": 4.687167088511957e-06,
"loss": 0.0024,
"step": 202752
},
{
"epoch": 7.669071814438442,
"grad_norm": 2.068912982940674,
"learning_rate": 4.6679007215443315e-06,
"loss": 0.0027,
"step": 203008
},
{
"epoch": 7.678742775112387,
"grad_norm": 0.1518033742904663,
"learning_rate": 4.648558800196442e-06,
"loss": 0.0025,
"step": 203264
},
{
"epoch": 7.688413735786332,
"grad_norm": 0.7454547882080078,
"learning_rate": 4.629216878848552e-06,
"loss": 0.0027,
"step": 203520
},
{
"epoch": 7.698084696460278,
"grad_norm": 0.04685609042644501,
"learning_rate": 4.609874957500661e-06,
"loss": 0.0034,
"step": 203776
},
{
"epoch": 7.707755657134222,
"grad_norm": 0.012423527427017689,
"learning_rate": 4.590533036152771e-06,
"loss": 0.002,
"step": 204032
},
{
"epoch": 7.717426617808167,
"grad_norm": 0.5419167876243591,
"learning_rate": 4.571191114804881e-06,
"loss": 0.0025,
"step": 204288
},
{
"epoch": 7.7270975784821125,
"grad_norm": 0.3725039064884186,
"learning_rate": 4.551849193456991e-06,
"loss": 0.0028,
"step": 204544
},
{
"epoch": 7.736768539156057,
"grad_norm": 0.09141060709953308,
"learning_rate": 4.532507272109101e-06,
"loss": 0.0024,
"step": 204800
},
{
"epoch": 7.746439499830003,
"grad_norm": 0.13550949096679688,
"learning_rate": 4.513165350761211e-06,
"loss": 0.0025,
"step": 205056
},
{
"epoch": 7.7561104605039475,
"grad_norm": 0.005226655397564173,
"learning_rate": 4.49382342941332e-06,
"loss": 0.0027,
"step": 205312
},
{
"epoch": 7.765781421177893,
"grad_norm": 1.0764216184616089,
"learning_rate": 4.47448150806543e-06,
"loss": 0.0029,
"step": 205568
},
{
"epoch": 7.775452381851838,
"grad_norm": 0.019114414229989052,
"learning_rate": 4.45513958671754e-06,
"loss": 0.0023,
"step": 205824
},
{
"epoch": 7.785123342525783,
"grad_norm": 0.214304581284523,
"learning_rate": 4.43579766536965e-06,
"loss": 0.0028,
"step": 206080
},
{
"epoch": 7.794794303199728,
"grad_norm": 0.9313531517982483,
"learning_rate": 4.41645574402176e-06,
"loss": 0.0027,
"step": 206336
},
{
"epoch": 7.804465263873674,
"grad_norm": 0.04551494121551514,
"learning_rate": 4.3971893770541355e-06,
"loss": 0.0025,
"step": 206592
},
{
"epoch": 7.814136224547618,
"grad_norm": 0.25390639901161194,
"learning_rate": 4.377847455706245e-06,
"loss": 0.0028,
"step": 206848
},
{
"epoch": 7.823807185221563,
"grad_norm": 0.4188549816608429,
"learning_rate": 4.358505534358355e-06,
"loss": 0.0035,
"step": 207104
},
{
"epoch": 7.8334781458955085,
"grad_norm": 5.584123134613037,
"learning_rate": 4.339163613010465e-06,
"loss": 0.0029,
"step": 207360
},
{
"epoch": 7.843149106569453,
"grad_norm": 0.09376902878284454,
"learning_rate": 4.319821691662574e-06,
"loss": 0.0025,
"step": 207616
},
{
"epoch": 7.852820067243399,
"grad_norm": 0.007881022058427334,
"learning_rate": 4.3004797703146844e-06,
"loss": 0.0031,
"step": 207872
},
{
"epoch": 7.8624910279173434,
"grad_norm": 0.053988266736269,
"learning_rate": 4.2811378489667946e-06,
"loss": 0.0031,
"step": 208128
},
{
"epoch": 7.872161988591289,
"grad_norm": 0.37332120537757874,
"learning_rate": 4.261795927618904e-06,
"loss": 0.0021,
"step": 208384
},
{
"epoch": 7.881832949265234,
"grad_norm": 0.10056313127279282,
"learning_rate": 4.242454006271014e-06,
"loss": 0.003,
"step": 208640
},
{
"epoch": 7.891503909939178,
"grad_norm": 0.021642550826072693,
"learning_rate": 4.223187639303389e-06,
"loss": 0.003,
"step": 208896
},
{
"epoch": 7.901174870613124,
"grad_norm": 0.15152160823345184,
"learning_rate": 4.203845717955499e-06,
"loss": 0.0028,
"step": 209152
},
{
"epoch": 7.910845831287069,
"grad_norm": 0.05597339943051338,
"learning_rate": 4.184503796607608e-06,
"loss": 0.0026,
"step": 209408
},
{
"epoch": 7.920516791961014,
"grad_norm": 0.026413604617118835,
"learning_rate": 4.165161875259718e-06,
"loss": 0.0027,
"step": 209664
},
{
"epoch": 7.930187752634959,
"grad_norm": 0.086790531873703,
"learning_rate": 4.1458199539118285e-06,
"loss": 0.0018,
"step": 209920
},
{
"epoch": 7.9398587133089045,
"grad_norm": 0.40138956904411316,
"learning_rate": 4.126478032563938e-06,
"loss": 0.0026,
"step": 210176
},
{
"epoch": 7.949529673982849,
"grad_norm": 0.504784107208252,
"learning_rate": 4.107136111216048e-06,
"loss": 0.003,
"step": 210432
},
{
"epoch": 7.959200634656794,
"grad_norm": 0.5855137705802917,
"learning_rate": 4.087794189868158e-06,
"loss": 0.0038,
"step": 210688
},
{
"epoch": 7.968871595330739,
"grad_norm": 0.23986396193504333,
"learning_rate": 4.068452268520267e-06,
"loss": 0.0027,
"step": 210944
},
{
"epoch": 7.978542556004684,
"grad_norm": 0.08508482575416565,
"learning_rate": 4.049110347172377e-06,
"loss": 0.0039,
"step": 211200
},
{
"epoch": 7.98821351667863,
"grad_norm": 2.018085241317749,
"learning_rate": 4.0297684258244875e-06,
"loss": 0.0018,
"step": 211456
},
{
"epoch": 7.997884477352574,
"grad_norm": 0.023388510569930077,
"learning_rate": 4.010502058856862e-06,
"loss": 0.0022,
"step": 211712
},
{
"epoch": 8.0,
"eval_f1_B-DISEASE": 0.8192092717409173,
"eval_f1_B-MEDICATION": 0.9423820224719102,
"eval_f1_B-PROCEDURE": 0.8420637009739406,
"eval_f1_B-SYMPTOM": 0.8127123442808607,
"eval_f1_I-DISEASE": 0.850955341029534,
"eval_f1_I-MEDICATION": 0.949058663755226,
"eval_f1_I-PROCEDURE": 0.8554017038172543,
"eval_f1_I-SYMPTOM": 0.8136104891443594,
"eval_f1_O": 0.9274238987873996,
"eval_f1_macro": 0.868090826222378,
"eval_f1_micro": 0.8928833447754752,
"eval_loss": 0.4737370014190674,
"eval_precision_B-DISEASE": 0.8500213219616205,
"eval_precision_B-MEDICATION": 0.9520523065746458,
"eval_precision_B-PROCEDURE": 0.8641274986493788,
"eval_precision_B-SYMPTOM": 0.8414187307635937,
"eval_precision_I-DISEASE": 0.8638646013066827,
"eval_precision_I-MEDICATION": 0.9557009546283385,
"eval_precision_I-PROCEDURE": 0.8787206030410202,
"eval_precision_I-SYMPTOM": 0.8445731862439002,
"eval_precision_O": 0.9156305475079966,
"eval_precision_macro": 0.8851233056307976,
"eval_precision_micro": 0.895332761029088,
"eval_rauc_macro": 0.9153957194153303,
"eval_rauc_micro": 0.9385898278409849,
"eval_recall_B-DISEASE": 0.7905528674545887,
"eval_recall_B-MEDICATION": 0.9329062110695854,
"eval_recall_B-PROCEDURE": 0.8210985626283368,
"eval_recall_B-SYMPTOM": 0.7859000684462697,
"eval_recall_I-DISEASE": 0.8384262221051443,
"eval_recall_I-MEDICATION": 0.942508065795737,
"eval_recall_I-PROCEDURE": 0.8332884525936988,
"eval_recall_I-SYMPTOM": 0.7848377390930582,
"eval_recall_O": 0.9395250115419437,
"eval_recall_macro": 0.8521159111920403,
"eval_recall_micro": 0.8904472939909823,
"eval_roc_auc_B-DISEASE": 0.8939787349011639,
"eval_roc_auc_B-MEDICATION": 0.966357083606876,
"eval_roc_auc_B-PROCEDURE": 0.9094372113385102,
"eval_roc_auc_B-SYMPTOM": 0.8913483585328563,
"eval_roc_auc_I-DISEASE": 0.9105856356600845,
"eval_roc_auc_I-MEDICATION": 0.9709506682682745,
"eval_roc_auc_I-PROCEDURE": 0.9110413996799644,
"eval_roc_auc_I-SYMPTOM": 0.8811634945418189,
"eval_roc_auc_O": 0.9036988882084248,
"eval_runtime": 61.2016,
"eval_samples_per_second": 177.659,
"eval_steps_per_second": 22.222,
"step": 211768
},
{
"epoch": 8.00755543802652,
"grad_norm": 0.04221045598387718,
"learning_rate": 3.9911601375089725e-06,
"loss": 0.0014,
"step": 211968
},
{
"epoch": 8.017226398700465,
"grad_norm": 0.10489369928836823,
"learning_rate": 3.971818216161083e-06,
"loss": 0.0014,
"step": 212224
},
{
"epoch": 8.02689735937441,
"grad_norm": 0.005116314627230167,
"learning_rate": 3.952476294813192e-06,
"loss": 0.0017,
"step": 212480
},
{
"epoch": 8.036568320048355,
"grad_norm": 0.013480676338076591,
"learning_rate": 3.933134373465302e-06,
"loss": 0.0015,
"step": 212736
},
{
"epoch": 8.0462392807223,
"grad_norm": 0.009527523070573807,
"learning_rate": 3.913792452117412e-06,
"loss": 0.0017,
"step": 212992
},
{
"epoch": 8.055910241396244,
"grad_norm": 0.06975742429494858,
"learning_rate": 3.8944505307695214e-06,
"loss": 0.0018,
"step": 213248
},
{
"epoch": 8.06558120207019,
"grad_norm": 1.0523467063903809,
"learning_rate": 3.8751086094216316e-06,
"loss": 0.0008,
"step": 213504
},
{
"epoch": 8.075252162744135,
"grad_norm": 0.021572506055235863,
"learning_rate": 3.855766688073742e-06,
"loss": 0.0015,
"step": 213760
},
{
"epoch": 8.084923123418081,
"grad_norm": 0.004556609317660332,
"learning_rate": 3.8365003211061165e-06,
"loss": 0.0025,
"step": 214016
},
{
"epoch": 8.094594084092025,
"grad_norm": 0.01564151607453823,
"learning_rate": 3.817158399758226e-06,
"loss": 0.002,
"step": 214272
},
{
"epoch": 8.10426504476597,
"grad_norm": 0.02460288256406784,
"learning_rate": 3.797816478410336e-06,
"loss": 0.0023,
"step": 214528
},
{
"epoch": 8.113936005439916,
"grad_norm": 0.19753815233707428,
"learning_rate": 3.778474557062446e-06,
"loss": 0.0022,
"step": 214784
},
{
"epoch": 8.12360696611386,
"grad_norm": 0.0022627103608101606,
"learning_rate": 3.7591326357145558e-06,
"loss": 0.0027,
"step": 215040
},
{
"epoch": 8.133277926787805,
"grad_norm": 0.027415508404374123,
"learning_rate": 3.7397907143666655e-06,
"loss": 0.0013,
"step": 215296
},
{
"epoch": 8.14294888746175,
"grad_norm": 0.13008584082126617,
"learning_rate": 3.7204487930187756e-06,
"loss": 0.0023,
"step": 215552
},
{
"epoch": 8.152619848135696,
"grad_norm": 0.03469686210155487,
"learning_rate": 3.7011068716708853e-06,
"loss": 0.0017,
"step": 215808
},
{
"epoch": 8.16229080880964,
"grad_norm": 0.27707692980766296,
"learning_rate": 3.681764950322995e-06,
"loss": 0.0016,
"step": 216064
},
{
"epoch": 8.171961769483586,
"grad_norm": 0.001276107388548553,
"learning_rate": 3.662423028975105e-06,
"loss": 0.0019,
"step": 216320
},
{
"epoch": 8.181632730157531,
"grad_norm": 0.1010005995631218,
"learning_rate": 3.6431566620074804e-06,
"loss": 0.0017,
"step": 216576
},
{
"epoch": 8.191303690831475,
"grad_norm": 0.0014761561760678887,
"learning_rate": 3.62381474065959e-06,
"loss": 0.0012,
"step": 216832
},
{
"epoch": 8.20097465150542,
"grad_norm": 0.01065876055508852,
"learning_rate": 3.6044728193117002e-06,
"loss": 0.0018,
"step": 217088
},
{
"epoch": 8.210645612179366,
"grad_norm": 0.013767397962510586,
"learning_rate": 3.58513089796381e-06,
"loss": 0.0019,
"step": 217344
},
{
"epoch": 8.220316572853312,
"grad_norm": 0.06974133104085922,
"learning_rate": 3.5657889766159196e-06,
"loss": 0.0016,
"step": 217600
},
{
"epoch": 8.229987533527256,
"grad_norm": 0.0005238667945377529,
"learning_rate": 3.5464470552680298e-06,
"loss": 0.002,
"step": 217856
},
{
"epoch": 8.239658494201201,
"grad_norm": 0.0016113127348944545,
"learning_rate": 3.5271051339201395e-06,
"loss": 0.0021,
"step": 218112
},
{
"epoch": 8.249329454875147,
"grad_norm": 0.006277918349951506,
"learning_rate": 3.5077632125722496e-06,
"loss": 0.002,
"step": 218368
},
{
"epoch": 8.259000415549092,
"grad_norm": 6.543371200561523,
"learning_rate": 3.4884212912243593e-06,
"loss": 0.0032,
"step": 218624
},
{
"epoch": 8.268671376223036,
"grad_norm": 0.002728199353441596,
"learning_rate": 3.469154924256734e-06,
"loss": 0.0017,
"step": 218880
},
{
"epoch": 8.278342336896982,
"grad_norm": 0.0380263552069664,
"learning_rate": 3.449813002908844e-06,
"loss": 0.0015,
"step": 219136
},
{
"epoch": 8.288013297570927,
"grad_norm": 0.09521731734275818,
"learning_rate": 3.430471081560954e-06,
"loss": 0.0014,
"step": 219392
},
{
"epoch": 8.297684258244871,
"grad_norm": 0.05859646946191788,
"learning_rate": 3.4111291602130637e-06,
"loss": 0.0016,
"step": 219648
},
{
"epoch": 8.307355218918817,
"grad_norm": 0.057360127568244934,
"learning_rate": 3.3917872388651734e-06,
"loss": 0.0015,
"step": 219904
},
{
"epoch": 8.317026179592762,
"grad_norm": 0.005022614262998104,
"learning_rate": 3.3724453175172835e-06,
"loss": 0.0018,
"step": 220160
},
{
"epoch": 8.326697140266708,
"grad_norm": 0.009211408905684948,
"learning_rate": 3.353103396169393e-06,
"loss": 0.0019,
"step": 220416
},
{
"epoch": 8.336368100940652,
"grad_norm": 0.8216173052787781,
"learning_rate": 3.333761474821503e-06,
"loss": 0.0015,
"step": 220672
},
{
"epoch": 8.346039061614597,
"grad_norm": 0.036033984273672104,
"learning_rate": 3.314419553473613e-06,
"loss": 0.0019,
"step": 220928
},
{
"epoch": 8.355710022288543,
"grad_norm": 0.28528496623039246,
"learning_rate": 3.295153186505988e-06,
"loss": 0.0016,
"step": 221184
},
{
"epoch": 8.365380982962487,
"grad_norm": 0.21900594234466553,
"learning_rate": 3.2758112651580976e-06,
"loss": 0.0011,
"step": 221440
},
{
"epoch": 8.375051943636432,
"grad_norm": 0.1995537430047989,
"learning_rate": 3.2564693438102073e-06,
"loss": 0.0011,
"step": 221696
},
{
"epoch": 8.384722904310378,
"grad_norm": 0.05183367431163788,
"learning_rate": 3.2371274224623174e-06,
"loss": 0.0016,
"step": 221952
},
{
"epoch": 8.394393864984323,
"grad_norm": 0.8787815570831299,
"learning_rate": 3.217785501114427e-06,
"loss": 0.0016,
"step": 222208
},
{
"epoch": 8.404064825658267,
"grad_norm": 0.013117530383169651,
"learning_rate": 3.198443579766537e-06,
"loss": 0.0017,
"step": 222464
},
{
"epoch": 8.413735786332213,
"grad_norm": 0.005170230288058519,
"learning_rate": 3.179101658418647e-06,
"loss": 0.0018,
"step": 222720
},
{
"epoch": 8.423406747006158,
"grad_norm": 0.07186521589756012,
"learning_rate": 3.1597597370707567e-06,
"loss": 0.0024,
"step": 222976
},
{
"epoch": 8.433077707680102,
"grad_norm": 0.4515911042690277,
"learning_rate": 3.1404178157228664e-06,
"loss": 0.0023,
"step": 223232
},
{
"epoch": 8.442748668354048,
"grad_norm": 0.05934571474790573,
"learning_rate": 3.121151448755242e-06,
"loss": 0.0024,
"step": 223488
},
{
"epoch": 8.452419629027993,
"grad_norm": 0.5439963936805725,
"learning_rate": 3.1018095274073517e-06,
"loss": 0.0015,
"step": 223744
},
{
"epoch": 8.462090589701939,
"grad_norm": 0.002186891855672002,
"learning_rate": 3.0824676060594614e-06,
"loss": 0.0012,
"step": 224000
},
{
"epoch": 8.471761550375883,
"grad_norm": 0.005363143049180508,
"learning_rate": 3.0631256847115716e-06,
"loss": 0.0019,
"step": 224256
},
{
"epoch": 8.481432511049828,
"grad_norm": 0.8389096856117249,
"learning_rate": 3.0437837633636813e-06,
"loss": 0.0014,
"step": 224512
},
{
"epoch": 8.491103471723774,
"grad_norm": 0.009227742440998554,
"learning_rate": 3.024441842015791e-06,
"loss": 0.0015,
"step": 224768
},
{
"epoch": 8.500774432397717,
"grad_norm": 0.021440809592604637,
"learning_rate": 3.005099920667901e-06,
"loss": 0.0012,
"step": 225024
},
{
"epoch": 8.510445393071663,
"grad_norm": 0.053202465176582336,
"learning_rate": 2.985757999320011e-06,
"loss": 0.0021,
"step": 225280
},
{
"epoch": 8.520116353745609,
"grad_norm": 0.09795872122049332,
"learning_rate": 2.9664160779721205e-06,
"loss": 0.0011,
"step": 225536
},
{
"epoch": 8.529787314419554,
"grad_norm": 0.07053809612989426,
"learning_rate": 2.9470741566242306e-06,
"loss": 0.002,
"step": 225792
},
{
"epoch": 8.539458275093498,
"grad_norm": 0.015584302134811878,
"learning_rate": 2.9277322352763403e-06,
"loss": 0.0017,
"step": 226048
},
{
"epoch": 8.549129235767444,
"grad_norm": 0.014636941254138947,
"learning_rate": 2.9083903139284505e-06,
"loss": 0.002,
"step": 226304
},
{
"epoch": 8.55880019644139,
"grad_norm": 0.002259760396555066,
"learning_rate": 2.88904839258056e-06,
"loss": 0.0022,
"step": 226560
},
{
"epoch": 8.568471157115333,
"grad_norm": 0.1187112033367157,
"learning_rate": 2.86970647123267e-06,
"loss": 0.0019,
"step": 226816
},
{
"epoch": 8.578142117789278,
"grad_norm": 1.316362738609314,
"learning_rate": 2.85036454988478e-06,
"loss": 0.0018,
"step": 227072
},
{
"epoch": 8.587813078463224,
"grad_norm": 0.02268380858004093,
"learning_rate": 2.8310226285368897e-06,
"loss": 0.0015,
"step": 227328
},
{
"epoch": 8.59748403913717,
"grad_norm": 0.11864591389894485,
"learning_rate": 2.8117562615692645e-06,
"loss": 0.0016,
"step": 227584
},
{
"epoch": 8.607154999811113,
"grad_norm": 0.1629875749349594,
"learning_rate": 2.7924143402213743e-06,
"loss": 0.0013,
"step": 227840
},
{
"epoch": 8.616825960485059,
"grad_norm": 0.0012598687317222357,
"learning_rate": 2.7730724188734844e-06,
"loss": 0.0015,
"step": 228096
},
{
"epoch": 8.626496921159005,
"grad_norm": 0.012492740526795387,
"learning_rate": 2.753730497525594e-06,
"loss": 0.0017,
"step": 228352
},
{
"epoch": 8.63616788183295,
"grad_norm": 0.14352132380008698,
"learning_rate": 2.734388576177704e-06,
"loss": 0.0013,
"step": 228608
},
{
"epoch": 8.645838842506894,
"grad_norm": 0.022044667974114418,
"learning_rate": 2.715046654829814e-06,
"loss": 0.0015,
"step": 228864
},
{
"epoch": 8.65550980318084,
"grad_norm": 0.28277599811553955,
"learning_rate": 2.6957047334819236e-06,
"loss": 0.0024,
"step": 229120
},
{
"epoch": 8.665180763854785,
"grad_norm": 0.005805708467960358,
"learning_rate": 2.6763628121340333e-06,
"loss": 0.0018,
"step": 229376
},
{
"epoch": 8.674851724528729,
"grad_norm": 0.042201265692710876,
"learning_rate": 2.6570208907861435e-06,
"loss": 0.0013,
"step": 229632
},
{
"epoch": 8.684522685202674,
"grad_norm": 0.5332639813423157,
"learning_rate": 2.637678969438253e-06,
"loss": 0.001,
"step": 229888
},
{
"epoch": 8.69419364587662,
"grad_norm": 0.001226294320076704,
"learning_rate": 2.618337048090363e-06,
"loss": 0.0021,
"step": 230144
},
{
"epoch": 8.703864606550566,
"grad_norm": 0.008391711860895157,
"learning_rate": 2.598995126742473e-06,
"loss": 0.0018,
"step": 230400
},
{
"epoch": 8.71353556722451,
"grad_norm": 0.005565817467868328,
"learning_rate": 2.5797287597748482e-06,
"loss": 0.0014,
"step": 230656
},
{
"epoch": 8.723206527898455,
"grad_norm": 0.004753118846565485,
"learning_rate": 2.560386838426958e-06,
"loss": 0.0012,
"step": 230912
},
{
"epoch": 8.7328774885724,
"grad_norm": 0.0013271772768348455,
"learning_rate": 2.541044917079068e-06,
"loss": 0.0021,
"step": 231168
},
{
"epoch": 8.742548449246344,
"grad_norm": 0.06540732830762863,
"learning_rate": 2.5217029957311778e-06,
"loss": 0.0017,
"step": 231424
},
{
"epoch": 8.75221940992029,
"grad_norm": 0.16908077895641327,
"learning_rate": 2.5023610743832875e-06,
"loss": 0.002,
"step": 231680
},
{
"epoch": 8.761890370594235,
"grad_norm": 0.29503974318504333,
"learning_rate": 2.4830191530353976e-06,
"loss": 0.0016,
"step": 231936
},
{
"epoch": 8.771561331268181,
"grad_norm": 9.24250316619873,
"learning_rate": 2.4636772316875073e-06,
"loss": 0.0019,
"step": 232192
},
{
"epoch": 8.781232291942125,
"grad_norm": 0.09708067774772644,
"learning_rate": 2.444335310339617e-06,
"loss": 0.0011,
"step": 232448
},
{
"epoch": 8.79090325261607,
"grad_norm": 0.001615343731828034,
"learning_rate": 2.425068943371992e-06,
"loss": 0.0017,
"step": 232704
},
{
"epoch": 8.800574213290016,
"grad_norm": 0.21001236140727997,
"learning_rate": 2.405727022024102e-06,
"loss": 0.0021,
"step": 232960
},
{
"epoch": 8.81024517396396,
"grad_norm": 0.014585831202566624,
"learning_rate": 2.3863851006762117e-06,
"loss": 0.001,
"step": 233216
},
{
"epoch": 8.819916134637905,
"grad_norm": 0.6824801564216614,
"learning_rate": 2.367043179328322e-06,
"loss": 0.0016,
"step": 233472
},
{
"epoch": 8.829587095311851,
"grad_norm": 0.014681616798043251,
"learning_rate": 2.3477012579804315e-06,
"loss": 0.002,
"step": 233728
},
{
"epoch": 8.839258055985797,
"grad_norm": 0.010957110673189163,
"learning_rate": 2.3283593366325417e-06,
"loss": 0.0013,
"step": 233984
},
{
"epoch": 8.84892901665974,
"grad_norm": 1.2413954734802246,
"learning_rate": 2.3090174152846514e-06,
"loss": 0.0011,
"step": 234240
},
{
"epoch": 8.858599977333686,
"grad_norm": 0.1283838450908661,
"learning_rate": 2.289751048317026e-06,
"loss": 0.0011,
"step": 234496
},
{
"epoch": 8.868270938007631,
"grad_norm": 0.030070781707763672,
"learning_rate": 2.2704846813494014e-06,
"loss": 0.0013,
"step": 234752
},
{
"epoch": 8.877941898681575,
"grad_norm": 0.10878092795610428,
"learning_rate": 2.251142760001511e-06,
"loss": 0.0012,
"step": 235008
},
{
"epoch": 8.88761285935552,
"grad_norm": 0.0010157637298107147,
"learning_rate": 2.2318008386536213e-06,
"loss": 0.001,
"step": 235264
},
{
"epoch": 8.897283820029466,
"grad_norm": 0.0011938668321818113,
"learning_rate": 2.212458917305731e-06,
"loss": 0.0012,
"step": 235520
},
{
"epoch": 8.906954780703412,
"grad_norm": 0.0009772476041689515,
"learning_rate": 2.1931169959578407e-06,
"loss": 0.0012,
"step": 235776
},
{
"epoch": 8.916625741377356,
"grad_norm": 0.02653772011399269,
"learning_rate": 2.173775074609951e-06,
"loss": 0.0011,
"step": 236032
},
{
"epoch": 8.926296702051301,
"grad_norm": 0.002025567227974534,
"learning_rate": 2.1544331532620605e-06,
"loss": 0.0011,
"step": 236288
},
{
"epoch": 8.935967662725247,
"grad_norm": 0.07364089787006378,
"learning_rate": 2.1350912319141702e-06,
"loss": 0.0017,
"step": 236544
},
{
"epoch": 8.94563862339919,
"grad_norm": 0.000813729246146977,
"learning_rate": 2.1157493105662803e-06,
"loss": 0.0012,
"step": 236800
},
{
"epoch": 8.955309584073136,
"grad_norm": 0.3964155912399292,
"learning_rate": 2.09640738921839e-06,
"loss": 0.0013,
"step": 237056
},
{
"epoch": 8.964980544747082,
"grad_norm": 0.02675843983888626,
"learning_rate": 2.0770654678704998e-06,
"loss": 0.0013,
"step": 237312
},
{
"epoch": 8.974651505421027,
"grad_norm": 0.45542263984680176,
"learning_rate": 2.05772354652261e-06,
"loss": 0.0009,
"step": 237568
},
{
"epoch": 8.984322466094971,
"grad_norm": 0.004206574056297541,
"learning_rate": 2.0383816251747196e-06,
"loss": 0.0011,
"step": 237824
},
{
"epoch": 8.993993426768917,
"grad_norm": 0.029356837272644043,
"learning_rate": 2.0190397038268293e-06,
"loss": 0.0011,
"step": 238080
},
{
"epoch": 9.0,
"eval_f1_B-DISEASE": 0.820265182517597,
"eval_f1_B-MEDICATION": 0.9411343069617418,
"eval_f1_B-PROCEDURE": 0.8432354734732991,
"eval_f1_B-SYMPTOM": 0.8137595552466991,
"eval_f1_I-DISEASE": 0.853021119122057,
"eval_f1_I-MEDICATION": 0.95037530170013,
"eval_f1_I-PROCEDURE": 0.8561874578893519,
"eval_f1_I-SYMPTOM": 0.8206522616146783,
"eval_f1_O": 0.9278188308044935,
"eval_f1_macro": 0.8696054988144497,
"eval_f1_micro": 0.8938386961399782,
"eval_loss": 0.507999837398529,
"eval_precision_B-DISEASE": 0.8472398343055203,
"eval_precision_B-MEDICATION": 0.9476723204619271,
"eval_precision_B-PROCEDURE": 0.8588731144631766,
"eval_precision_B-SYMPTOM": 0.826393789696542,
"eval_precision_I-DISEASE": 0.8680188544493643,
"eval_precision_I-MEDICATION": 0.9531815279846776,
"eval_precision_I-PROCEDURE": 0.8730946382675522,
"eval_precision_I-SYMPTOM": 0.8215935894536173,
"eval_precision_O": 0.9236782838636837,
"eval_precision_macro": 0.8799717725495623,
"eval_precision_micro": 0.895900159381018,
"eval_rauc_macro": 0.9196513344131847,
"eval_rauc_micro": 0.9392897520293723,
"eval_recall_B-DISEASE": 0.7949551836281431,
"eval_recall_B-MEDICATION": 0.9346858871685353,
"eval_recall_B-PROCEDURE": 0.8281570841889117,
"eval_recall_B-SYMPTOM": 0.8015058179329226,
"eval_recall_I-DISEASE": 0.8385328466237659,
"eval_recall_I-MEDICATION": 0.9475855503252764,
"eval_recall_I-PROCEDURE": 0.8399226419251389,
"eval_recall_I-SYMPTOM": 0.8197130883301096,
"eval_recall_O": 0.9319966663269038,
"eval_recall_macro": 0.8596727518277453,
"eval_recall_micro": 0.8917866979597766,
"eval_roc_auc_B-DISEASE": 0.8961441020336804,
"eval_roc_auc_B-MEDICATION": 0.9672374649513288,
"eval_roc_auc_B-PROCEDURE": 0.9129064100226968,
"eval_roc_auc_B-SYMPTOM": 0.8989321500948878,
"eval_roc_auc_I-DISEASE": 0.9109411921441964,
"eval_roc_auc_I-MEDICATION": 0.973469577978567,
"eval_roc_auc_I-PROCEDURE": 0.9140138334490733,
"eval_roc_auc_I-SYMPTOM": 0.8959855777737502,
"eval_roc_auc_O": 0.9072317012704816,
"eval_runtime": 61.1454,
"eval_samples_per_second": 177.822,
"eval_steps_per_second": 22.242,
"step": 238239
},
{
"epoch": 9.003664387442862,
"grad_norm": 0.0012333148624747992,
"learning_rate": 1.9996977824789394e-06,
"loss": 0.0009,
"step": 238336
},
{
"epoch": 9.013335348116808,
"grad_norm": 0.05198514088988304,
"learning_rate": 1.980355861131049e-06,
"loss": 0.0013,
"step": 238592
},
{
"epoch": 9.023006308790752,
"grad_norm": 0.002556259511038661,
"learning_rate": 1.9610894941634244e-06,
"loss": 0.0007,
"step": 238848
},
{
"epoch": 9.032677269464697,
"grad_norm": 0.017605243250727654,
"learning_rate": 1.941747572815534e-06,
"loss": 0.0003,
"step": 239104
},
{
"epoch": 9.042348230138643,
"grad_norm": 0.2546218931674957,
"learning_rate": 1.9224056514676438e-06,
"loss": 0.0011,
"step": 239360
},
{
"epoch": 9.052019190812587,
"grad_norm": 0.005463745910674334,
"learning_rate": 1.903063730119754e-06,
"loss": 0.0007,
"step": 239616
},
{
"epoch": 9.061690151486532,
"grad_norm": 0.013387962244451046,
"learning_rate": 1.8837218087718636e-06,
"loss": 0.0009,
"step": 239872
},
{
"epoch": 9.071361112160478,
"grad_norm": 0.0036850119940936565,
"learning_rate": 1.8643798874239735e-06,
"loss": 0.0008,
"step": 240128
},
{
"epoch": 9.081032072834423,
"grad_norm": 0.002097562188282609,
"learning_rate": 1.8450379660760835e-06,
"loss": 0.0006,
"step": 240384
},
{
"epoch": 9.090703033508367,
"grad_norm": 0.009374704211950302,
"learning_rate": 1.8256960447281932e-06,
"loss": 0.0007,
"step": 240640
},
{
"epoch": 9.100373994182313,
"grad_norm": 0.009544138796627522,
"learning_rate": 1.806354123380303e-06,
"loss": 0.001,
"step": 240896
},
{
"epoch": 9.110044954856258,
"grad_norm": 0.014574944972991943,
"learning_rate": 1.787012202032413e-06,
"loss": 0.001,
"step": 241152
},
{
"epoch": 9.119715915530202,
"grad_norm": 0.0014770117122679949,
"learning_rate": 1.7676702806845227e-06,
"loss": 0.001,
"step": 241408
},
{
"epoch": 9.129386876204148,
"grad_norm": 0.00023075766512192786,
"learning_rate": 1.7483283593366326e-06,
"loss": 0.0006,
"step": 241664
},
{
"epoch": 9.139057836878093,
"grad_norm": 0.036480896174907684,
"learning_rate": 1.7289864379887425e-06,
"loss": 0.0007,
"step": 241920
},
{
"epoch": 9.148728797552039,
"grad_norm": 0.005274293944239616,
"learning_rate": 1.7096445166408524e-06,
"loss": 0.0008,
"step": 242176
},
{
"epoch": 9.158399758225983,
"grad_norm": 0.0636928603053093,
"learning_rate": 1.6903025952929622e-06,
"loss": 0.0005,
"step": 242432
},
{
"epoch": 9.168070718899928,
"grad_norm": 0.007083303295075893,
"learning_rate": 1.670960673945072e-06,
"loss": 0.0012,
"step": 242688
},
{
"epoch": 9.177741679573874,
"grad_norm": 0.0029853142332285643,
"learning_rate": 1.651618752597182e-06,
"loss": 0.0013,
"step": 242944
},
{
"epoch": 9.187412640247818,
"grad_norm": 0.004745794460177422,
"learning_rate": 1.6322768312492917e-06,
"loss": 0.0008,
"step": 243200
},
{
"epoch": 9.197083600921763,
"grad_norm": 0.029157089069485664,
"learning_rate": 1.6129349099014016e-06,
"loss": 0.0009,
"step": 243456
},
{
"epoch": 9.206754561595709,
"grad_norm": 0.09862171113491058,
"learning_rate": 1.5935929885535115e-06,
"loss": 0.001,
"step": 243712
},
{
"epoch": 9.216425522269654,
"grad_norm": 0.02549828216433525,
"learning_rate": 1.5742510672056212e-06,
"loss": 0.0013,
"step": 243968
},
{
"epoch": 9.226096482943598,
"grad_norm": 0.0003341349947731942,
"learning_rate": 1.5549091458577311e-06,
"loss": 0.0011,
"step": 244224
},
{
"epoch": 9.235767443617544,
"grad_norm": 0.00141440168954432,
"learning_rate": 1.535567224509841e-06,
"loss": 0.0007,
"step": 244480
},
{
"epoch": 9.24543840429149,
"grad_norm": 0.0013356832787394524,
"learning_rate": 1.516225303161951e-06,
"loss": 0.0014,
"step": 244736
},
{
"epoch": 9.255109364965433,
"grad_norm": 0.06080584600567818,
"learning_rate": 1.4968833818140607e-06,
"loss": 0.0006,
"step": 244992
},
{
"epoch": 9.264780325639379,
"grad_norm": 0.11237218230962753,
"learning_rate": 1.4775414604661706e-06,
"loss": 0.0012,
"step": 245248
},
{
"epoch": 9.274451286313324,
"grad_norm": 0.23928683996200562,
"learning_rate": 1.4581995391182805e-06,
"loss": 0.0005,
"step": 245504
},
{
"epoch": 9.28412224698727,
"grad_norm": 0.001771116629242897,
"learning_rate": 1.4388576177703902e-06,
"loss": 0.0011,
"step": 245760
},
{
"epoch": 9.293793207661214,
"grad_norm": 0.0017612532246857882,
"learning_rate": 1.4195156964225001e-06,
"loss": 0.0007,
"step": 246016
},
{
"epoch": 9.303464168335159,
"grad_norm": 0.00843687541782856,
"learning_rate": 1.4002493294548752e-06,
"loss": 0.0018,
"step": 246272
},
{
"epoch": 9.313135129009105,
"grad_norm": 0.07218307256698608,
"learning_rate": 1.380907408106985e-06,
"loss": 0.0007,
"step": 246528
},
{
"epoch": 9.322806089683048,
"grad_norm": 0.00684273662045598,
"learning_rate": 1.361565486759095e-06,
"loss": 0.0005,
"step": 246784
},
{
"epoch": 9.332477050356994,
"grad_norm": 0.0004243789007887244,
"learning_rate": 1.34229911979147e-06,
"loss": 0.0005,
"step": 247040
},
{
"epoch": 9.34214801103094,
"grad_norm": 0.000982985831797123,
"learning_rate": 1.32295719844358e-06,
"loss": 0.0009,
"step": 247296
},
{
"epoch": 9.351818971704885,
"grad_norm": 0.008006760850548744,
"learning_rate": 1.3036152770956897e-06,
"loss": 0.0008,
"step": 247552
},
{
"epoch": 9.361489932378829,
"grad_norm": 0.0012839402770623565,
"learning_rate": 1.2842733557477996e-06,
"loss": 0.0012,
"step": 247808
},
{
"epoch": 9.371160893052775,
"grad_norm": 0.0076642511412501335,
"learning_rate": 1.2649314343999095e-06,
"loss": 0.0007,
"step": 248064
},
{
"epoch": 9.38083185372672,
"grad_norm": 0.0976879671216011,
"learning_rate": 1.2455895130520192e-06,
"loss": 0.0006,
"step": 248320
},
{
"epoch": 9.390502814400666,
"grad_norm": 2.341963291168213,
"learning_rate": 1.2262475917041291e-06,
"loss": 0.0009,
"step": 248576
},
{
"epoch": 9.40017377507461,
"grad_norm": 0.002288688672706485,
"learning_rate": 1.206905670356239e-06,
"loss": 0.0007,
"step": 248832
},
{
"epoch": 9.409844735748555,
"grad_norm": 0.0005827232380397618,
"learning_rate": 1.187563749008349e-06,
"loss": 0.0009,
"step": 249088
},
{
"epoch": 9.4195156964225,
"grad_norm": 0.00030542805325239897,
"learning_rate": 1.1682218276604587e-06,
"loss": 0.0007,
"step": 249344
},
{
"epoch": 9.429186657096444,
"grad_norm": 0.00033465458545833826,
"learning_rate": 1.1488799063125686e-06,
"loss": 0.0007,
"step": 249600
},
{
"epoch": 9.43885761777039,
"grad_norm": 0.0005558193661272526,
"learning_rate": 1.1295379849646785e-06,
"loss": 0.001,
"step": 249856
},
{
"epoch": 9.448528578444336,
"grad_norm": 0.008819201961159706,
"learning_rate": 1.1101960636167882e-06,
"loss": 0.0008,
"step": 250112
},
{
"epoch": 9.458199539118281,
"grad_norm": 0.011124982498586178,
"learning_rate": 1.0908541422688981e-06,
"loss": 0.001,
"step": 250368
},
{
"epoch": 9.467870499792225,
"grad_norm": 0.07561460882425308,
"learning_rate": 1.071512220921008e-06,
"loss": 0.001,
"step": 250624
},
{
"epoch": 9.47754146046617,
"grad_norm": 0.00775932939723134,
"learning_rate": 1.0521702995731177e-06,
"loss": 0.0008,
"step": 250880
},
{
"epoch": 9.487212421140116,
"grad_norm": 0.0026791319251060486,
"learning_rate": 1.032903932605493e-06,
"loss": 0.0009,
"step": 251136
},
{
"epoch": 9.49688338181406,
"grad_norm": 0.0014814439928159118,
"learning_rate": 1.0135620112576027e-06,
"loss": 0.0009,
"step": 251392
},
{
"epoch": 9.506554342488005,
"grad_norm": 0.17079958319664001,
"learning_rate": 9.942200899097126e-07,
"loss": 0.0008,
"step": 251648
},
{
"epoch": 9.516225303161951,
"grad_norm": 0.006455567199736834,
"learning_rate": 9.748781685618225e-07,
"loss": 0.0008,
"step": 251904
},
{
"epoch": 9.525896263835897,
"grad_norm": 0.0035214037634432316,
"learning_rate": 9.555362472139324e-07,
"loss": 0.0003,
"step": 252160
},
{
"epoch": 9.53556722450984,
"grad_norm": 0.0005882234545424581,
"learning_rate": 9.361943258660422e-07,
"loss": 0.0004,
"step": 252416
},
{
"epoch": 9.545238185183786,
"grad_norm": 0.00487788300961256,
"learning_rate": 9.168524045181521e-07,
"loss": 0.0011,
"step": 252672
},
{
"epoch": 9.554909145857732,
"grad_norm": 0.0005454017664305866,
"learning_rate": 8.975104831702619e-07,
"loss": 0.0009,
"step": 252928
},
{
"epoch": 9.564580106531675,
"grad_norm": 0.0002963479782920331,
"learning_rate": 8.782441162026368e-07,
"loss": 0.0008,
"step": 253184
},
{
"epoch": 9.574251067205621,
"grad_norm": 0.014803556725382805,
"learning_rate": 8.589021948547467e-07,
"loss": 0.0007,
"step": 253440
},
{
"epoch": 9.583922027879566,
"grad_norm": 0.0010204812278971076,
"learning_rate": 8.395602735068565e-07,
"loss": 0.0006,
"step": 253696
},
{
"epoch": 9.593592988553512,
"grad_norm": 0.000603766180574894,
"learning_rate": 8.202183521589665e-07,
"loss": 0.0005,
"step": 253952
},
{
"epoch": 9.603263949227456,
"grad_norm": 0.0006934937555342913,
"learning_rate": 8.008764308110763e-07,
"loss": 0.0004,
"step": 254208
},
{
"epoch": 9.612934909901401,
"grad_norm": 0.002163499826565385,
"learning_rate": 7.815345094631861e-07,
"loss": 0.0012,
"step": 254464
},
{
"epoch": 9.622605870575347,
"grad_norm": 0.009007874876260757,
"learning_rate": 7.62192588115296e-07,
"loss": 0.0009,
"step": 254720
},
{
"epoch": 9.632276831249293,
"grad_norm": 0.001189779955893755,
"learning_rate": 7.42850666767406e-07,
"loss": 0.0007,
"step": 254976
},
{
"epoch": 9.641947791923236,
"grad_norm": 0.006172012072056532,
"learning_rate": 7.235087454195158e-07,
"loss": 0.0008,
"step": 255232
},
{
"epoch": 9.651618752597182,
"grad_norm": 0.0028820731677114964,
"learning_rate": 7.041668240716256e-07,
"loss": 0.0009,
"step": 255488
},
{
"epoch": 9.661289713271128,
"grad_norm": 0.002549013588577509,
"learning_rate": 6.848249027237356e-07,
"loss": 0.0005,
"step": 255744
},
{
"epoch": 9.670960673945071,
"grad_norm": 0.0011592130176723003,
"learning_rate": 6.654829813758454e-07,
"loss": 0.0005,
"step": 256000
},
{
"epoch": 9.680631634619017,
"grad_norm": 0.009473592974245548,
"learning_rate": 6.461410600279553e-07,
"loss": 0.0006,
"step": 256256
},
{
"epoch": 9.690302595292962,
"grad_norm": 0.013225371949374676,
"learning_rate": 6.267991386800651e-07,
"loss": 0.0006,
"step": 256512
},
{
"epoch": 9.699973555966906,
"grad_norm": 0.0005315671442076564,
"learning_rate": 6.0753277171244e-07,
"loss": 0.0009,
"step": 256768
},
{
"epoch": 9.709644516640852,
"grad_norm": 0.07691678404808044,
"learning_rate": 5.881908503645499e-07,
"loss": 0.001,
"step": 257024
},
{
"epoch": 9.719315477314797,
"grad_norm": 0.00017236363783013076,
"learning_rate": 5.688489290166599e-07,
"loss": 0.0007,
"step": 257280
},
{
"epoch": 9.728986437988743,
"grad_norm": 0.00099793984554708,
"learning_rate": 5.495070076687697e-07,
"loss": 0.0016,
"step": 257536
},
{
"epoch": 9.738657398662687,
"grad_norm": 0.0005514703807421029,
"learning_rate": 5.301650863208795e-07,
"loss": 0.0004,
"step": 257792
},
{
"epoch": 9.748328359336632,
"grad_norm": 0.0029203654266893864,
"learning_rate": 5.108231649729894e-07,
"loss": 0.0007,
"step": 258048
},
{
"epoch": 9.757999320010578,
"grad_norm": 0.0004254644736647606,
"learning_rate": 4.914812436250992e-07,
"loss": 0.0016,
"step": 258304
},
{
"epoch": 9.767670280684523,
"grad_norm": 0.0031043547205626965,
"learning_rate": 4.721393222772091e-07,
"loss": 0.0005,
"step": 258560
},
{
"epoch": 9.777341241358467,
"grad_norm": 0.002943431492894888,
"learning_rate": 4.5279740092931894e-07,
"loss": 0.0008,
"step": 258816
},
{
"epoch": 9.787012202032413,
"grad_norm": 0.00015551786054857075,
"learning_rate": 4.334554795814288e-07,
"loss": 0.0011,
"step": 259072
},
{
"epoch": 9.796683162706358,
"grad_norm": 0.0021992865949869156,
"learning_rate": 4.1411355823353867e-07,
"loss": 0.0011,
"step": 259328
},
{
"epoch": 9.806354123380302,
"grad_norm": 0.3576786518096924,
"learning_rate": 3.947716368856485e-07,
"loss": 0.0011,
"step": 259584
},
{
"epoch": 9.816025084054248,
"grad_norm": 0.001682179281488061,
"learning_rate": 3.7542971553775834e-07,
"loss": 0.0007,
"step": 259840
},
{
"epoch": 9.825696044728193,
"grad_norm": 0.0001894651068141684,
"learning_rate": 3.560877941898682e-07,
"loss": 0.0007,
"step": 260096
},
{
"epoch": 9.835367005402139,
"grad_norm": 0.11490330845117569,
"learning_rate": 3.3674587284197807e-07,
"loss": 0.0006,
"step": 260352
},
{
"epoch": 9.845037966076083,
"grad_norm": 0.00011810084106400609,
"learning_rate": 3.1740395149408793e-07,
"loss": 0.0005,
"step": 260608
},
{
"epoch": 9.854708926750028,
"grad_norm": 0.0006803704309277236,
"learning_rate": 2.9806203014619774e-07,
"loss": 0.0005,
"step": 260864
},
{
"epoch": 9.864379887423974,
"grad_norm": 0.0036548932548612356,
"learning_rate": 2.787201087983076e-07,
"loss": 0.0007,
"step": 261120
},
{
"epoch": 9.874050848097918,
"grad_norm": 0.0011051982874050736,
"learning_rate": 2.5937818745041747e-07,
"loss": 0.0009,
"step": 261376
},
{
"epoch": 9.883721808771863,
"grad_norm": 0.010463064536452293,
"learning_rate": 2.4003626610252733e-07,
"loss": 0.0006,
"step": 261632
},
{
"epoch": 9.893392769445809,
"grad_norm": 0.0015552444383502007,
"learning_rate": 2.2069434475463717e-07,
"loss": 0.0004,
"step": 261888
},
{
"epoch": 9.903063730119754,
"grad_norm": 0.00023192820663098246,
"learning_rate": 2.0135242340674704e-07,
"loss": 0.0005,
"step": 262144
},
{
"epoch": 9.912734690793698,
"grad_norm": 2.180852174758911,
"learning_rate": 1.8201050205885687e-07,
"loss": 0.0008,
"step": 262400
},
{
"epoch": 9.922405651467644,
"grad_norm": 0.2690439820289612,
"learning_rate": 1.6266858071096674e-07,
"loss": 0.0005,
"step": 262656
},
{
"epoch": 9.93207661214159,
"grad_norm": 0.0014845479745417833,
"learning_rate": 1.4340221374334178e-07,
"loss": 0.0007,
"step": 262912
},
{
"epoch": 9.941747572815533,
"grad_norm": 0.0010751072550192475,
"learning_rate": 1.2406029239545164e-07,
"loss": 0.0017,
"step": 263168
},
{
"epoch": 9.951418533489479,
"grad_norm": 0.005477603990584612,
"learning_rate": 1.0479392542782669e-07,
"loss": 0.0003,
"step": 263424
},
{
"epoch": 9.961089494163424,
"grad_norm": 0.003662185976281762,
"learning_rate": 8.545200407993654e-08,
"loss": 0.001,
"step": 263680
},
{
"epoch": 9.97076045483737,
"grad_norm": 0.0006105359643697739,
"learning_rate": 6.611008273204639e-08,
"loss": 0.001,
"step": 263936
},
{
"epoch": 9.980431415511314,
"grad_norm": 0.0005147479241713881,
"learning_rate": 4.676816138415625e-08,
"loss": 0.0006,
"step": 264192
},
{
"epoch": 9.99010237618526,
"grad_norm": 0.002465909579768777,
"learning_rate": 2.7426240036266103e-08,
"loss": 0.0007,
"step": 264448
},
{
"epoch": 9.999773336859205,
"grad_norm": 0.0049901618622243404,
"learning_rate": 8.084318688375959e-09,
"loss": 0.0008,
"step": 264704
},
{
"epoch": 10.0,
"eval_f1_B-DISEASE": 0.8212511199804513,
"eval_f1_B-MEDICATION": 0.9441194996850535,
"eval_f1_B-PROCEDURE": 0.8438837081733407,
"eval_f1_B-SYMPTOM": 0.8142008132624335,
"eval_f1_I-DISEASE": 0.8531332420369243,
"eval_f1_I-MEDICATION": 0.9504971609841921,
"eval_f1_I-PROCEDURE": 0.855959918699867,
"eval_f1_I-SYMPTOM": 0.8203061784176257,
"eval_f1_O": 0.9279796337095003,
"eval_f1_macro": 0.870147919438821,
"eval_f1_micro": 0.8940428457113243,
"eval_loss": 0.5246506333351135,
"eval_precision_B-DISEASE": 0.8439357160793505,
"eval_precision_B-MEDICATION": 0.9548598471059337,
"eval_precision_B-PROCEDURE": 0.8662552367223749,
"eval_precision_B-SYMPTOM": 0.8270493539504342,
"eval_precision_I-DISEASE": 0.8624838159699522,
"eval_precision_I-MEDICATION": 0.9581855315489627,
"eval_precision_I-PROCEDURE": 0.8779157051309547,
"eval_precision_I-SYMPTOM": 0.8292179488587081,
"eval_precision_O": 0.9223528464068083,
"eval_precision_macro": 0.8824728890859421,
"eval_precision_micro": 0.8962622493770654,
"eval_rauc_macro": 0.918932582829971,
"eval_rauc_micro": 0.9393388823070546,
"eval_recall_B-DISEASE": 0.7997541048623781,
"eval_recall_B-MEDICATION": 0.9336180815091654,
"eval_recall_B-PROCEDURE": 0.8226386036960985,
"eval_recall_B-SYMPTOM": 0.8017453798767967,
"eval_recall_I-DISEASE": 0.8439832411344849,
"eval_recall_I-MEDICATION": 0.942931189506532,
"eval_recall_I-PROCEDURE": 0.8350755220446033,
"eval_recall_I-SYMPTOM": 0.8115839243498818,
"eval_recall_O": 0.9336754945048357,
"eval_recall_macro": 0.858333949053864,
"eval_recall_micro": 0.8918344066604195,
"eval_roc_auc_B-DISEASE": 0.898501130076159,
"eval_roc_auc_B-MEDICATION": 0.9667188383374489,
"eval_roc_auc_B-PROCEDURE": 0.9102252873491329,
"eval_roc_auc_B-SYMPTOM": 0.8990597025985936,
"eval_roc_auc_I-DISEASE": 0.9132048321619536,
"eval_roc_auc_I-MEDICATION": 0.9711798590609849,
"eval_roc_auc_I-PROCEDURE": 0.9118804724182935,
"eval_roc_auc_I-SYMPTOM": 0.8927663421914375,
"eval_roc_auc_O": 0.9068567812757345,
"eval_runtime": 60.9219,
"eval_samples_per_second": 178.474,
"eval_steps_per_second": 22.324,
"step": 264710
}
],
"logging_steps": 256,
"max_steps": 264710,
"num_input_tokens_seen": 0,
"num_train_epochs": 10,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 1.5034084397459712e+18,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}