| { |
| "best_metric": 0.6937354988399073, |
| "best_model_checkpoint": "outputs/models/distilbert-clinical-ner/checkpoint-770", |
| "epoch": 77.0, |
| "eval_steps": 500, |
| "global_step": 770, |
| "is_hyper_param_search": false, |
| "is_local_process_zero": true, |
| "is_world_process_zero": true, |
| "log_history": [ |
| { |
| "epoch": 1.0, |
| "eval_f1": 0.019590382902938554, |
| "eval_loss": 4.235354900360107, |
| "eval_precision": 0.01608187134502924, |
| "eval_recall": 0.025056947608200455, |
| "eval_runtime": 0.1555, |
| "eval_samples_per_second": 128.613, |
| "eval_steps_per_second": 12.861, |
| "step": 10 |
| }, |
| { |
| "epoch": 2.0, |
| "eval_f1": 0.023399014778325126, |
| "eval_loss": 4.040920734405518, |
| "eval_precision": 0.02546916890080429, |
| "eval_recall": 0.02164009111617312, |
| "eval_runtime": 0.1064, |
| "eval_samples_per_second": 187.984, |
| "eval_steps_per_second": 18.798, |
| "step": 20 |
| }, |
| { |
| "epoch": 3.0, |
| "eval_f1": 0.0045045045045045045, |
| "eval_loss": 3.6175544261932373, |
| "eval_precision": 0.2, |
| "eval_recall": 0.002277904328018223, |
| "eval_runtime": 0.1035, |
| "eval_samples_per_second": 193.236, |
| "eval_steps_per_second": 19.324, |
| "step": 30 |
| }, |
| { |
| "epoch": 4.0, |
| "eval_f1": 0.0, |
| "eval_loss": 3.0632073879241943, |
| "eval_precision": 0.0, |
| "eval_recall": 0.0, |
| "eval_runtime": 0.1056, |
| "eval_samples_per_second": 189.304, |
| "eval_steps_per_second": 18.93, |
| "step": 40 |
| }, |
| { |
| "epoch": 5.0, |
| "grad_norm": 2.285052537918091, |
| "learning_rate": 1e-05, |
| "loss": 3.7184, |
| "step": 50 |
| }, |
| { |
| "epoch": 5.0, |
| "eval_f1": 0.0, |
| "eval_loss": 2.6725738048553467, |
| "eval_precision": 0.0, |
| "eval_recall": 0.0, |
| "eval_runtime": 0.1038, |
| "eval_samples_per_second": 192.708, |
| "eval_steps_per_second": 19.271, |
| "step": 50 |
| }, |
| { |
| "epoch": 6.0, |
| "eval_f1": 0.0022753128555176336, |
| "eval_loss": 2.3172459602355957, |
| "eval_precision": 1.0, |
| "eval_recall": 0.0011389521640091116, |
| "eval_runtime": 0.1056, |
| "eval_samples_per_second": 189.369, |
| "eval_steps_per_second": 18.937, |
| "step": 60 |
| }, |
| { |
| "epoch": 7.0, |
| "eval_f1": 0.24705882352941175, |
| "eval_loss": 2.010183334350586, |
| "eval_precision": 0.34854771784232363, |
| "eval_recall": 0.19134396355353075, |
| "eval_runtime": 0.1045, |
| "eval_samples_per_second": 191.384, |
| "eval_steps_per_second": 19.138, |
| "step": 70 |
| }, |
| { |
| "epoch": 8.0, |
| "eval_f1": 0.3578104138851802, |
| "eval_loss": 1.7770382165908813, |
| "eval_precision": 0.432258064516129, |
| "eval_recall": 0.3052391799544419, |
| "eval_runtime": 0.1043, |
| "eval_samples_per_second": 191.78, |
| "eval_steps_per_second": 19.178, |
| "step": 80 |
| }, |
| { |
| "epoch": 9.0, |
| "eval_f1": 0.4306709265175719, |
| "eval_loss": 1.578804612159729, |
| "eval_precision": 0.49053857350800584, |
| "eval_recall": 0.3838268792710706, |
| "eval_runtime": 0.1049, |
| "eval_samples_per_second": 190.736, |
| "eval_steps_per_second": 19.074, |
| "step": 90 |
| }, |
| { |
| "epoch": 10.0, |
| "grad_norm": 1.6135512590408325, |
| "learning_rate": 2e-05, |
| "loss": 2.0341, |
| "step": 100 |
| }, |
| { |
| "epoch": 10.0, |
| "eval_f1": 0.5129151291512916, |
| "eval_loss": 1.4062659740447998, |
| "eval_precision": 0.5574866310160428, |
| "eval_recall": 0.47494305239179957, |
| "eval_runtime": 0.1053, |
| "eval_samples_per_second": 189.876, |
| "eval_steps_per_second": 18.988, |
| "step": 100 |
| }, |
| { |
| "epoch": 11.0, |
| "eval_f1": 0.5652435357787132, |
| "eval_loss": 1.2971620559692383, |
| "eval_precision": 0.5987261146496815, |
| "eval_recall": 0.5353075170842825, |
| "eval_runtime": 0.1046, |
| "eval_samples_per_second": 191.215, |
| "eval_steps_per_second": 19.122, |
| "step": 110 |
| }, |
| { |
| "epoch": 12.0, |
| "eval_f1": 0.5844155844155845, |
| "eval_loss": 1.22593092918396, |
| "eval_precision": 0.6066176470588235, |
| "eval_recall": 0.5637813211845103, |
| "eval_runtime": 0.1052, |
| "eval_samples_per_second": 190.037, |
| "eval_steps_per_second": 19.004, |
| "step": 120 |
| }, |
| { |
| "epoch": 13.0, |
| "eval_f1": 0.6020642201834862, |
| "eval_loss": 1.1731911897659302, |
| "eval_precision": 0.6062355658198614, |
| "eval_recall": 0.5979498861047836, |
| "eval_runtime": 0.1047, |
| "eval_samples_per_second": 190.934, |
| "eval_steps_per_second": 19.093, |
| "step": 130 |
| }, |
| { |
| "epoch": 14.0, |
| "eval_f1": 0.6093023255813953, |
| "eval_loss": 1.1392405033111572, |
| "eval_precision": 0.6223277909738717, |
| "eval_recall": 0.5968109339407744, |
| "eval_runtime": 0.1076, |
| "eval_samples_per_second": 185.839, |
| "eval_steps_per_second": 18.584, |
| "step": 140 |
| }, |
| { |
| "epoch": 15.0, |
| "grad_norm": 1.8851341009140015, |
| "learning_rate": 1.888888888888889e-05, |
| "loss": 1.0843, |
| "step": 150 |
| }, |
| { |
| "epoch": 15.0, |
| "eval_f1": 0.6329849012775842, |
| "eval_loss": 1.1109048128128052, |
| "eval_precision": 0.6457345971563981, |
| "eval_recall": 0.6207289293849658, |
| "eval_runtime": 0.1045, |
| "eval_samples_per_second": 191.342, |
| "eval_steps_per_second": 19.134, |
| "step": 150 |
| }, |
| { |
| "epoch": 16.0, |
| "eval_f1": 0.6323103647944412, |
| "eval_loss": 1.111675500869751, |
| "eval_precision": 0.6431095406360424, |
| "eval_recall": 0.621867881548975, |
| "eval_runtime": 0.1064, |
| "eval_samples_per_second": 187.947, |
| "eval_steps_per_second": 18.795, |
| "step": 160 |
| }, |
| { |
| "epoch": 17.0, |
| "eval_f1": 0.6406976744186046, |
| "eval_loss": 1.1105479001998901, |
| "eval_precision": 0.6543942992874109, |
| "eval_recall": 0.6275626423690205, |
| "eval_runtime": 0.1038, |
| "eval_samples_per_second": 192.723, |
| "eval_steps_per_second": 19.272, |
| "step": 170 |
| }, |
| { |
| "epoch": 18.0, |
| "eval_f1": 0.6418338108882521, |
| "eval_loss": 1.1081936359405518, |
| "eval_precision": 0.6459054209919262, |
| "eval_recall": 0.6378132118451025, |
| "eval_runtime": 0.1093, |
| "eval_samples_per_second": 182.962, |
| "eval_steps_per_second": 18.296, |
| "step": 180 |
| }, |
| { |
| "epoch": 19.0, |
| "eval_f1": 0.656629994209612, |
| "eval_loss": 1.0905473232269287, |
| "eval_precision": 0.6678445229681979, |
| "eval_recall": 0.6457858769931663, |
| "eval_runtime": 0.1058, |
| "eval_samples_per_second": 189.016, |
| "eval_steps_per_second": 18.902, |
| "step": 190 |
| }, |
| { |
| "epoch": 20.0, |
| "grad_norm": 2.453874111175537, |
| "learning_rate": 1.7777777777777777e-05, |
| "loss": 0.6709, |
| "step": 200 |
| }, |
| { |
| "epoch": 20.0, |
| "eval_f1": 0.6527536231884057, |
| "eval_loss": 1.0979650020599365, |
| "eval_precision": 0.6646989374262101, |
| "eval_recall": 0.6412300683371298, |
| "eval_runtime": 0.1051, |
| "eval_samples_per_second": 190.38, |
| "eval_steps_per_second": 19.038, |
| "step": 200 |
| }, |
| { |
| "epoch": 21.0, |
| "eval_f1": 0.660889659156557, |
| "eval_loss": 1.1073075532913208, |
| "eval_precision": 0.6705744431418523, |
| "eval_recall": 0.6514806378132119, |
| "eval_runtime": 0.1063, |
| "eval_samples_per_second": 188.158, |
| "eval_steps_per_second": 18.816, |
| "step": 210 |
| }, |
| { |
| "epoch": 22.0, |
| "eval_f1": 0.6520231213872832, |
| "eval_loss": 1.109878420829773, |
| "eval_precision": 0.6619718309859155, |
| "eval_recall": 0.642369020501139, |
| "eval_runtime": 0.1108, |
| "eval_samples_per_second": 180.582, |
| "eval_steps_per_second": 18.058, |
| "step": 220 |
| }, |
| { |
| "epoch": 23.0, |
| "eval_f1": 0.6666666666666666, |
| "eval_loss": 1.1079308986663818, |
| "eval_precision": 0.6838323353293413, |
| "eval_recall": 0.6503416856492027, |
| "eval_runtime": 0.1051, |
| "eval_samples_per_second": 190.371, |
| "eval_steps_per_second": 19.037, |
| "step": 230 |
| }, |
| { |
| "epoch": 24.0, |
| "eval_f1": 0.6685714285714285, |
| "eval_loss": 1.0995490550994873, |
| "eval_precision": 0.6708715596330275, |
| "eval_recall": 0.6662870159453302, |
| "eval_runtime": 0.1076, |
| "eval_samples_per_second": 185.917, |
| "eval_steps_per_second": 18.592, |
| "step": 240 |
| }, |
| { |
| "epoch": 25.0, |
| "grad_norm": 1.9804632663726807, |
| "learning_rate": 1.6666666666666667e-05, |
| "loss": 0.4563, |
| "step": 250 |
| }, |
| { |
| "epoch": 25.0, |
| "eval_f1": 0.6623831775700935, |
| "eval_loss": 1.1412475109100342, |
| "eval_precision": 0.6798561151079137, |
| "eval_recall": 0.6457858769931663, |
| "eval_runtime": 0.1043, |
| "eval_samples_per_second": 191.672, |
| "eval_steps_per_second": 19.167, |
| "step": 250 |
| }, |
| { |
| "epoch": 26.0, |
| "eval_f1": 0.6685878962536023, |
| "eval_loss": 1.1206316947937012, |
| "eval_precision": 0.676779463243874, |
| "eval_recall": 0.6605922551252847, |
| "eval_runtime": 0.1025, |
| "eval_samples_per_second": 195.213, |
| "eval_steps_per_second": 19.521, |
| "step": 260 |
| }, |
| { |
| "epoch": 27.0, |
| "eval_f1": 0.674013921113689, |
| "eval_loss": 1.1223537921905518, |
| "eval_precision": 0.6867612293144209, |
| "eval_recall": 0.6617312072892938, |
| "eval_runtime": 0.1023, |
| "eval_samples_per_second": 195.488, |
| "eval_steps_per_second": 19.549, |
| "step": 270 |
| }, |
| { |
| "epoch": 28.0, |
| "eval_f1": 0.6787595084844938, |
| "eval_loss": 1.1268706321716309, |
| "eval_precision": 0.6979542719614922, |
| "eval_recall": 0.6605922551252847, |
| "eval_runtime": 0.107, |
| "eval_samples_per_second": 186.844, |
| "eval_steps_per_second": 18.684, |
| "step": 280 |
| }, |
| { |
| "epoch": 29.0, |
| "eval_f1": 0.6817391304347827, |
| "eval_loss": 1.143689751625061, |
| "eval_precision": 0.6942148760330579, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1048, |
| "eval_samples_per_second": 190.916, |
| "eval_steps_per_second": 19.092, |
| "step": 290 |
| }, |
| { |
| "epoch": 30.0, |
| "grad_norm": 1.2570631504058838, |
| "learning_rate": 1.555555555555556e-05, |
| "loss": 0.3229, |
| "step": 300 |
| }, |
| { |
| "epoch": 30.0, |
| "eval_f1": 0.6781807714450201, |
| "eval_loss": 1.1411770582199097, |
| "eval_precision": 0.6856810244470314, |
| "eval_recall": 0.6708428246013668, |
| "eval_runtime": 0.1118, |
| "eval_samples_per_second": 178.865, |
| "eval_steps_per_second": 17.887, |
| "step": 300 |
| }, |
| { |
| "epoch": 31.0, |
| "eval_f1": 0.6797235023041475, |
| "eval_loss": 1.1665282249450684, |
| "eval_precision": 0.6876456876456877, |
| "eval_recall": 0.6719817767653758, |
| "eval_runtime": 0.1061, |
| "eval_samples_per_second": 188.516, |
| "eval_steps_per_second": 18.852, |
| "step": 310 |
| }, |
| { |
| "epoch": 32.0, |
| "eval_f1": 0.6785714285714286, |
| "eval_loss": 1.147858738899231, |
| "eval_precision": 0.6864801864801865, |
| "eval_recall": 0.6708428246013668, |
| "eval_runtime": 0.1079, |
| "eval_samples_per_second": 185.36, |
| "eval_steps_per_second": 18.536, |
| "step": 320 |
| }, |
| { |
| "epoch": 33.0, |
| "eval_f1": 0.6774193548387096, |
| "eval_loss": 1.1554282903671265, |
| "eval_precision": 0.6853146853146853, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1037, |
| "eval_samples_per_second": 192.925, |
| "eval_steps_per_second": 19.292, |
| "step": 330 |
| }, |
| { |
| "epoch": 34.0, |
| "eval_f1": 0.6797687861271676, |
| "eval_loss": 1.15742027759552, |
| "eval_precision": 0.6901408450704225, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1053, |
| "eval_samples_per_second": 189.904, |
| "eval_steps_per_second": 18.99, |
| "step": 340 |
| }, |
| { |
| "epoch": 35.0, |
| "grad_norm": 1.0945429801940918, |
| "learning_rate": 1.4444444444444446e-05, |
| "loss": 0.2396, |
| "step": 350 |
| }, |
| { |
| "epoch": 35.0, |
| "eval_f1": 0.6797235023041475, |
| "eval_loss": 1.1754865646362305, |
| "eval_precision": 0.6876456876456877, |
| "eval_recall": 0.6719817767653758, |
| "eval_runtime": 0.1057, |
| "eval_samples_per_second": 189.199, |
| "eval_steps_per_second": 18.92, |
| "step": 350 |
| }, |
| { |
| "epoch": 36.0, |
| "eval_f1": 0.6735870818915801, |
| "eval_loss": 1.1885067224502563, |
| "eval_precision": 0.6822429906542056, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1, |
| "eval_samples_per_second": 200.0, |
| "eval_steps_per_second": 20.0, |
| "step": 360 |
| }, |
| { |
| "epoch": 37.0, |
| "eval_f1": 0.6806526806526807, |
| "eval_loss": 1.181584119796753, |
| "eval_precision": 0.6968973747016707, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1076, |
| "eval_samples_per_second": 185.858, |
| "eval_steps_per_second": 18.586, |
| "step": 370 |
| }, |
| { |
| "epoch": 38.0, |
| "eval_f1": 0.6787172011661807, |
| "eval_loss": 1.1876161098480225, |
| "eval_precision": 0.6953405017921147, |
| "eval_recall": 0.662870159453303, |
| "eval_runtime": 0.1161, |
| "eval_samples_per_second": 172.269, |
| "eval_steps_per_second": 17.227, |
| "step": 380 |
| }, |
| { |
| "epoch": 39.0, |
| "eval_f1": 0.6818713450292397, |
| "eval_loss": 1.2116471529006958, |
| "eval_precision": 0.7007211538461539, |
| "eval_recall": 0.664009111617312, |
| "eval_runtime": 0.1027, |
| "eval_samples_per_second": 194.71, |
| "eval_steps_per_second": 19.471, |
| "step": 390 |
| }, |
| { |
| "epoch": 40.0, |
| "grad_norm": 0.8599975109100342, |
| "learning_rate": 1.3333333333333333e-05, |
| "loss": 0.1848, |
| "step": 400 |
| }, |
| { |
| "epoch": 40.0, |
| "eval_f1": 0.6786542923433874, |
| "eval_loss": 1.1997044086456299, |
| "eval_precision": 0.6914893617021277, |
| "eval_recall": 0.6662870159453302, |
| "eval_runtime": 0.1098, |
| "eval_samples_per_second": 182.124, |
| "eval_steps_per_second": 18.212, |
| "step": 400 |
| }, |
| { |
| "epoch": 41.0, |
| "eval_f1": 0.6817917393833625, |
| "eval_loss": 1.2281190156936646, |
| "eval_precision": 0.6967895362663495, |
| "eval_recall": 0.6674259681093394, |
| "eval_runtime": 0.1026, |
| "eval_samples_per_second": 195.027, |
| "eval_steps_per_second": 19.503, |
| "step": 410 |
| }, |
| { |
| "epoch": 42.0, |
| "eval_f1": 0.6820542412002308, |
| "eval_loss": 1.205224633216858, |
| "eval_precision": 0.6912280701754386, |
| "eval_recall": 0.673120728929385, |
| "eval_runtime": 0.1029, |
| "eval_samples_per_second": 194.454, |
| "eval_steps_per_second": 19.445, |
| "step": 420 |
| }, |
| { |
| "epoch": 43.0, |
| "eval_f1": 0.6834112149532711, |
| "eval_loss": 1.2441879510879517, |
| "eval_precision": 0.7014388489208633, |
| "eval_recall": 0.6662870159453302, |
| "eval_runtime": 0.1013, |
| "eval_samples_per_second": 197.51, |
| "eval_steps_per_second": 19.751, |
| "step": 430 |
| }, |
| { |
| "epoch": 44.0, |
| "eval_f1": 0.6762672811059909, |
| "eval_loss": 1.2410287857055664, |
| "eval_precision": 0.6841491841491841, |
| "eval_recall": 0.6685649202733486, |
| "eval_runtime": 0.1039, |
| "eval_samples_per_second": 192.454, |
| "eval_steps_per_second": 19.245, |
| "step": 440 |
| }, |
| { |
| "epoch": 45.0, |
| "grad_norm": 0.8666434288024902, |
| "learning_rate": 1.2222222222222224e-05, |
| "loss": 0.1472, |
| "step": 450 |
| }, |
| { |
| "epoch": 45.0, |
| "eval_f1": 0.6809744779582366, |
| "eval_loss": 1.2373775243759155, |
| "eval_precision": 0.693853427895981, |
| "eval_recall": 0.6685649202733486, |
| "eval_runtime": 0.1016, |
| "eval_samples_per_second": 196.912, |
| "eval_steps_per_second": 19.691, |
| "step": 450 |
| }, |
| { |
| "epoch": 46.0, |
| "eval_f1": 0.6786961583236321, |
| "eval_loss": 1.237067461013794, |
| "eval_precision": 0.694047619047619, |
| "eval_recall": 0.664009111617312, |
| "eval_runtime": 0.1002, |
| "eval_samples_per_second": 199.663, |
| "eval_steps_per_second": 19.966, |
| "step": 460 |
| }, |
| { |
| "epoch": 47.0, |
| "eval_f1": 0.6889016676250718, |
| "eval_loss": 1.2270065546035767, |
| "eval_precision": 0.6957026713124274, |
| "eval_recall": 0.6822323462414579, |
| "eval_runtime": 0.1051, |
| "eval_samples_per_second": 190.295, |
| "eval_steps_per_second": 19.03, |
| "step": 470 |
| }, |
| { |
| "epoch": 48.0, |
| "eval_f1": 0.6805555555555555, |
| "eval_loss": 1.238765001296997, |
| "eval_precision": 0.691764705882353, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1066, |
| "eval_samples_per_second": 187.677, |
| "eval_steps_per_second": 18.768, |
| "step": 480 |
| }, |
| { |
| "epoch": 49.0, |
| "eval_f1": 0.6790914385556202, |
| "eval_loss": 1.2525634765625, |
| "eval_precision": 0.6948748510131109, |
| "eval_recall": 0.664009111617312, |
| "eval_runtime": 0.1021, |
| "eval_samples_per_second": 195.942, |
| "eval_steps_per_second": 19.594, |
| "step": 490 |
| }, |
| { |
| "epoch": 50.0, |
| "grad_norm": 0.8096102476119995, |
| "learning_rate": 1.1111111111111113e-05, |
| "loss": 0.1184, |
| "step": 500 |
| }, |
| { |
| "epoch": 50.0, |
| "eval_f1": 0.681421083284799, |
| "eval_loss": 1.2390888929367065, |
| "eval_precision": 0.6972586412395709, |
| "eval_recall": 0.6662870159453302, |
| "eval_runtime": 0.1042, |
| "eval_samples_per_second": 191.926, |
| "eval_steps_per_second": 19.193, |
| "step": 500 |
| }, |
| { |
| "epoch": 51.0, |
| "eval_f1": 0.6782810685249709, |
| "eval_loss": 1.2617552280426025, |
| "eval_precision": 0.6919431279620853, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1011, |
| "eval_samples_per_second": 197.736, |
| "eval_steps_per_second": 19.774, |
| "step": 510 |
| }, |
| { |
| "epoch": 52.0, |
| "eval_f1": 0.6814469078179697, |
| "eval_loss": 1.2573115825653076, |
| "eval_precision": 0.6985645933014354, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1033, |
| "eval_samples_per_second": 193.643, |
| "eval_steps_per_second": 19.364, |
| "step": 520 |
| }, |
| { |
| "epoch": 53.0, |
| "eval_f1": 0.681369704004643, |
| "eval_loss": 1.2631280422210693, |
| "eval_precision": 0.6946745562130178, |
| "eval_recall": 0.6685649202733486, |
| "eval_runtime": 0.1027, |
| "eval_samples_per_second": 194.742, |
| "eval_steps_per_second": 19.474, |
| "step": 530 |
| }, |
| { |
| "epoch": 54.0, |
| "eval_f1": 0.6822429906542057, |
| "eval_loss": 1.2612630128860474, |
| "eval_precision": 0.7002398081534772, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1034, |
| "eval_samples_per_second": 193.355, |
| "eval_steps_per_second": 19.335, |
| "step": 540 |
| }, |
| { |
| "epoch": 55.0, |
| "grad_norm": 1.258770227432251, |
| "learning_rate": 1e-05, |
| "loss": 0.0965, |
| "step": 550 |
| }, |
| { |
| "epoch": 55.0, |
| "eval_f1": 0.678592036930179, |
| "eval_loss": 1.2565994262695312, |
| "eval_precision": 0.6877192982456141, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1065, |
| "eval_samples_per_second": 187.769, |
| "eval_steps_per_second": 18.777, |
| "step": 550 |
| }, |
| { |
| "epoch": 56.0, |
| "eval_f1": 0.6720461095100864, |
| "eval_loss": 1.286030888557434, |
| "eval_precision": 0.6802800466744457, |
| "eval_recall": 0.664009111617312, |
| "eval_runtime": 0.1017, |
| "eval_samples_per_second": 196.637, |
| "eval_steps_per_second": 19.664, |
| "step": 560 |
| }, |
| { |
| "epoch": 57.0, |
| "eval_f1": 0.6774941995359629, |
| "eval_loss": 1.2746167182922363, |
| "eval_precision": 0.6903073286052009, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.104, |
| "eval_samples_per_second": 192.291, |
| "eval_steps_per_second": 19.229, |
| "step": 570 |
| }, |
| { |
| "epoch": 58.0, |
| "eval_f1": 0.6813441483198146, |
| "eval_loss": 1.2719839811325073, |
| "eval_precision": 0.6933962264150944, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1009, |
| "eval_samples_per_second": 198.12, |
| "eval_steps_per_second": 19.812, |
| "step": 580 |
| }, |
| { |
| "epoch": 59.0, |
| "eval_f1": 0.6845168800931315, |
| "eval_loss": 1.2790720462799072, |
| "eval_precision": 0.7, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1025, |
| "eval_samples_per_second": 195.09, |
| "eval_steps_per_second": 19.509, |
| "step": 590 |
| }, |
| { |
| "epoch": 60.0, |
| "grad_norm": 0.6421855688095093, |
| "learning_rate": 8.888888888888888e-06, |
| "loss": 0.0841, |
| "step": 600 |
| }, |
| { |
| "epoch": 60.0, |
| "eval_f1": 0.6827309236947792, |
| "eval_loss": 1.2661317586898804, |
| "eval_precision": 0.6878612716763006, |
| "eval_recall": 0.6776765375854215, |
| "eval_runtime": 0.1054, |
| "eval_samples_per_second": 189.834, |
| "eval_steps_per_second": 18.983, |
| "step": 600 |
| }, |
| { |
| "epoch": 61.0, |
| "eval_f1": 0.6803039158386909, |
| "eval_loss": 1.2873255014419556, |
| "eval_precision": 0.6986794717887155, |
| "eval_recall": 0.662870159453303, |
| "eval_runtime": 0.1028, |
| "eval_samples_per_second": 194.643, |
| "eval_steps_per_second": 19.464, |
| "step": 610 |
| }, |
| { |
| "epoch": 62.0, |
| "eval_f1": 0.6809248554913295, |
| "eval_loss": 1.2766045331954956, |
| "eval_precision": 0.6913145539906104, |
| "eval_recall": 0.6708428246013668, |
| "eval_runtime": 0.1044, |
| "eval_samples_per_second": 191.487, |
| "eval_steps_per_second": 19.149, |
| "step": 620 |
| }, |
| { |
| "epoch": 63.0, |
| "eval_f1": 0.6755658734764944, |
| "eval_loss": 1.2915081977844238, |
| "eval_precision": 0.6887573964497041, |
| "eval_recall": 0.662870159453303, |
| "eval_runtime": 0.1078, |
| "eval_samples_per_second": 185.542, |
| "eval_steps_per_second": 18.554, |
| "step": 630 |
| }, |
| { |
| "epoch": 64.0, |
| "eval_f1": 0.6732101616628174, |
| "eval_loss": 1.2793446779251099, |
| "eval_precision": 0.6826697892271663, |
| "eval_recall": 0.664009111617312, |
| "eval_runtime": 0.1016, |
| "eval_samples_per_second": 196.942, |
| "eval_steps_per_second": 19.694, |
| "step": 640 |
| }, |
| { |
| "epoch": 65.0, |
| "grad_norm": 0.5916463136672974, |
| "learning_rate": 7.77777777777778e-06, |
| "loss": 0.0714, |
| "step": 650 |
| }, |
| { |
| "epoch": 65.0, |
| "eval_f1": 0.6820276497695852, |
| "eval_loss": 1.3019025325775146, |
| "eval_precision": 0.6899766899766899, |
| "eval_recall": 0.6742596810933941, |
| "eval_runtime": 0.1008, |
| "eval_samples_per_second": 198.393, |
| "eval_steps_per_second": 19.839, |
| "step": 650 |
| }, |
| { |
| "epoch": 66.0, |
| "eval_f1": 0.6853473438412142, |
| "eval_loss": 1.2911741733551025, |
| "eval_precision": 0.7029940119760479, |
| "eval_recall": 0.6685649202733486, |
| "eval_runtime": 0.106, |
| "eval_samples_per_second": 188.757, |
| "eval_steps_per_second": 18.876, |
| "step": 660 |
| }, |
| { |
| "epoch": 67.0, |
| "eval_f1": 0.67816091954023, |
| "eval_loss": 1.2967917919158936, |
| "eval_precision": 0.6844547563805105, |
| "eval_recall": 0.6719817767653758, |
| "eval_runtime": 0.1092, |
| "eval_samples_per_second": 183.175, |
| "eval_steps_per_second": 18.318, |
| "step": 670 |
| }, |
| { |
| "epoch": 68.0, |
| "eval_f1": 0.6895348837209303, |
| "eval_loss": 1.2946228981018066, |
| "eval_precision": 0.7042755344418052, |
| "eval_recall": 0.6753986332574032, |
| "eval_runtime": 0.1052, |
| "eval_samples_per_second": 190.167, |
| "eval_steps_per_second": 19.017, |
| "step": 680 |
| }, |
| { |
| "epoch": 69.0, |
| "eval_f1": 0.6863425925925927, |
| "eval_loss": 1.2976857423782349, |
| "eval_precision": 0.6976470588235294, |
| "eval_recall": 0.6753986332574032, |
| "eval_runtime": 0.103, |
| "eval_samples_per_second": 194.22, |
| "eval_steps_per_second": 19.422, |
| "step": 690 |
| }, |
| { |
| "epoch": 70.0, |
| "grad_norm": 0.7995481491088867, |
| "learning_rate": 6.666666666666667e-06, |
| "loss": 0.064, |
| "step": 700 |
| }, |
| { |
| "epoch": 70.0, |
| "eval_f1": 0.6771014492753623, |
| "eval_loss": 1.295568585395813, |
| "eval_precision": 0.6894923258559622, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1031, |
| "eval_samples_per_second": 193.92, |
| "eval_steps_per_second": 19.392, |
| "step": 700 |
| }, |
| { |
| "epoch": 71.0, |
| "eval_f1": 0.6797687861271676, |
| "eval_loss": 1.2898850440979004, |
| "eval_precision": 0.6901408450704225, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.1005, |
| "eval_samples_per_second": 198.942, |
| "eval_steps_per_second": 19.894, |
| "step": 710 |
| }, |
| { |
| "epoch": 72.0, |
| "eval_f1": 0.6806526806526807, |
| "eval_loss": 1.3075172901153564, |
| "eval_precision": 0.6968973747016707, |
| "eval_recall": 0.6651480637813212, |
| "eval_runtime": 0.1087, |
| "eval_samples_per_second": 184.017, |
| "eval_steps_per_second": 18.402, |
| "step": 720 |
| }, |
| { |
| "epoch": 73.0, |
| "eval_f1": 0.683750728013978, |
| "eval_loss": 1.2973222732543945, |
| "eval_precision": 0.699642431466031, |
| "eval_recall": 0.6685649202733486, |
| "eval_runtime": 0.1054, |
| "eval_samples_per_second": 189.672, |
| "eval_steps_per_second": 18.967, |
| "step": 730 |
| }, |
| { |
| "epoch": 74.0, |
| "eval_f1": 0.6872812135355894, |
| "eval_loss": 1.3102946281433105, |
| "eval_precision": 0.7045454545454546, |
| "eval_recall": 0.6708428246013668, |
| "eval_runtime": 0.1064, |
| "eval_samples_per_second": 188.0, |
| "eval_steps_per_second": 18.8, |
| "step": 740 |
| }, |
| { |
| "epoch": 75.0, |
| "grad_norm": 0.8353786468505859, |
| "learning_rate": 5.555555555555557e-06, |
| "loss": 0.0575, |
| "step": 750 |
| }, |
| { |
| "epoch": 75.0, |
| "eval_f1": 0.6797915460335843, |
| "eval_loss": 1.3147099018096924, |
| "eval_precision": 0.6914016489988222, |
| "eval_recall": 0.6685649202733486, |
| "eval_runtime": 0.1049, |
| "eval_samples_per_second": 190.589, |
| "eval_steps_per_second": 19.059, |
| "step": 750 |
| }, |
| { |
| "epoch": 76.0, |
| "eval_f1": 0.6845168800931315, |
| "eval_loss": 1.3087732791900635, |
| "eval_precision": 0.7, |
| "eval_recall": 0.6697038724373576, |
| "eval_runtime": 0.105, |
| "eval_samples_per_second": 190.4, |
| "eval_steps_per_second": 19.04, |
| "step": 760 |
| }, |
| { |
| "epoch": 77.0, |
| "eval_f1": 0.6937354988399073, |
| "eval_loss": 1.3092721700668335, |
| "eval_precision": 0.706855791962175, |
| "eval_recall": 0.6810933940774487, |
| "eval_runtime": 0.1053, |
| "eval_samples_per_second": 189.996, |
| "eval_steps_per_second": 19.0, |
| "step": 770 |
| } |
| ], |
| "logging_steps": 50, |
| "max_steps": 1000, |
| "num_input_tokens_seen": 0, |
| "num_train_epochs": 100, |
| "save_steps": 500, |
| "stateful_callbacks": { |
| "TrainerControl": { |
| "args": { |
| "should_epoch_stop": false, |
| "should_evaluate": false, |
| "should_log": false, |
| "should_save": true, |
| "should_training_stop": false |
| }, |
| "attributes": {} |
| } |
| }, |
| "total_flos": 402935426826240.0, |
| "train_batch_size": 16, |
| "trial_name": null, |
| "trial_params": null |
| } |
|
|