Mabel44's picture
Upload 11 files
537cac6
{
"best_metric": 0.9957275483137553,
"best_model_checkpoint": "/home/obigo/mabel_folder/weights/20230807T14-16/checkpoint-3720",
"epoch": 130.0,
"global_step": 3900,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 1.0,
"eval_accuracy": 0.0,
"eval_f1": 0.022634836427939876,
"eval_loss": 0.5419425368309021,
"eval_roc_auc": 0.5090087204709872,
"eval_runtime": 0.5431,
"eval_samples_per_second": 1388.45,
"eval_steps_per_second": 5.524,
"step": 30
},
{
"epoch": 2.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.43089452385902405,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5448,
"eval_samples_per_second": 1383.892,
"eval_steps_per_second": 5.506,
"step": 60
},
{
"epoch": 3.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.3317475914955139,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5383,
"eval_samples_per_second": 1400.835,
"eval_steps_per_second": 5.574,
"step": 90
},
{
"epoch": 4.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.2464015930891037,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5361,
"eval_samples_per_second": 1406.54,
"eval_steps_per_second": 5.596,
"step": 120
},
{
"epoch": 5.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.18657957017421722,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5422,
"eval_samples_per_second": 1390.681,
"eval_steps_per_second": 5.533,
"step": 150
},
{
"epoch": 6.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.15198080241680145,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5414,
"eval_samples_per_second": 1392.668,
"eval_steps_per_second": 5.541,
"step": 180
},
{
"epoch": 7.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.13419176638126373,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5393,
"eval_samples_per_second": 1398.08,
"eval_steps_per_second": 5.563,
"step": 210
},
{
"epoch": 8.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.1253235787153244,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5439,
"eval_samples_per_second": 1386.359,
"eval_steps_per_second": 5.516,
"step": 240
},
{
"epoch": 9.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.12080227583646774,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5365,
"eval_samples_per_second": 1405.402,
"eval_steps_per_second": 5.592,
"step": 270
},
{
"epoch": 10.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.11838895082473755,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5379,
"eval_samples_per_second": 1401.621,
"eval_steps_per_second": 5.577,
"step": 300
},
{
"epoch": 11.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.11700380593538284,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5389,
"eval_samples_per_second": 1399.275,
"eval_steps_per_second": 5.567,
"step": 330
},
{
"epoch": 12.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.11613008379936218,
"eval_roc_auc": 0.5,
"eval_runtime": 0.538,
"eval_samples_per_second": 1401.41,
"eval_steps_per_second": 5.576,
"step": 360
},
{
"epoch": 13.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.11535105854272842,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5336,
"eval_samples_per_second": 1413.171,
"eval_steps_per_second": 5.623,
"step": 390
},
{
"epoch": 14.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.11359580606222153,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5384,
"eval_samples_per_second": 1400.513,
"eval_steps_per_second": 5.572,
"step": 420
},
{
"epoch": 15.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.11105558276176453,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5337,
"eval_samples_per_second": 1412.725,
"eval_steps_per_second": 5.621,
"step": 450
},
{
"epoch": 16.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.10822370648384094,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5316,
"eval_samples_per_second": 1418.454,
"eval_steps_per_second": 5.644,
"step": 480
},
{
"epoch": 16.67,
"learning_rate": 1.3076923076923078e-05,
"loss": 0.2117,
"step": 500
},
{
"epoch": 17.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.10509264469146729,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5347,
"eval_samples_per_second": 1410.035,
"eval_steps_per_second": 5.61,
"step": 510
},
{
"epoch": 18.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.10190562158823013,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5367,
"eval_samples_per_second": 1404.771,
"eval_steps_per_second": 5.589,
"step": 540
},
{
"epoch": 19.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.09861494600772858,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5384,
"eval_samples_per_second": 1400.52,
"eval_steps_per_second": 5.572,
"step": 570
},
{
"epoch": 20.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.09537718445062637,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5362,
"eval_samples_per_second": 1406.174,
"eval_steps_per_second": 5.595,
"step": 600
},
{
"epoch": 21.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0,
"eval_loss": 0.09202598035335541,
"eval_roc_auc": 0.5,
"eval_runtime": 0.5373,
"eval_samples_per_second": 1403.389,
"eval_steps_per_second": 5.584,
"step": 630
},
{
"epoch": 22.0,
"eval_accuracy": 0.0,
"eval_f1": 0.0008841732979664014,
"eval_loss": 0.08873076736927032,
"eval_roc_auc": 0.5003802281368821,
"eval_runtime": 0.5334,
"eval_samples_per_second": 1413.555,
"eval_steps_per_second": 5.624,
"step": 660
},
{
"epoch": 23.0,
"eval_accuracy": 0.0,
"eval_f1": 0.017329796640141466,
"eval_loss": 0.08568281680345535,
"eval_roc_auc": 0.5075839224767497,
"eval_runtime": 0.5336,
"eval_samples_per_second": 1413.107,
"eval_steps_per_second": 5.622,
"step": 690
},
{
"epoch": 24.0,
"eval_accuracy": 0.0,
"eval_f1": 0.05791335101679928,
"eval_loss": 0.08255316317081451,
"eval_roc_auc": 0.5277153734706096,
"eval_runtime": 0.5382,
"eval_samples_per_second": 1401.051,
"eval_steps_per_second": 5.574,
"step": 720
},
{
"epoch": 25.0,
"eval_accuracy": 0.0,
"eval_f1": 0.06352785145888594,
"eval_loss": 0.07957819849252701,
"eval_roc_auc": 0.5311477468329951,
"eval_runtime": 0.5335,
"eval_samples_per_second": 1413.239,
"eval_steps_per_second": 5.623,
"step": 750
},
{
"epoch": 26.0,
"eval_accuracy": 0.0,
"eval_f1": 0.07966401414677277,
"eval_loss": 0.07669854909181595,
"eval_roc_auc": 0.5383617613033091,
"eval_runtime": 0.537,
"eval_samples_per_second": 1404.098,
"eval_steps_per_second": 5.587,
"step": 780
},
{
"epoch": 27.0,
"eval_accuracy": 0.0,
"eval_f1": 0.08757736516357206,
"eval_loss": 0.07403922080993652,
"eval_roc_auc": 0.5429244989458949,
"eval_runtime": 0.5351,
"eval_samples_per_second": 1408.981,
"eval_steps_per_second": 5.606,
"step": 810
},
{
"epoch": 28.0,
"eval_accuracy": 0.0,
"eval_f1": 0.10030946065428825,
"eval_loss": 0.07141123712062836,
"eval_roc_auc": 0.5493986974033375,
"eval_runtime": 0.5356,
"eval_samples_per_second": 1407.698,
"eval_steps_per_second": 5.601,
"step": 840
},
{
"epoch": 29.0,
"eval_accuracy": 0.0,
"eval_f1": 0.12139699381078692,
"eval_loss": 0.06896477937698364,
"eval_roc_auc": 0.5596648570991549,
"eval_runtime": 0.5385,
"eval_samples_per_second": 1400.089,
"eval_steps_per_second": 5.571,
"step": 870
},
{
"epoch": 30.0,
"eval_accuracy": 0.0,
"eval_f1": 0.1469496021220159,
"eval_loss": 0.06645014137029648,
"eval_roc_auc": 0.5718321574793831,
"eval_runtime": 0.539,
"eval_samples_per_second": 1398.905,
"eval_steps_per_second": 5.566,
"step": 900
},
{
"epoch": 31.0,
"eval_accuracy": 0.0,
"eval_f1": 0.16958443854995578,
"eval_loss": 0.06419382989406586,
"eval_roc_auc": 0.5836192297227291,
"eval_runtime": 0.5355,
"eval_samples_per_second": 1408.141,
"eval_steps_per_second": 5.603,
"step": 930
},
{
"epoch": 32.0,
"eval_accuracy": 0.04907161803713528,
"eval_f1": 0.27617152961980546,
"eval_loss": 0.06197493150830269,
"eval_roc_auc": 0.6243036403691168,
"eval_runtime": 0.5352,
"eval_samples_per_second": 1408.797,
"eval_steps_per_second": 5.605,
"step": 960
},
{
"epoch": 33.0,
"eval_accuracy": 0.050397877984084884,
"eval_f1": 0.29902740937223693,
"eval_loss": 0.05977466702461243,
"eval_roc_auc": 0.634559479934488,
"eval_runtime": 0.5415,
"eval_samples_per_second": 1392.528,
"eval_steps_per_second": 5.541,
"step": 990
},
{
"epoch": 33.33,
"learning_rate": 1.1153846153846154e-05,
"loss": 0.0856,
"step": 1000
},
{
"epoch": 34.0,
"eval_accuracy": 0.054376657824933686,
"eval_f1": 0.3352343059239611,
"eval_loss": 0.05773809924721718,
"eval_roc_auc": 0.6509299300813125,
"eval_runtime": 0.5369,
"eval_samples_per_second": 1404.423,
"eval_steps_per_second": 5.588,
"step": 1020
},
{
"epoch": 35.0,
"eval_accuracy": 0.05702917771883289,
"eval_f1": 0.34801692560313247,
"eval_loss": 0.055638011544942856,
"eval_roc_auc": 0.6596545369687085,
"eval_runtime": 0.5395,
"eval_samples_per_second": 1397.587,
"eval_steps_per_second": 5.561,
"step": 1050
},
{
"epoch": 36.0,
"eval_accuracy": 0.0636604774535809,
"eval_f1": 0.36848553745105467,
"eval_loss": 0.05378811061382294,
"eval_roc_auc": 0.6695404685276438,
"eval_runtime": 0.5346,
"eval_samples_per_second": 1410.402,
"eval_steps_per_second": 5.612,
"step": 1080
},
{
"epoch": 37.0,
"eval_accuracy": 0.06896551724137931,
"eval_f1": 0.4015094101300997,
"eval_loss": 0.051841311156749725,
"eval_roc_auc": 0.6885621955021968,
"eval_runtime": 0.5357,
"eval_samples_per_second": 1407.52,
"eval_steps_per_second": 5.6,
"step": 1110
},
{
"epoch": 38.0,
"eval_accuracy": 0.11273209549071618,
"eval_f1": 0.4456738663635216,
"eval_loss": 0.050086263567209244,
"eval_roc_auc": 0.711005975708689,
"eval_runtime": 0.5355,
"eval_samples_per_second": 1408.16,
"eval_steps_per_second": 5.603,
"step": 1140
},
{
"epoch": 39.0,
"eval_accuracy": 0.09946949602122016,
"eval_f1": 0.43961727927245164,
"eval_loss": 0.048313576728105545,
"eval_roc_auc": 0.7079538304831854,
"eval_runtime": 0.5342,
"eval_samples_per_second": 1411.344,
"eval_steps_per_second": 5.615,
"step": 1170
},
{
"epoch": 40.0,
"eval_accuracy": 0.16578249336870027,
"eval_f1": 0.4980042945560187,
"eval_loss": 0.04664042219519615,
"eval_roc_auc": 0.7330385673869595,
"eval_runtime": 0.5345,
"eval_samples_per_second": 1410.668,
"eval_steps_per_second": 5.613,
"step": 1200
},
{
"epoch": 41.0,
"eval_accuracy": 0.23342175066312998,
"eval_f1": 0.5616647720095996,
"eval_loss": 0.04504011198878288,
"eval_roc_auc": 0.7577533962842978,
"eval_runtime": 0.535,
"eval_samples_per_second": 1409.429,
"eval_steps_per_second": 5.608,
"step": 1230
},
{
"epoch": 42.0,
"eval_accuracy": 0.2572944297082228,
"eval_f1": 0.5754578754578755,
"eval_loss": 0.04347091540694237,
"eval_roc_auc": 0.7661184152957047,
"eval_runtime": 0.5319,
"eval_samples_per_second": 1417.63,
"eval_steps_per_second": 5.64,
"step": 1260
},
{
"epoch": 43.0,
"eval_accuracy": 0.3275862068965517,
"eval_f1": 0.6213022609574333,
"eval_loss": 0.04208529368042946,
"eval_roc_auc": 0.7866404145568933,
"eval_runtime": 0.5372,
"eval_samples_per_second": 1403.583,
"eval_steps_per_second": 5.585,
"step": 1290
},
{
"epoch": 44.0,
"eval_accuracy": 0.3687002652519894,
"eval_f1": 0.6514525704180877,
"eval_loss": 0.04067908599972725,
"eval_roc_auc": 0.7999587194782143,
"eval_runtime": 0.5388,
"eval_samples_per_second": 1399.494,
"eval_steps_per_second": 5.568,
"step": 1320
},
{
"epoch": 45.0,
"eval_accuracy": 0.43103448275862066,
"eval_f1": 0.6980042945560188,
"eval_loss": 0.03921309486031532,
"eval_roc_auc": 0.8174492137747922,
"eval_runtime": 0.534,
"eval_samples_per_second": 1411.985,
"eval_steps_per_second": 5.618,
"step": 1350
},
{
"epoch": 46.0,
"eval_accuracy": 0.4389920424403183,
"eval_f1": 0.7051218896046483,
"eval_loss": 0.038001034408807755,
"eval_roc_auc": 0.8197305825960849,
"eval_runtime": 0.5374,
"eval_samples_per_second": 1403.153,
"eval_steps_per_second": 5.583,
"step": 1380
},
{
"epoch": 47.0,
"eval_accuracy": 0.4708222811671088,
"eval_f1": 0.7296987495263356,
"eval_loss": 0.036776889115571976,
"eval_roc_auc": 0.831116786441656,
"eval_runtime": 0.5335,
"eval_samples_per_second": 1413.257,
"eval_steps_per_second": 5.623,
"step": 1410
},
{
"epoch": 48.0,
"eval_accuracy": 0.4920424403183024,
"eval_f1": 0.747950612605785,
"eval_loss": 0.03557248413562775,
"eval_roc_auc": 0.8375909848990984,
"eval_runtime": 0.5366,
"eval_samples_per_second": 1405.081,
"eval_steps_per_second": 5.591,
"step": 1440
},
{
"epoch": 49.0,
"eval_accuracy": 0.5212201591511937,
"eval_f1": 0.7606069218138183,
"eval_loss": 0.03450340777635574,
"eval_roc_auc": 0.845925043519166,
"eval_runtime": 0.5383,
"eval_samples_per_second": 1400.798,
"eval_steps_per_second": 5.573,
"step": 1470
},
{
"epoch": 50.0,
"learning_rate": 9.230769230769232e-06,
"loss": 0.0497,
"step": 1500
},
{
"epoch": 50.0,
"eval_accuracy": 0.5371352785145889,
"eval_f1": 0.7627226222053809,
"eval_loss": 0.03335259482264519,
"eval_roc_auc": 0.8508886495595266,
"eval_runtime": 0.532,
"eval_samples_per_second": 1417.332,
"eval_steps_per_second": 5.639,
"step": 1500
},
{
"epoch": 51.0,
"eval_accuracy": 0.5915119363395226,
"eval_f1": 0.8100701023114816,
"eval_loss": 0.032284460961818695,
"eval_roc_auc": 0.8672281393150117,
"eval_runtime": 0.5381,
"eval_samples_per_second": 1401.158,
"eval_steps_per_second": 5.575,
"step": 1530
},
{
"epoch": 52.0,
"eval_accuracy": 0.610079575596817,
"eval_f1": 0.8129247189592016,
"eval_loss": 0.03143255040049553,
"eval_roc_auc": 0.8744627940462186,
"eval_runtime": 0.5361,
"eval_samples_per_second": 1406.42,
"eval_steps_per_second": 5.596,
"step": 1560
},
{
"epoch": 53.0,
"eval_accuracy": 0.6538461538461539,
"eval_f1": 0.8507420740179361,
"eval_loss": 0.0304188784211874,
"eval_roc_auc": 0.8866197742960004,
"eval_runtime": 0.5356,
"eval_samples_per_second": 1407.838,
"eval_steps_per_second": 5.601,
"step": 1590
},
{
"epoch": 54.0,
"eval_accuracy": 0.6578249336870027,
"eval_f1": 0.8552703044082355,
"eval_loss": 0.029446031898260117,
"eval_roc_auc": 0.890052147658386,
"eval_runtime": 0.5353,
"eval_samples_per_second": 1408.566,
"eval_steps_per_second": 5.604,
"step": 1620
},
{
"epoch": 55.0,
"eval_accuracy": 0.6790450928381963,
"eval_f1": 0.8615195149677907,
"eval_loss": 0.028606314212083817,
"eval_roc_auc": 0.897625750004689,
"eval_runtime": 0.5341,
"eval_samples_per_second": 1411.668,
"eval_steps_per_second": 5.617,
"step": 1650
},
{
"epoch": 56.0,
"eval_accuracy": 0.6777188328912467,
"eval_f1": 0.864863584691171,
"eval_loss": 0.027681471779942513,
"eval_roc_auc": 0.8984171666697929,
"eval_runtime": 0.5356,
"eval_samples_per_second": 1407.868,
"eval_steps_per_second": 5.602,
"step": 1680
},
{
"epoch": 57.0,
"eval_accuracy": 0.6790450928381963,
"eval_f1": 0.8621510673234811,
"eval_loss": 0.026845382526516914,
"eval_roc_auc": 0.8969065742527106,
"eval_runtime": 0.5361,
"eval_samples_per_second": 1406.498,
"eval_steps_per_second": 5.596,
"step": 1710
},
{
"epoch": 58.0,
"eval_accuracy": 0.7015915119363395,
"eval_f1": 0.8810281672350637,
"eval_loss": 0.026072582229971886,
"eval_roc_auc": 0.9060217294074353,
"eval_runtime": 0.5353,
"eval_samples_per_second": 1408.671,
"eval_steps_per_second": 5.605,
"step": 1740
},
{
"epoch": 59.0,
"eval_accuracy": 0.7188328912466844,
"eval_f1": 0.8876594669698118,
"eval_loss": 0.025316763669252396,
"eval_roc_auc": 0.9106051073109138,
"eval_runtime": 0.5362,
"eval_samples_per_second": 1406.26,
"eval_steps_per_second": 5.595,
"step": 1770
},
{
"epoch": 60.0,
"eval_accuracy": 0.7201591511936339,
"eval_f1": 0.8895888594164456,
"eval_loss": 0.024538854137063026,
"eval_roc_auc": 0.9124959278648781,
"eval_runtime": 0.5368,
"eval_samples_per_second": 1404.713,
"eval_steps_per_second": 5.589,
"step": 1800
},
{
"epoch": 61.0,
"eval_accuracy": 0.7374005305039788,
"eval_f1": 0.8951402046229632,
"eval_loss": 0.023838359862565994,
"eval_roc_auc": 0.9174492137747923,
"eval_runtime": 0.5444,
"eval_samples_per_second": 1385.12,
"eval_steps_per_second": 5.511,
"step": 1830
},
{
"epoch": 62.0,
"eval_accuracy": 0.746684350132626,
"eval_f1": 0.901335733232285,
"eval_loss": 0.023148847743868828,
"eval_roc_auc": 0.9235019035735669,
"eval_runtime": 0.535,
"eval_samples_per_second": 1409.257,
"eval_steps_per_second": 5.607,
"step": 1860
},
{
"epoch": 63.0,
"eval_accuracy": 0.76657824933687,
"eval_f1": 0.9092175066312996,
"eval_loss": 0.02254069782793522,
"eval_roc_auc": 0.9292259658876918,
"eval_runtime": 0.5372,
"eval_samples_per_second": 1403.696,
"eval_steps_per_second": 5.585,
"step": 1890
},
{
"epoch": 64.0,
"eval_accuracy": 0.7718832891246684,
"eval_f1": 0.9126215738284704,
"eval_loss": 0.021912721917033195,
"eval_roc_auc": 0.929986422161456,
"eval_runtime": 0.5359,
"eval_samples_per_second": 1406.883,
"eval_steps_per_second": 5.598,
"step": 1920
},
{
"epoch": 65.0,
"eval_accuracy": 0.7904509283819628,
"eval_f1": 0.9302608311229001,
"eval_loss": 0.02143138088285923,
"eval_roc_auc": 0.9372107567622165,
"eval_runtime": 0.5363,
"eval_samples_per_second": 1406.027,
"eval_steps_per_second": 5.594,
"step": 1950
},
{
"epoch": 66.0,
"eval_accuracy": 0.7917771883289124,
"eval_f1": 0.9300839964633068,
"eval_loss": 0.020785199478268623,
"eval_roc_auc": 0.9364606206188987,
"eval_runtime": 0.5391,
"eval_samples_per_second": 1398.555,
"eval_steps_per_second": 5.565,
"step": 1980
},
{
"epoch": 66.67,
"learning_rate": 7.307692307692308e-06,
"loss": 0.0301,
"step": 2000
},
{
"epoch": 67.0,
"eval_accuracy": 0.8010610079575596,
"eval_f1": 0.9349911582670204,
"eval_loss": 0.020172661170363426,
"eval_roc_auc": 0.9398929939812842,
"eval_runtime": 0.5431,
"eval_samples_per_second": 1388.32,
"eval_steps_per_second": 5.524,
"step": 2010
},
{
"epoch": 68.0,
"eval_accuracy": 0.8050397877984085,
"eval_f1": 0.9368479221927499,
"eval_loss": 0.019651979207992554,
"eval_roc_auc": 0.9410233582614841,
"eval_runtime": 0.5372,
"eval_samples_per_second": 1403.636,
"eval_steps_per_second": 5.585,
"step": 2040
},
{
"epoch": 69.0,
"eval_accuracy": 0.8209549071618037,
"eval_f1": 0.9433339648856889,
"eval_loss": 0.019185032695531845,
"eval_roc_auc": 0.9467371004451625,
"eval_runtime": 0.5361,
"eval_samples_per_second": 1406.542,
"eval_steps_per_second": 5.596,
"step": 2070
},
{
"epoch": 70.0,
"eval_accuracy": 0.8262599469496021,
"eval_f1": 0.9441013009978527,
"eval_loss": 0.01870913803577423,
"eval_roc_auc": 0.9482476928622445,
"eval_runtime": 0.5467,
"eval_samples_per_second": 1379.282,
"eval_steps_per_second": 5.488,
"step": 2100
},
{
"epoch": 71.0,
"eval_accuracy": 0.8236074270557029,
"eval_f1": 0.9441234053303018,
"eval_loss": 0.018251696601510048,
"eval_roc_auc": 0.9474975567189267,
"eval_runtime": 0.539,
"eval_samples_per_second": 1398.772,
"eval_steps_per_second": 5.565,
"step": 2130
},
{
"epoch": 72.0,
"eval_accuracy": 0.8289124668435013,
"eval_f1": 0.9458349122142224,
"eval_loss": 0.01777571812272072,
"eval_roc_auc": 0.9494090175337839,
"eval_runtime": 0.5368,
"eval_samples_per_second": 1404.669,
"eval_steps_per_second": 5.589,
"step": 2160
},
{
"epoch": 73.0,
"eval_accuracy": 0.8368700265251989,
"eval_f1": 0.9490179360869017,
"eval_loss": 0.017392940819263458,
"eval_roc_auc": 0.9520706144919588,
"eval_runtime": 0.5345,
"eval_samples_per_second": 1410.719,
"eval_steps_per_second": 5.613,
"step": 2190
},
{
"epoch": 74.0,
"eval_accuracy": 0.8395225464190982,
"eval_f1": 0.9497252747252748,
"eval_loss": 0.01703151874244213,
"eval_roc_auc": 0.9528310707657232,
"eval_runtime": 0.5352,
"eval_samples_per_second": 1408.875,
"eval_steps_per_second": 5.606,
"step": 2220
},
{
"epoch": 75.0,
"eval_accuracy": 0.8448275862068966,
"eval_f1": 0.9510957433371227,
"eval_loss": 0.016582759097218513,
"eval_roc_auc": 0.9543416631828051,
"eval_runtime": 0.5383,
"eval_samples_per_second": 1400.764,
"eval_steps_per_second": 5.573,
"step": 2250
},
{
"epoch": 76.0,
"eval_accuracy": 0.8488063660477454,
"eval_f1": 0.9522135910066944,
"eval_loss": 0.016240444034337997,
"eval_roc_auc": 0.9551124395870159,
"eval_runtime": 0.5333,
"eval_samples_per_second": 1413.847,
"eval_steps_per_second": 5.625,
"step": 2280
},
{
"epoch": 77.0,
"eval_accuracy": 0.850132625994695,
"eval_f1": 0.9526872552734622,
"eval_loss": 0.015849757939577103,
"eval_roc_auc": 0.9558625757303335,
"eval_runtime": 0.537,
"eval_samples_per_second": 1404.008,
"eval_steps_per_second": 5.586,
"step": 2310
},
{
"epoch": 78.0,
"eval_accuracy": 0.8488063660477454,
"eval_f1": 0.9518157130226096,
"eval_loss": 0.015539790503680706,
"eval_roc_auc": 0.9547322114501339,
"eval_runtime": 0.5388,
"eval_samples_per_second": 1399.303,
"eval_steps_per_second": 5.568,
"step": 2340
},
{
"epoch": 79.0,
"eval_accuracy": 0.8567639257294429,
"eval_f1": 0.9545882278640899,
"eval_loss": 0.015179312787950039,
"eval_roc_auc": 0.9577740365451908,
"eval_runtime": 0.5402,
"eval_samples_per_second": 1395.903,
"eval_steps_per_second": 5.554,
"step": 2370
},
{
"epoch": 80.0,
"eval_accuracy": 0.8594164456233422,
"eval_f1": 0.9569439181508146,
"eval_loss": 0.014874554239213467,
"eval_roc_auc": 0.9577740365451908,
"eval_runtime": 0.5414,
"eval_samples_per_second": 1392.664,
"eval_steps_per_second": 5.541,
"step": 2400
},
{
"epoch": 81.0,
"eval_accuracy": 0.8620689655172413,
"eval_f1": 0.958023872679045,
"eval_loss": 0.014504685997962952,
"eval_roc_auc": 0.9596751772296016,
"eval_runtime": 0.5336,
"eval_samples_per_second": 1412.916,
"eval_steps_per_second": 5.622,
"step": 2430
},
{
"epoch": 82.0,
"eval_accuracy": 0.870026525198939,
"eval_f1": 0.9595395983327017,
"eval_loss": 0.014218125492334366,
"eval_roc_auc": 0.9611960897771299,
"eval_runtime": 0.5371,
"eval_samples_per_second": 1403.78,
"eval_steps_per_second": 5.585,
"step": 2460
},
{
"epoch": 83.0,
"eval_accuracy": 0.8660477453580901,
"eval_f1": 0.9604111405835545,
"eval_loss": 0.013919519260525703,
"eval_roc_auc": 0.9608261817706942,
"eval_runtime": 0.5354,
"eval_samples_per_second": 1408.195,
"eval_steps_per_second": 5.603,
"step": 2490
},
{
"epoch": 83.33,
"learning_rate": 5.384615384615385e-06,
"loss": 0.02,
"step": 2500
},
{
"epoch": 84.0,
"eval_accuracy": 0.8779840848806366,
"eval_f1": 0.9646235947960087,
"eval_loss": 0.013672588393092155,
"eval_roc_auc": 0.9638473666048583,
"eval_runtime": 0.5354,
"eval_samples_per_second": 1408.217,
"eval_steps_per_second": 5.603,
"step": 2520
},
{
"epoch": 85.0,
"eval_accuracy": 0.8872679045092838,
"eval_f1": 0.9690760389036251,
"eval_loss": 0.013412056490778923,
"eval_roc_auc": 0.9668995118303618,
"eval_runtime": 0.5376,
"eval_samples_per_second": 1402.415,
"eval_steps_per_second": 5.58,
"step": 2550
},
{
"epoch": 86.0,
"eval_accuracy": 0.8952254641909815,
"eval_f1": 0.9720317039282557,
"eval_loss": 0.01312048826366663,
"eval_roc_auc": 0.9692015209125475,
"eval_runtime": 0.5348,
"eval_samples_per_second": 1409.848,
"eval_steps_per_second": 5.609,
"step": 2580
},
{
"epoch": 87.0,
"eval_accuracy": 0.9005305039787799,
"eval_f1": 0.9731937602627256,
"eval_loss": 0.012925405986607075,
"eval_roc_auc": 0.9703422053231939,
"eval_runtime": 0.5427,
"eval_samples_per_second": 1389.4,
"eval_steps_per_second": 5.528,
"step": 2610
},
{
"epoch": 88.0,
"eval_accuracy": 0.9018567639257294,
"eval_f1": 0.9739389920424402,
"eval_loss": 0.012665793299674988,
"eval_roc_auc": 0.9710820213360654,
"eval_runtime": 0.5379,
"eval_samples_per_second": 1401.691,
"eval_steps_per_second": 5.577,
"step": 2640
},
{
"epoch": 89.0,
"eval_accuracy": 0.9058355437665783,
"eval_f1": 0.9751389415182519,
"eval_loss": 0.012404780834913254,
"eval_roc_auc": 0.9718631178707224,
"eval_runtime": 0.5366,
"eval_samples_per_second": 1405.048,
"eval_steps_per_second": 5.59,
"step": 2670
},
{
"epoch": 90.0,
"eval_accuracy": 0.9098143236074271,
"eval_f1": 0.976364153088291,
"eval_loss": 0.012243787758052349,
"eval_roc_auc": 0.973384030418251,
"eval_runtime": 0.543,
"eval_samples_per_second": 1388.515,
"eval_steps_per_second": 5.525,
"step": 2700
},
{
"epoch": 91.0,
"eval_accuracy": 0.9137931034482759,
"eval_f1": 0.9770841227737779,
"eval_loss": 0.01201709359884262,
"eval_roc_auc": 0.9741341665615688,
"eval_runtime": 0.5346,
"eval_samples_per_second": 1410.515,
"eval_steps_per_second": 5.612,
"step": 2730
},
{
"epoch": 92.0,
"eval_accuracy": 0.9137931034482759,
"eval_f1": 0.9769072881141846,
"eval_loss": 0.01179158128798008,
"eval_roc_auc": 0.9741444866920153,
"eval_runtime": 0.5367,
"eval_samples_per_second": 1404.786,
"eval_steps_per_second": 5.589,
"step": 2760
},
{
"epoch": 93.0,
"eval_accuracy": 0.9177718832891246,
"eval_f1": 0.9778798787419477,
"eval_loss": 0.011644715443253517,
"eval_roc_auc": 0.9752748509722151,
"eval_runtime": 0.536,
"eval_samples_per_second": 1406.587,
"eval_steps_per_second": 5.597,
"step": 2790
},
{
"epoch": 94.0,
"eval_accuracy": 0.9230769230769231,
"eval_f1": 0.9799008462801566,
"eval_loss": 0.01145511120557785,
"eval_roc_auc": 0.9771863117870723,
"eval_runtime": 0.5368,
"eval_samples_per_second": 1404.597,
"eval_steps_per_second": 5.589,
"step": 2820
},
{
"epoch": 95.0,
"eval_accuracy": 0.9244031830238727,
"eval_f1": 0.9801660982695466,
"eval_loss": 0.011244919151067734,
"eval_roc_auc": 0.9775665399239544,
"eval_runtime": 0.5394,
"eval_samples_per_second": 1397.779,
"eval_steps_per_second": 5.561,
"step": 2850
},
{
"epoch": 96.0,
"eval_accuracy": 0.9297082228116711,
"eval_f1": 0.9811513199444234,
"eval_loss": 0.011063193902373314,
"eval_roc_auc": 0.9787072243346008,
"eval_runtime": 0.5395,
"eval_samples_per_second": 1397.471,
"eval_steps_per_second": 5.56,
"step": 2880
},
{
"epoch": 97.0,
"eval_accuracy": 0.9283819628647215,
"eval_f1": 0.9817702412529998,
"eval_loss": 0.010917922481894493,
"eval_roc_auc": 0.9783269961977186,
"eval_runtime": 0.5395,
"eval_samples_per_second": 1397.593,
"eval_steps_per_second": 5.561,
"step": 2910
},
{
"epoch": 98.0,
"eval_accuracy": 0.9416445623342176,
"eval_f1": 0.9853069344448655,
"eval_loss": 0.010806653648614883,
"eval_roc_auc": 0.98212927756654,
"eval_runtime": 0.536,
"eval_samples_per_second": 1406.725,
"eval_steps_per_second": 5.597,
"step": 2940
},
{
"epoch": 99.0,
"eval_accuracy": 0.9416445623342176,
"eval_f1": 0.9853069344448655,
"eval_loss": 0.01062620710581541,
"eval_roc_auc": 0.98212927756654,
"eval_runtime": 0.5407,
"eval_samples_per_second": 1394.567,
"eval_steps_per_second": 5.549,
"step": 2970
},
{
"epoch": 100.0,
"learning_rate": 3.4615384615384617e-06,
"loss": 0.0146,
"step": 3000
},
{
"epoch": 100.0,
"eval_accuracy": 0.9429708222811671,
"eval_f1": 0.9855721864342555,
"eval_loss": 0.01047496683895588,
"eval_roc_auc": 0.9825095057034221,
"eval_runtime": 0.5382,
"eval_samples_per_second": 1400.898,
"eval_steps_per_second": 5.574,
"step": 3000
},
{
"epoch": 101.0,
"eval_accuracy": 0.9416445623342176,
"eval_f1": 0.9853069344448655,
"eval_loss": 0.01036164816468954,
"eval_roc_auc": 0.98212927756654,
"eval_runtime": 0.5375,
"eval_samples_per_second": 1402.764,
"eval_steps_per_second": 5.581,
"step": 3030
},
{
"epoch": 102.0,
"eval_accuracy": 0.9442970822281167,
"eval_f1": 0.986115321460149,
"eval_loss": 0.010181589052081108,
"eval_roc_auc": 0.9828897338403042,
"eval_runtime": 0.5383,
"eval_samples_per_second": 1400.644,
"eval_steps_per_second": 5.573,
"step": 3060
},
{
"epoch": 103.0,
"eval_accuracy": 0.9496021220159151,
"eval_f1": 0.9876057850195782,
"eval_loss": 0.010093181394040585,
"eval_roc_auc": 0.9847908745247148,
"eval_runtime": 0.5337,
"eval_samples_per_second": 1412.756,
"eval_steps_per_second": 5.621,
"step": 3090
},
{
"epoch": 104.0,
"eval_accuracy": 0.9482758620689655,
"eval_f1": 0.9873405330301882,
"eval_loss": 0.009936739690601826,
"eval_roc_auc": 0.9840304182509505,
"eval_runtime": 0.5345,
"eval_samples_per_second": 1410.682,
"eval_steps_per_second": 5.613,
"step": 3120
},
{
"epoch": 105.0,
"eval_accuracy": 0.9496021220159151,
"eval_f1": 0.9875299987368952,
"eval_loss": 0.009850489906966686,
"eval_roc_auc": 0.9844106463878327,
"eval_runtime": 0.5364,
"eval_samples_per_second": 1405.623,
"eval_steps_per_second": 5.593,
"step": 3150
},
{
"epoch": 106.0,
"eval_accuracy": 0.9522546419098143,
"eval_f1": 0.9887425792598207,
"eval_loss": 0.009748827666044235,
"eval_roc_auc": 0.9855513307984791,
"eval_runtime": 0.5365,
"eval_samples_per_second": 1405.409,
"eval_steps_per_second": 5.592,
"step": 3180
},
{
"epoch": 107.0,
"eval_accuracy": 0.9549071618037135,
"eval_f1": 0.9896267525577871,
"eval_loss": 0.009625904262065887,
"eval_roc_auc": 0.9863117870722433,
"eval_runtime": 0.5349,
"eval_samples_per_second": 1409.481,
"eval_steps_per_second": 5.608,
"step": 3210
},
{
"epoch": 108.0,
"eval_accuracy": 0.9588859416445623,
"eval_f1": 0.9907761778451434,
"eval_loss": 0.009538683108985424,
"eval_roc_auc": 0.9874524714828897,
"eval_runtime": 0.5345,
"eval_samples_per_second": 1410.756,
"eval_steps_per_second": 5.613,
"step": 3240
},
{
"epoch": 109.0,
"eval_accuracy": 0.9602122015915119,
"eval_f1": 0.9911424782114437,
"eval_loss": 0.009465099312365055,
"eval_roc_auc": 0.9878326996197719,
"eval_runtime": 0.5389,
"eval_samples_per_second": 1399.088,
"eval_steps_per_second": 5.567,
"step": 3270
},
{
"epoch": 110.0,
"eval_accuracy": 0.9615384615384616,
"eval_f1": 0.9916603511431098,
"eval_loss": 0.00935909990221262,
"eval_roc_auc": 0.988212927756654,
"eval_runtime": 0.6487,
"eval_samples_per_second": 1162.329,
"eval_steps_per_second": 4.625,
"step": 3300
},
{
"epoch": 111.0,
"eval_accuracy": 0.9588859416445623,
"eval_f1": 0.9908772262220539,
"eval_loss": 0.009284152649343014,
"eval_roc_auc": 0.9874524714828897,
"eval_runtime": 0.5333,
"eval_samples_per_second": 1413.782,
"eval_steps_per_second": 5.625,
"step": 3330
},
{
"epoch": 112.0,
"eval_accuracy": 0.9641909814323607,
"eval_f1": 0.9924687381583933,
"eval_loss": 0.009203045628964901,
"eval_roc_auc": 0.9889733840304182,
"eval_runtime": 0.5399,
"eval_samples_per_second": 1396.478,
"eval_steps_per_second": 5.556,
"step": 3360
},
{
"epoch": 113.0,
"eval_accuracy": 0.9641909814323607,
"eval_f1": 0.9922919034988,
"eval_loss": 0.00910850428044796,
"eval_roc_auc": 0.9889733840304182,
"eval_runtime": 0.5354,
"eval_samples_per_second": 1408.277,
"eval_steps_per_second": 5.603,
"step": 3390
},
{
"epoch": 114.0,
"eval_accuracy": 0.9694960212201591,
"eval_f1": 0.9941360363774157,
"eval_loss": 0.009037572890520096,
"eval_roc_auc": 0.990874524714829,
"eval_runtime": 0.5375,
"eval_samples_per_second": 1402.803,
"eval_steps_per_second": 5.581,
"step": 3420
},
{
"epoch": 115.0,
"eval_accuracy": 0.9694960212201591,
"eval_f1": 0.9941360363774157,
"eval_loss": 0.008973510935902596,
"eval_roc_auc": 0.990874524714829,
"eval_runtime": 0.5354,
"eval_samples_per_second": 1408.234,
"eval_steps_per_second": 5.603,
"step": 3450
},
{
"epoch": 116.0,
"eval_accuracy": 0.9694960212201591,
"eval_f1": 0.9941360363774157,
"eval_loss": 0.008894499391317368,
"eval_roc_auc": 0.990874524714829,
"eval_runtime": 0.539,
"eval_samples_per_second": 1398.882,
"eval_steps_per_second": 5.566,
"step": 3480
},
{
"epoch": 116.67,
"learning_rate": 1.5384615384615385e-06,
"loss": 0.0119,
"step": 3500
},
{
"epoch": 117.0,
"eval_accuracy": 0.9734748010610079,
"eval_f1": 0.9952854616647722,
"eval_loss": 0.008851761929690838,
"eval_roc_auc": 0.9920152091254753,
"eval_runtime": 0.5399,
"eval_samples_per_second": 1396.547,
"eval_steps_per_second": 5.557,
"step": 3510
},
{
"epoch": 118.0,
"eval_accuracy": 0.9734748010610079,
"eval_f1": 0.995285461664772,
"eval_loss": 0.008802603930234909,
"eval_roc_auc": 0.9920152091254753,
"eval_runtime": 0.5378,
"eval_samples_per_second": 1402.054,
"eval_steps_per_second": 5.578,
"step": 3540
},
{
"epoch": 119.0,
"eval_accuracy": 0.9721485411140584,
"eval_f1": 0.9950202096753822,
"eval_loss": 0.008759119547903538,
"eval_roc_auc": 0.9916349809885932,
"eval_runtime": 0.5394,
"eval_samples_per_second": 1397.954,
"eval_steps_per_second": 5.562,
"step": 3570
},
{
"epoch": 120.0,
"eval_accuracy": 0.9734748010610079,
"eval_f1": 0.995032840722496,
"eval_loss": 0.008710918948054314,
"eval_roc_auc": 0.9916349809885932,
"eval_runtime": 0.5374,
"eval_samples_per_second": 1403.078,
"eval_steps_per_second": 5.583,
"step": 3600
},
{
"epoch": 121.0,
"eval_accuracy": 0.9734748010610079,
"eval_f1": 0.995032840722496,
"eval_loss": 0.008674073964357376,
"eval_roc_auc": 0.9916349809885932,
"eval_runtime": 0.5361,
"eval_samples_per_second": 1406.392,
"eval_steps_per_second": 5.596,
"step": 3630
},
{
"epoch": 122.0,
"eval_accuracy": 0.9734748010610079,
"eval_f1": 0.995032840722496,
"eval_loss": 0.008630850352346897,
"eval_roc_auc": 0.9916349809885932,
"eval_runtime": 0.5409,
"eval_samples_per_second": 1394.062,
"eval_steps_per_second": 5.547,
"step": 3660
},
{
"epoch": 123.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9954749273714792,
"eval_loss": 0.008607584983110428,
"eval_roc_auc": 0.9920152091254753,
"eval_runtime": 0.5356,
"eval_samples_per_second": 1407.661,
"eval_steps_per_second": 5.601,
"step": 3690
},
{
"epoch": 124.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9957275483137553,
"eval_loss": 0.008562309667468071,
"eval_roc_auc": 0.9923954372623573,
"eval_runtime": 0.5367,
"eval_samples_per_second": 1404.922,
"eval_steps_per_second": 5.59,
"step": 3720
},
{
"epoch": 125.0,
"eval_accuracy": 0.9734748010610079,
"eval_f1": 0.995285461664772,
"eval_loss": 0.0085311783477664,
"eval_roc_auc": 0.9920152091254753,
"eval_runtime": 0.5369,
"eval_samples_per_second": 1404.35,
"eval_steps_per_second": 5.588,
"step": 3750
},
{
"epoch": 126.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9957275483137553,
"eval_loss": 0.008514598943293095,
"eval_roc_auc": 0.9923954372623573,
"eval_runtime": 0.5404,
"eval_samples_per_second": 1395.332,
"eval_steps_per_second": 5.552,
"step": 3780
},
{
"epoch": 127.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9957275483137553,
"eval_loss": 0.008509295992553234,
"eval_roc_auc": 0.9923954372623573,
"eval_runtime": 0.5378,
"eval_samples_per_second": 1401.996,
"eval_steps_per_second": 5.578,
"step": 3810
},
{
"epoch": 128.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9957275483137553,
"eval_loss": 0.00849186722189188,
"eval_roc_auc": 0.9923954372623573,
"eval_runtime": 0.5355,
"eval_samples_per_second": 1407.909,
"eval_steps_per_second": 5.602,
"step": 3840
},
{
"epoch": 129.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9957275483137553,
"eval_loss": 0.008484904654324055,
"eval_roc_auc": 0.9923954372623573,
"eval_runtime": 0.5382,
"eval_samples_per_second": 1401.071,
"eval_steps_per_second": 5.575,
"step": 3870
},
{
"epoch": 130.0,
"eval_accuracy": 0.9748010610079576,
"eval_f1": 0.9957275483137553,
"eval_loss": 0.008481933735311031,
"eval_roc_auc": 0.9923954372623573,
"eval_runtime": 0.5421,
"eval_samples_per_second": 1390.942,
"eval_steps_per_second": 5.534,
"step": 3900
}
],
"max_steps": 3900,
"num_train_epochs": 130,
"total_flos": 8883063635970888.0,
"trial_name": null,
"trial_params": null
}