{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.7842232729788952, "eval_steps": 5, "global_step": 8500, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "eval_GEN Loss": 1.2385475635528564, "eval_GEN top-5 accuracy": 0.9149495835160018, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM Loss": 0.6931641101837158, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 1.8721153736114502, "eval_runtime": 55.5872, "eval_samples_per_second": 1.169, "eval_steps_per_second": 0.09, "step": 0 }, { "epoch": 9.226156152692884e-05, "grad_norm": 3.1269080771685585, "learning_rate": 3.109452736318408e-09, "loss": 1.6746, "step": 1 }, { "epoch": 0.00018452312305385768, "grad_norm": 3.5449940973885044, "learning_rate": 6.218905472636816e-09, "loss": 1.8898, "step": 2 }, { "epoch": 0.0002767846845807865, "grad_norm": 3.4603091206773233, "learning_rate": 9.328358208955224e-09, "loss": 1.5738, "step": 3 }, { "epoch": 0.00036904624610771536, "grad_norm": 4.577609127214851, "learning_rate": 1.2437810945273633e-08, "loss": 1.93, "step": 4 }, { "epoch": 0.0004613078076346442, "grad_norm": 3.117899016828671, "learning_rate": 1.554726368159204e-08, "loss": 1.8182, "step": 5 }, { "epoch": 0.0004613078076346442, "eval_GEN Loss": 1.2392983436584473, "eval_GEN top-5 accuracy": 0.9149495835160018, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM Loss": 0.6931981444358826, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 1.873557686805725, "eval_runtime": 55.9315, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5 }, { "epoch": 0.000553569369161573, "grad_norm": 5.835077403604924, "learning_rate": 1.8656716417910447e-08, "loss": 1.8551, "step": 6 }, { "epoch": 0.0006458309306885019, "grad_norm": 4.210580345606465, "learning_rate": 2.176616915422886e-08, "loss": 1.728, "step": 7 }, { "epoch": 0.0007380924922154307, "grad_norm": 3.9832144368906084, "learning_rate": 2.4875621890547265e-08, "loss": 1.7872, "step": 8 }, { "epoch": 0.0008303540537423596, "grad_norm": 4.290185811653636, "learning_rate": 2.798507462686567e-08, "loss": 1.9864, "step": 9 }, { "epoch": 0.0009226156152692884, "grad_norm": 4.043726650440571, "learning_rate": 3.109452736318408e-08, "loss": 1.8669, "step": 10 }, { "epoch": 0.0009226156152692884, "eval_GEN Loss": 1.2399370670318604, "eval_GEN top-5 accuracy": 0.9140727750986409, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM Loss": 0.6931888461112976, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 1.8730769157409668, "eval_runtime": 55.8813, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 10 }, { "epoch": 0.0010148771767962172, "grad_norm": 4.406640040740555, "learning_rate": 3.420398009950249e-08, "loss": 1.9705, "step": 11 }, { "epoch": 0.001107138738323146, "grad_norm": 3.001575732066938, "learning_rate": 3.7313432835820895e-08, "loss": 2.0106, "step": 12 }, { "epoch": 0.0011994002998500749, "grad_norm": 5.2380060824960655, "learning_rate": 4.042288557213931e-08, "loss": 1.9344, "step": 13 }, { "epoch": 0.0012916618613770037, "grad_norm": 4.727236576460403, "learning_rate": 4.353233830845772e-08, "loss": 1.8549, "step": 14 }, { "epoch": 0.0013839234229039326, "grad_norm": 3.570054790174049, "learning_rate": 4.664179104477612e-08, "loss": 1.7543, "step": 15 }, { "epoch": 0.0013839234229039326, "eval_GEN Loss": 1.2388570308685303, "eval_GEN top-5 accuracy": 0.9149495835160018, "eval_PRM Accuracy": 0.22641509433962265, "eval_PRM F1": 0.023809523809523808, "eval_PRM F1 AUC": 0.5060240963855421, "eval_PRM F1 Neg": 0.359375, "eval_PRM Loss": 0.6931596994400024, "eval_PRM NPV": 0.21904761904761905, "eval_PRM Precision": 1.0, "eval_PRM Recall": 0.012048192771084338, "eval_PRM Specificty": 1.0, "eval_loss": 1.8725961446762085, "eval_runtime": 56.0124, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 15 }, { "epoch": 0.0014761849844308614, "grad_norm": 4.270529049520865, "learning_rate": 4.975124378109453e-08, "loss": 2.2358, "step": 16 }, { "epoch": 0.0015684465459577903, "grad_norm": 2.6485702290657556, "learning_rate": 5.286069651741294e-08, "loss": 2.0089, "step": 17 }, { "epoch": 0.0016607081074847191, "grad_norm": 5.330399703975629, "learning_rate": 5.597014925373134e-08, "loss": 1.7244, "step": 18 }, { "epoch": 0.001752969669011648, "grad_norm": 4.505723463929839, "learning_rate": 5.9079601990049754e-08, "loss": 1.9108, "step": 19 }, { "epoch": 0.0018452312305385769, "grad_norm": 3.5337375234196995, "learning_rate": 6.218905472636817e-08, "loss": 1.7413, "step": 20 }, { "epoch": 0.0018452312305385769, "eval_GEN Loss": 1.2375545501708984, "eval_GEN top-5 accuracy": 0.9145111793073214, "eval_PRM Accuracy": 0.25471698113207547, "eval_PRM F1": 0.09195402298850575, "eval_PRM F1 AUC": 0.5240963855421686, "eval_PRM F1 Neg": 0.368, "eval_PRM Loss": 0.693073034286499, "eval_PRM NPV": 0.22549019607843138, "eval_PRM Precision": 1.0, "eval_PRM Recall": 0.04819277108433735, "eval_PRM Specificty": 1.0, "eval_loss": 1.8711538314819336, "eval_runtime": 55.6906, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 20 }, { "epoch": 0.0019374927920655057, "grad_norm": 4.773455261650772, "learning_rate": 6.529850746268657e-08, "loss": 1.5142, "step": 21 }, { "epoch": 0.0020297543535924343, "grad_norm": 4.704180183206908, "learning_rate": 6.840796019900498e-08, "loss": 1.9425, "step": 22 }, { "epoch": 0.002122015915119363, "grad_norm": 5.212381712859903, "learning_rate": 7.151741293532339e-08, "loss": 1.7149, "step": 23 }, { "epoch": 0.002214277476646292, "grad_norm": 4.804344322732823, "learning_rate": 7.462686567164179e-08, "loss": 1.7484, "step": 24 }, { "epoch": 0.002306539038173221, "grad_norm": 3.4852690113725977, "learning_rate": 7.77363184079602e-08, "loss": 2.1117, "step": 25 }, { "epoch": 0.002306539038173221, "eval_GEN Loss": 1.2359493970870972, "eval_GEN top-5 accuracy": 0.9149495835160018, "eval_PRM Accuracy": 0.3113207547169811, "eval_PRM F1": 0.23157894736842105, "eval_PRM F1 AUC": 0.5445259298061813, "eval_PRM F1 Neg": 0.37606837606837606, "eval_PRM Loss": 0.6930320262908936, "eval_PRM NPV": 0.23404255319148937, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.13253012048192772, "eval_PRM Specificty": 0.9565217391304348, "eval_loss": 1.871634602546692, "eval_runtime": 56.0441, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 25 }, { "epoch": 0.0023988005997001498, "grad_norm": 5.621336774755585, "learning_rate": 8.084577114427861e-08, "loss": 2.0755, "step": 26 }, { "epoch": 0.0024910621612270786, "grad_norm": 5.278482792916371, "learning_rate": 8.395522388059703e-08, "loss": 1.853, "step": 27 }, { "epoch": 0.0025833237227540075, "grad_norm": 3.429298179970435, "learning_rate": 8.706467661691544e-08, "loss": 1.8945, "step": 28 }, { "epoch": 0.0026755852842809363, "grad_norm": 3.7644884791494992, "learning_rate": 9.017412935323384e-08, "loss": 1.9576, "step": 29 }, { "epoch": 0.002767846845807865, "grad_norm": 4.516102493942929, "learning_rate": 9.328358208955224e-08, "loss": 2.0927, "step": 30 }, { "epoch": 0.002767846845807865, "eval_GEN Loss": 1.228596806526184, "eval_GEN top-5 accuracy": 0.9140727750986409, "eval_PRM Accuracy": 0.42452830188679247, "eval_PRM F1": 0.48739495798319327, "eval_PRM F1 AUC": 0.5225248821372446, "eval_PRM F1 Neg": 0.34408602150537637, "eval_PRM Loss": 0.6929349303245544, "eval_PRM NPV": 0.22857142857142856, "eval_PRM Precision": 0.8055555555555556, "eval_PRM Recall": 0.3493975903614458, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 1.8620191812515259, "eval_runtime": 55.8959, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 30 }, { "epoch": 0.002860108407334794, "grad_norm": 2.5973567522779573, "learning_rate": 9.639303482587065e-08, "loss": 1.9186, "step": 31 }, { "epoch": 0.002952369968861723, "grad_norm": 3.964938026808683, "learning_rate": 9.950248756218906e-08, "loss": 1.9025, "step": 32 }, { "epoch": 0.0030446315303886517, "grad_norm": 4.359962855655254, "learning_rate": 1.0261194029850747e-07, "loss": 1.6659, "step": 33 }, { "epoch": 0.0031368930919155806, "grad_norm": 4.6732889936639985, "learning_rate": 1.0572139303482589e-07, "loss": 1.6562, "step": 34 }, { "epoch": 0.0032291546534425094, "grad_norm": 4.754796330549508, "learning_rate": 1.088308457711443e-07, "loss": 1.7985, "step": 35 }, { "epoch": 0.0032291546534425094, "eval_GEN Loss": 1.2255665063858032, "eval_GEN top-5 accuracy": 0.9145111793073214, "eval_PRM Accuracy": 0.4811320754716981, "eval_PRM F1": 0.5736434108527132, "eval_PRM F1 AUC": 0.5272393923520168, "eval_PRM F1 Neg": 0.3373493975903614, "eval_PRM Loss": 0.692743718624115, "eval_PRM NPV": 0.23333333333333334, "eval_PRM Precision": 0.8043478260869565, "eval_PRM Recall": 0.4457831325301205, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 1.8596153259277344, "eval_runtime": 56.8707, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 35 }, { "epoch": 0.0033214162149694383, "grad_norm": 4.724528772133822, "learning_rate": 1.1194029850746268e-07, "loss": 2.1671, "step": 36 }, { "epoch": 0.003413677776496367, "grad_norm": 3.9150096808620876, "learning_rate": 1.150497512437811e-07, "loss": 1.6174, "step": 37 }, { "epoch": 0.003505939338023296, "grad_norm": 5.773492084076176, "learning_rate": 1.1815920398009951e-07, "loss": 1.8857, "step": 38 }, { "epoch": 0.003598200899550225, "grad_norm": 5.451277117015242, "learning_rate": 1.2126865671641792e-07, "loss": 2.0441, "step": 39 }, { "epoch": 0.0036904624610771537, "grad_norm": 2.696966431348262, "learning_rate": 1.2437810945273633e-07, "loss": 1.8209, "step": 40 }, { "epoch": 0.0036904624610771537, "eval_GEN Loss": 1.2069568634033203, "eval_GEN top-5 accuracy": 0.9149495835160018, "eval_PRM Accuracy": 0.660377358490566, "eval_PRM F1": 0.7831325301204819, "eval_PRM F1 AUC": 0.5002619172341539, "eval_PRM F1 Neg": 0.21739130434782608, "eval_PRM Loss": 0.6919686794281006, "eval_PRM NPV": 0.21739130434782608, "eval_PRM Precision": 0.7831325301204819, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.8411058187484741, "eval_runtime": 56.0246, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 40 }, { "epoch": 0.0037827240226040826, "grad_norm": 3.493866530933666, "learning_rate": 1.2748756218905472e-07, "loss": 1.6863, "step": 41 }, { "epoch": 0.0038749855841310114, "grad_norm": 2.6161801908482523, "learning_rate": 1.3059701492537313e-07, "loss": 1.7593, "step": 42 }, { "epoch": 0.00396724714565794, "grad_norm": 5.694591249676084, "learning_rate": 1.3370646766169154e-07, "loss": 1.6312, "step": 43 }, { "epoch": 0.004059508707184869, "grad_norm": 3.1568086255048233, "learning_rate": 1.3681592039800996e-07, "loss": 1.597, "step": 44 }, { "epoch": 0.0041517702687117975, "grad_norm": 3.587678655299929, "learning_rate": 1.3992537313432837e-07, "loss": 1.7693, "step": 45 }, { "epoch": 0.0041517702687117975, "eval_GEN Loss": 1.1930245161056519, "eval_GEN top-5 accuracy": 0.9149495835160018, "eval_PRM Accuracy": 0.6886792452830188, "eval_PRM F1": 0.8092485549132948, "eval_PRM F1 AUC": 0.48690413829229967, "eval_PRM F1 Neg": 0.15384615384615385, "eval_PRM Loss": 0.691718339920044, "eval_PRM NPV": 0.1875, "eval_PRM Precision": 0.7777777777777778, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.13043478260869565, "eval_loss": 1.8271634578704834, "eval_runtime": 55.8771, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 45 }, { "epoch": 0.004244031830238726, "grad_norm": 2.5237286778823944, "learning_rate": 1.4303482587064678e-07, "loss": 1.7863, "step": 46 }, { "epoch": 0.004336293391765655, "grad_norm": 5.26890923882605, "learning_rate": 1.461442786069652e-07, "loss": 1.8039, "step": 47 }, { "epoch": 0.004428554953292584, "grad_norm": 4.171052115799442, "learning_rate": 1.4925373134328358e-07, "loss": 1.7905, "step": 48 }, { "epoch": 0.004520816514819513, "grad_norm": 6.515718983622325, "learning_rate": 1.52363184079602e-07, "loss": 1.9001, "step": 49 }, { "epoch": 0.004613078076346442, "grad_norm": 4.372461415549234, "learning_rate": 1.554726368159204e-07, "loss": 1.8444, "step": 50 }, { "epoch": 0.004613078076346442, "eval_GEN Loss": 1.1805022954940796, "eval_GEN top-5 accuracy": 0.9153879877246821, "eval_PRM Accuracy": 0.6509433962264151, "eval_PRM F1": 0.783625730994152, "eval_PRM F1 AUC": 0.44709271870089057, "eval_PRM F1 Neg": 0.0975609756097561, "eval_PRM Loss": 0.69174724817276, "eval_PRM NPV": 0.1111111111111111, "eval_PRM Precision": 0.7613636363636364, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.08695652173913043, "eval_loss": 1.817307710647583, "eval_runtime": 55.9481, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 50 }, { "epoch": 0.004705339637873371, "grad_norm": 4.193248151423293, "learning_rate": 1.5858208955223882e-07, "loss": 2.1622, "step": 51 }, { "epoch": 0.0047976011994002995, "grad_norm": 4.623631435876188, "learning_rate": 1.6169154228855723e-07, "loss": 2.0667, "step": 52 }, { "epoch": 0.004889862760927228, "grad_norm": 3.345737382972426, "learning_rate": 1.6480099502487564e-07, "loss": 1.7507, "step": 53 }, { "epoch": 0.004982124322454157, "grad_norm": 3.9041233882558597, "learning_rate": 1.6791044776119405e-07, "loss": 1.818, "step": 54 }, { "epoch": 0.005074385883981086, "grad_norm": 5.298607880934922, "learning_rate": 1.7101990049751244e-07, "loss": 1.5183, "step": 55 }, { "epoch": 0.005074385883981086, "eval_GEN Loss": 1.1278165578842163, "eval_GEN top-5 accuracy": 0.9158263919333626, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6889498233795166, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.7629808187484741, "eval_runtime": 55.9126, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 55 }, { "epoch": 0.005166647445508015, "grad_norm": 3.336218883854023, "learning_rate": 1.7412935323383088e-07, "loss": 1.6167, "step": 56 }, { "epoch": 0.005258909007034944, "grad_norm": 3.8759513202112656, "learning_rate": 1.7723880597014926e-07, "loss": 1.7826, "step": 57 }, { "epoch": 0.005351170568561873, "grad_norm": 3.127856786853475, "learning_rate": 1.8034825870646767e-07, "loss": 1.9113, "step": 58 }, { "epoch": 0.0054434321300888015, "grad_norm": 4.326349376650393, "learning_rate": 1.834577114427861e-07, "loss": 1.7121, "step": 59 }, { "epoch": 0.00553569369161573, "grad_norm": 4.624249003919422, "learning_rate": 1.8656716417910447e-07, "loss": 1.5453, "step": 60 }, { "epoch": 0.00553569369161573, "eval_GEN Loss": 1.0909538269042969, "eval_GEN top-5 accuracy": 0.9158263919333626, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6880059242248535, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.7301682233810425, "eval_runtime": 56.7905, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 60 }, { "epoch": 0.005627955253142659, "grad_norm": 3.486124204854497, "learning_rate": 1.896766169154229e-07, "loss": 1.7168, "step": 61 }, { "epoch": 0.005720216814669588, "grad_norm": 4.489173258726614, "learning_rate": 1.927860696517413e-07, "loss": 1.6848, "step": 62 }, { "epoch": 0.005812478376196517, "grad_norm": 3.9397917707556602, "learning_rate": 1.9589552238805974e-07, "loss": 1.4471, "step": 63 }, { "epoch": 0.005904739937723446, "grad_norm": 2.6644880049876924, "learning_rate": 1.9900497512437812e-07, "loss": 1.7052, "step": 64 }, { "epoch": 0.005997001499250375, "grad_norm": 4.2575966052447285, "learning_rate": 2.0211442786069656e-07, "loss": 1.7001, "step": 65 }, { "epoch": 0.005997001499250375, "eval_GEN Loss": 1.064455270767212, "eval_GEN top-5 accuracy": 0.918456817185445, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6875361204147339, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.7044471502304077, "eval_runtime": 56.9189, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 65 }, { "epoch": 0.0060892630607773035, "grad_norm": 3.2355348663472263, "learning_rate": 2.0522388059701495e-07, "loss": 1.6682, "step": 66 }, { "epoch": 0.006181524622304232, "grad_norm": 3.071024405471419, "learning_rate": 2.0833333333333333e-07, "loss": 1.6072, "step": 67 }, { "epoch": 0.006273786183831161, "grad_norm": 3.554680940774165, "learning_rate": 2.1144278606965177e-07, "loss": 1.7963, "step": 68 }, { "epoch": 0.00636604774535809, "grad_norm": 2.5298879543430677, "learning_rate": 2.1455223880597016e-07, "loss": 1.6359, "step": 69 }, { "epoch": 0.006458309306885019, "grad_norm": 6.083087924089791, "learning_rate": 2.176616915422886e-07, "loss": 1.8998, "step": 70 }, { "epoch": 0.006458309306885019, "eval_GEN Loss": 1.0378422737121582, "eval_GEN top-5 accuracy": 0.9197720298114862, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6867654323577881, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.6774038076400757, "eval_runtime": 55.8194, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 70 }, { "epoch": 0.006550570868411948, "grad_norm": 2.9042617792127965, "learning_rate": 2.2077114427860698e-07, "loss": 1.8414, "step": 71 }, { "epoch": 0.006642832429938877, "grad_norm": 4.244590383180499, "learning_rate": 2.2388059701492537e-07, "loss": 1.6526, "step": 72 }, { "epoch": 0.0067350939914658054, "grad_norm": 3.3203920579098694, "learning_rate": 2.269900497512438e-07, "loss": 1.5533, "step": 73 }, { "epoch": 0.006827355552992734, "grad_norm": 1.744830315172512, "learning_rate": 2.300995024875622e-07, "loss": 1.3191, "step": 74 }, { "epoch": 0.006919617114519663, "grad_norm": 4.326451307986983, "learning_rate": 2.3320895522388063e-07, "loss": 1.5463, "step": 75 }, { "epoch": 0.006919617114519663, "eval_GEN Loss": 0.9482924938201904, "eval_GEN top-5 accuracy": 0.9224024550635687, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6790199875831604, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.5992788076400757, "eval_runtime": 56.734, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 75 }, { "epoch": 0.007011878676046592, "grad_norm": 2.1644395245838948, "learning_rate": 2.3631840796019902e-07, "loss": 1.5132, "step": 76 }, { "epoch": 0.007104140237573521, "grad_norm": 5.274809047495626, "learning_rate": 2.394278606965174e-07, "loss": 1.434, "step": 77 }, { "epoch": 0.00719640179910045, "grad_norm": 2.813602299901219, "learning_rate": 2.4253731343283584e-07, "loss": 1.4597, "step": 78 }, { "epoch": 0.007288663360627379, "grad_norm": 2.023967194882434, "learning_rate": 2.4564676616915423e-07, "loss": 1.4597, "step": 79 }, { "epoch": 0.007380924922154307, "grad_norm": 2.3835753067138805, "learning_rate": 2.4875621890547267e-07, "loss": 1.4664, "step": 80 }, { "epoch": 0.007380924922154307, "eval_GEN Loss": 0.8692818284034729, "eval_GEN top-5 accuracy": 0.9285401139850943, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6763344407081604, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.526802897453308, "eval_runtime": 56.8248, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 80 }, { "epoch": 0.007473186483681236, "grad_norm": 3.2167315704974158, "learning_rate": 2.5186567164179105e-07, "loss": 1.4135, "step": 81 }, { "epoch": 0.007565448045208165, "grad_norm": 2.8205981850032686, "learning_rate": 2.5497512437810944e-07, "loss": 1.4354, "step": 82 }, { "epoch": 0.007657709606735094, "grad_norm": 2.518582934298941, "learning_rate": 2.580845771144279e-07, "loss": 1.4236, "step": 83 }, { "epoch": 0.007749971168262023, "grad_norm": 4.025192935451012, "learning_rate": 2.6119402985074626e-07, "loss": 1.5447, "step": 84 }, { "epoch": 0.00784223272978895, "grad_norm": 3.937779371079708, "learning_rate": 2.643034825870647e-07, "loss": 1.5491, "step": 85 }, { "epoch": 0.00784223272978895, "eval_GEN Loss": 0.8156515955924988, "eval_GEN top-5 accuracy": 0.9368697939500219, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6749014854431152, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.4822115898132324, "eval_runtime": 56.7923, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 85 }, { "epoch": 0.00793449429131588, "grad_norm": 4.373961075167894, "learning_rate": 2.674129353233831e-07, "loss": 1.5427, "step": 86 }, { "epoch": 0.008026755852842809, "grad_norm": 4.003591369571609, "learning_rate": 2.7052238805970147e-07, "loss": 1.5683, "step": 87 }, { "epoch": 0.008119017414369737, "grad_norm": 1.9910457980372962, "learning_rate": 2.736318407960199e-07, "loss": 1.508, "step": 88 }, { "epoch": 0.008211278975896666, "grad_norm": 3.5811749558032298, "learning_rate": 2.767412935323383e-07, "loss": 1.434, "step": 89 }, { "epoch": 0.008303540537423595, "grad_norm": 2.949039054324564, "learning_rate": 2.7985074626865674e-07, "loss": 1.2979, "step": 90 }, { "epoch": 0.008303540537423595, "eval_GEN Loss": 0.7697263956069946, "eval_GEN top-5 accuracy": 0.9421306444541867, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6727759838104248, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.4397836923599243, "eval_runtime": 56.0328, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 90 }, { "epoch": 0.008395802098950524, "grad_norm": 4.300210380913143, "learning_rate": 2.829601990049751e-07, "loss": 1.3892, "step": 91 }, { "epoch": 0.008488063660477453, "grad_norm": 4.497865551632025, "learning_rate": 2.8606965174129356e-07, "loss": 1.3393, "step": 92 }, { "epoch": 0.008580325222004382, "grad_norm": 3.681475742018798, "learning_rate": 2.8917910447761195e-07, "loss": 1.3857, "step": 93 }, { "epoch": 0.00867258678353131, "grad_norm": 4.2811633470511605, "learning_rate": 2.922885572139304e-07, "loss": 1.5033, "step": 94 }, { "epoch": 0.00876484834505824, "grad_norm": 2.6063769382613136, "learning_rate": 2.9539800995024877e-07, "loss": 1.3467, "step": 95 }, { "epoch": 0.00876484834505824, "eval_GEN Loss": 0.7327077984809875, "eval_GEN top-5 accuracy": 0.9465146865409908, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6708540916442871, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.4075721502304077, "eval_runtime": 55.936, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 95 }, { "epoch": 0.008857109906585168, "grad_norm": 2.280241426078729, "learning_rate": 2.9850746268656716e-07, "loss": 1.4608, "step": 96 }, { "epoch": 0.008949371468112097, "grad_norm": 3.237155480971528, "learning_rate": 3.016169154228856e-07, "loss": 1.3498, "step": 97 }, { "epoch": 0.009041633029639026, "grad_norm": 4.845276940236311, "learning_rate": 3.04726368159204e-07, "loss": 1.4412, "step": 98 }, { "epoch": 0.009133894591165955, "grad_norm": 2.6876818129375284, "learning_rate": 3.078358208955224e-07, "loss": 1.4279, "step": 99 }, { "epoch": 0.009226156152692884, "grad_norm": 4.503626692399455, "learning_rate": 3.109452736318408e-07, "loss": 1.4015, "step": 100 }, { "epoch": 0.009226156152692884, "eval_GEN Loss": 0.6929720044136047, "eval_GEN top-5 accuracy": 0.9504603244191144, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6667302250862122, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.3634614944458008, "eval_runtime": 56.041, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 100 }, { "epoch": 0.009318417714219812, "grad_norm": 3.162280791834292, "learning_rate": 3.1405472636815924e-07, "loss": 1.386, "step": 101 }, { "epoch": 0.009410679275746741, "grad_norm": 3.5415551551296294, "learning_rate": 3.1716417910447763e-07, "loss": 1.3551, "step": 102 }, { "epoch": 0.00950294083727367, "grad_norm": 2.59884729682728, "learning_rate": 3.2027363184079607e-07, "loss": 1.3806, "step": 103 }, { "epoch": 0.009595202398800599, "grad_norm": 2.654981055039507, "learning_rate": 3.2338308457711446e-07, "loss": 1.321, "step": 104 }, { "epoch": 0.009687463960327528, "grad_norm": 2.2640850649522335, "learning_rate": 3.2649253731343284e-07, "loss": 1.3313, "step": 105 }, { "epoch": 0.009687463960327528, "eval_GEN Loss": 0.6564959287643433, "eval_GEN top-5 accuracy": 0.958790004384042, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6540261507034302, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.3162260055541992, "eval_runtime": 56.1397, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 105 }, { "epoch": 0.009779725521854457, "grad_norm": 2.6718127266221456, "learning_rate": 3.296019900497513e-07, "loss": 1.2695, "step": 106 }, { "epoch": 0.009871987083381386, "grad_norm": 2.3077499382198243, "learning_rate": 3.3271144278606967e-07, "loss": 1.3066, "step": 107 }, { "epoch": 0.009964248644908314, "grad_norm": 3.7464571642834916, "learning_rate": 3.358208955223881e-07, "loss": 1.2675, "step": 108 }, { "epoch": 0.010056510206435243, "grad_norm": 2.244849109531541, "learning_rate": 3.389303482587065e-07, "loss": 1.3297, "step": 109 }, { "epoch": 0.010148771767962172, "grad_norm": 3.3919027523850445, "learning_rate": 3.420398009950249e-07, "loss": 1.2619, "step": 110 }, { "epoch": 0.010148771767962172, "eval_GEN Loss": 0.632244348526001, "eval_GEN top-5 accuracy": 0.9644892590968873, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.64864581823349, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2882211208343506, "eval_runtime": 55.9108, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 110 }, { "epoch": 0.010241033329489101, "grad_norm": 1.487790956636087, "learning_rate": 3.451492537313433e-07, "loss": 1.1671, "step": 111 }, { "epoch": 0.01033329489101603, "grad_norm": 1.949272382635497, "learning_rate": 3.4825870646766175e-07, "loss": 1.4099, "step": 112 }, { "epoch": 0.010425556452542959, "grad_norm": 1.8034335034787636, "learning_rate": 3.5136815920398014e-07, "loss": 1.1681, "step": 113 }, { "epoch": 0.010517818014069888, "grad_norm": 2.3584905317190623, "learning_rate": 3.544776119402985e-07, "loss": 1.3049, "step": 114 }, { "epoch": 0.010610079575596816, "grad_norm": 4.7832735810400075, "learning_rate": 3.575870646766169e-07, "loss": 1.19, "step": 115 }, { "epoch": 0.010610079575596816, "eval_GEN Loss": 0.6159378290176392, "eval_GEN top-5 accuracy": 0.9675580885576501, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.646122932434082, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2694711685180664, "eval_runtime": 56.8869, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 115 }, { "epoch": 0.010702341137123745, "grad_norm": 3.159208513024856, "learning_rate": 3.6069651741293535e-07, "loss": 1.2334, "step": 116 }, { "epoch": 0.010794602698650674, "grad_norm": 2.7159029094213345, "learning_rate": 3.638059701492538e-07, "loss": 1.2048, "step": 117 }, { "epoch": 0.010886864260177603, "grad_norm": 5.919509251949845, "learning_rate": 3.669154228855722e-07, "loss": 1.1744, "step": 118 }, { "epoch": 0.010979125821704532, "grad_norm": 3.387517453611791, "learning_rate": 3.7002487562189056e-07, "loss": 1.239, "step": 119 }, { "epoch": 0.01107138738323146, "grad_norm": 3.0146841098526593, "learning_rate": 3.7313432835820895e-07, "loss": 1.29, "step": 120 }, { "epoch": 0.01107138738323146, "eval_GEN Loss": 0.6037746667861938, "eval_GEN top-5 accuracy": 0.9693117053923718, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6428813338279724, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2550480365753174, "eval_runtime": 56.9415, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 120 }, { "epoch": 0.01116364894475839, "grad_norm": 2.3794434955477186, "learning_rate": 3.7624378109452744e-07, "loss": 1.1949, "step": 121 }, { "epoch": 0.011255910506285318, "grad_norm": 3.322725738719409, "learning_rate": 3.793532338308458e-07, "loss": 1.2007, "step": 122 }, { "epoch": 0.011348172067812247, "grad_norm": 3.2082068601478473, "learning_rate": 3.824626865671642e-07, "loss": 1.2183, "step": 123 }, { "epoch": 0.011440433629339176, "grad_norm": 2.1721049460512023, "learning_rate": 3.855721393034826e-07, "loss": 1.2992, "step": 124 }, { "epoch": 0.011532695190866105, "grad_norm": 4.970164595238515, "learning_rate": 3.88681592039801e-07, "loss": 1.3881, "step": 125 }, { "epoch": 0.011532695190866105, "eval_GEN Loss": 0.5954346656799316, "eval_GEN top-5 accuracy": 0.9693117053923718, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.637204647064209, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2435096502304077, "eval_runtime": 56.9017, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 125 }, { "epoch": 0.011624956752393034, "grad_norm": 2.140319140328948, "learning_rate": 3.9179104477611947e-07, "loss": 1.3041, "step": 126 }, { "epoch": 0.011717218313919963, "grad_norm": 1.6493112799847287, "learning_rate": 3.9490049751243786e-07, "loss": 1.2208, "step": 127 }, { "epoch": 0.011809479875446892, "grad_norm": 2.361177425828381, "learning_rate": 3.9800995024875624e-07, "loss": 1.2167, "step": 128 }, { "epoch": 0.01190174143697382, "grad_norm": 1.575569515428191, "learning_rate": 4.0111940298507463e-07, "loss": 1.1579, "step": 129 }, { "epoch": 0.01199400299850075, "grad_norm": 1.954657491756902, "learning_rate": 4.042288557213931e-07, "loss": 1.2077, "step": 130 }, { "epoch": 0.01199400299850075, "eval_GEN Loss": 0.5868880748748779, "eval_GEN top-5 accuracy": 0.9697501096010521, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6340000033378601, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2335336208343506, "eval_runtime": 56.7979, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 130 }, { "epoch": 0.012086264560027678, "grad_norm": 3.3479998825199906, "learning_rate": 4.073383084577115e-07, "loss": 1.0645, "step": 131 }, { "epoch": 0.012178526121554607, "grad_norm": 3.8275086734185106, "learning_rate": 4.104477611940299e-07, "loss": 1.3601, "step": 132 }, { "epoch": 0.012270787683081536, "grad_norm": 1.6417110032987758, "learning_rate": 4.135572139303483e-07, "loss": 1.226, "step": 133 }, { "epoch": 0.012363049244608465, "grad_norm": 4.253174971807062, "learning_rate": 4.1666666666666667e-07, "loss": 1.187, "step": 134 }, { "epoch": 0.012455310806135394, "grad_norm": 2.4885860148602372, "learning_rate": 4.1977611940298516e-07, "loss": 1.2166, "step": 135 }, { "epoch": 0.012455310806135394, "eval_GEN Loss": 0.5787835121154785, "eval_GEN top-5 accuracy": 0.9706269180184129, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.630656361579895, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2252403497695923, "eval_runtime": 56.7719, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 135 }, { "epoch": 0.012547572367662322, "grad_norm": 3.8927966197390105, "learning_rate": 4.2288557213930354e-07, "loss": 1.3302, "step": 136 }, { "epoch": 0.012639833929189251, "grad_norm": 2.322490627211395, "learning_rate": 4.2599502487562193e-07, "loss": 1.2212, "step": 137 }, { "epoch": 0.01273209549071618, "grad_norm": 4.256376338969038, "learning_rate": 4.291044776119403e-07, "loss": 1.1828, "step": 138 }, { "epoch": 0.012824357052243109, "grad_norm": 2.197689682736893, "learning_rate": 4.322139303482587e-07, "loss": 1.148, "step": 139 }, { "epoch": 0.012916618613770038, "grad_norm": 2.524441418608464, "learning_rate": 4.353233830845772e-07, "loss": 1.2342, "step": 140 }, { "epoch": 0.012916618613770038, "eval_GEN Loss": 0.572195291519165, "eval_GEN top-5 accuracy": 0.9710653222270934, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6265490055084229, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2159855365753174, "eval_runtime": 56.7698, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 140 }, { "epoch": 0.013008880175296967, "grad_norm": 1.8499524568910997, "learning_rate": 4.384328358208956e-07, "loss": 1.1273, "step": 141 }, { "epoch": 0.013101141736823895, "grad_norm": 4.305504027393469, "learning_rate": 4.4154228855721396e-07, "loss": 1.2465, "step": 142 }, { "epoch": 0.013193403298350824, "grad_norm": 3.3734445402391686, "learning_rate": 4.4465174129353235e-07, "loss": 1.2308, "step": 143 }, { "epoch": 0.013285664859877753, "grad_norm": 1.3413274073357973, "learning_rate": 4.4776119402985074e-07, "loss": 1.1872, "step": 144 }, { "epoch": 0.013377926421404682, "grad_norm": 1.341728169252834, "learning_rate": 4.5087064676616923e-07, "loss": 1.115, "step": 145 }, { "epoch": 0.013377926421404682, "eval_GEN Loss": 0.5650824308395386, "eval_GEN top-5 accuracy": 0.9710653222270934, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6218520402908325, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2105768918991089, "eval_runtime": 56.9056, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 145 }, { "epoch": 0.013470187982931611, "grad_norm": 3.6616799188033853, "learning_rate": 4.539800995024876e-07, "loss": 1.1553, "step": 146 }, { "epoch": 0.01356244954445854, "grad_norm": 2.5202344461470774, "learning_rate": 4.57089552238806e-07, "loss": 1.1569, "step": 147 }, { "epoch": 0.013654711105985469, "grad_norm": 4.192930250780877, "learning_rate": 4.601990049751244e-07, "loss": 1.1474, "step": 148 }, { "epoch": 0.013746972667512397, "grad_norm": 3.937700910615772, "learning_rate": 4.6330845771144277e-07, "loss": 1.17, "step": 149 }, { "epoch": 0.013839234229039326, "grad_norm": 1.5356498681091049, "learning_rate": 4.6641791044776126e-07, "loss": 1.0327, "step": 150 }, { "epoch": 0.013839234229039326, "eval_GEN Loss": 0.5591273903846741, "eval_GEN top-5 accuracy": 0.9723805348531346, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6177559494972229, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.2018028497695923, "eval_runtime": 55.7981, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 150 }, { "epoch": 0.013931495790566255, "grad_norm": 3.426476007703366, "learning_rate": 4.6952736318407965e-07, "loss": 1.0698, "step": 151 }, { "epoch": 0.014023757352093184, "grad_norm": 3.84524761100555, "learning_rate": 4.7263681592039803e-07, "loss": 1.1573, "step": 152 }, { "epoch": 0.014116018913620113, "grad_norm": 2.700267632870109, "learning_rate": 4.757462686567164e-07, "loss": 1.1669, "step": 153 }, { "epoch": 0.014208280475147042, "grad_norm": 2.5411199119199406, "learning_rate": 4.788557213930348e-07, "loss": 1.127, "step": 154 }, { "epoch": 0.01430054203667397, "grad_norm": 2.630794237531673, "learning_rate": 4.819651741293534e-07, "loss": 1.1384, "step": 155 }, { "epoch": 0.01430054203667397, "eval_GEN Loss": 0.5535362362861633, "eval_GEN top-5 accuracy": 0.9723805348531346, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6125956177711487, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1959134340286255, "eval_runtime": 56.0126, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 155 }, { "epoch": 0.0143928035982009, "grad_norm": 3.0187035031997502, "learning_rate": 4.850746268656717e-07, "loss": 1.3768, "step": 156 }, { "epoch": 0.014485065159727828, "grad_norm": 2.911667717269186, "learning_rate": 4.881840796019901e-07, "loss": 1.2243, "step": 157 }, { "epoch": 0.014577326721254757, "grad_norm": 3.201497950034923, "learning_rate": 4.912935323383085e-07, "loss": 1.2479, "step": 158 }, { "epoch": 0.014669588282781686, "grad_norm": 4.372336363957918, "learning_rate": 4.944029850746269e-07, "loss": 1.0542, "step": 159 }, { "epoch": 0.014761849844308615, "grad_norm": 1.7042290709906678, "learning_rate": 4.975124378109453e-07, "loss": 1.1225, "step": 160 }, { "epoch": 0.014761849844308615, "eval_GEN Loss": 0.5486795902252197, "eval_GEN top-5 accuracy": 0.9723805348531346, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6068178415298462, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1885817050933838, "eval_runtime": 55.8918, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 160 }, { "epoch": 0.014854111405835544, "grad_norm": 2.2313977327125945, "learning_rate": 5.006218905472638e-07, "loss": 1.2895, "step": 161 }, { "epoch": 0.014946372967362473, "grad_norm": 1.6765634851215816, "learning_rate": 5.037313432835821e-07, "loss": 1.1747, "step": 162 }, { "epoch": 0.015038634528889401, "grad_norm": 2.3646330611673934, "learning_rate": 5.068407960199005e-07, "loss": 1.0631, "step": 163 }, { "epoch": 0.01513089609041633, "grad_norm": 2.6665593945894877, "learning_rate": 5.099502487562189e-07, "loss": 1.0604, "step": 164 }, { "epoch": 0.015223157651943259, "grad_norm": 3.6891562290617297, "learning_rate": 5.130597014925374e-07, "loss": 1.2219, "step": 165 }, { "epoch": 0.015223157651943259, "eval_GEN Loss": 0.5440877676010132, "eval_GEN top-5 accuracy": 0.972818939061815, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.6010922193527222, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1805288791656494, "eval_runtime": 55.9587, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 165 }, { "epoch": 0.015315419213470188, "grad_norm": 3.499835361395495, "learning_rate": 5.161691542288558e-07, "loss": 1.1838, "step": 166 }, { "epoch": 0.015407680774997117, "grad_norm": 1.9058665102788184, "learning_rate": 5.192786069651742e-07, "loss": 1.1222, "step": 167 }, { "epoch": 0.015499942336524046, "grad_norm": 1.7497038975039427, "learning_rate": 5.223880597014925e-07, "loss": 1.1473, "step": 168 }, { "epoch": 0.015592203898050975, "grad_norm": 1.376208125069818, "learning_rate": 5.25497512437811e-07, "loss": 1.2389, "step": 169 }, { "epoch": 0.0156844654595779, "grad_norm": 1.506267183082681, "learning_rate": 5.286069651741294e-07, "loss": 1.1814, "step": 170 }, { "epoch": 0.0156844654595779, "eval_GEN Loss": 0.5395631790161133, "eval_GEN top-5 accuracy": 0.9719421306444542, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5953467488288879, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1742788553237915, "eval_runtime": 55.8564, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 170 }, { "epoch": 0.01577672702110483, "grad_norm": 1.4669207809936677, "learning_rate": 5.317164179104478e-07, "loss": 1.104, "step": 171 }, { "epoch": 0.01586898858263176, "grad_norm": 3.187983413829535, "learning_rate": 5.348258706467662e-07, "loss": 1.1191, "step": 172 }, { "epoch": 0.015961250144158688, "grad_norm": 2.263443121489794, "learning_rate": 5.379353233830846e-07, "loss": 1.3148, "step": 173 }, { "epoch": 0.016053511705685617, "grad_norm": 1.6708278469196651, "learning_rate": 5.410447761194029e-07, "loss": 1.0963, "step": 174 }, { "epoch": 0.016145773267212546, "grad_norm": 1.2433902795383085, "learning_rate": 5.441542288557215e-07, "loss": 1.1433, "step": 175 }, { "epoch": 0.016145773267212546, "eval_GEN Loss": 0.5355656147003174, "eval_GEN top-5 accuracy": 0.972818939061815, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5899839401245117, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1680288314819336, "eval_runtime": 56.0484, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 175 }, { "epoch": 0.016238034828739475, "grad_norm": 3.123639407344628, "learning_rate": 5.472636815920398e-07, "loss": 1.0163, "step": 176 }, { "epoch": 0.016330296390266404, "grad_norm": 2.0634700843488134, "learning_rate": 5.503731343283583e-07, "loss": 1.0857, "step": 177 }, { "epoch": 0.016422557951793332, "grad_norm": 1.3954752682063847, "learning_rate": 5.534825870646766e-07, "loss": 1.157, "step": 178 }, { "epoch": 0.01651481951332026, "grad_norm": 2.3945957166778307, "learning_rate": 5.565920398009951e-07, "loss": 1.1593, "step": 179 }, { "epoch": 0.01660708107484719, "grad_norm": 2.0141835860911446, "learning_rate": 5.597014925373135e-07, "loss": 1.1564, "step": 180 }, { "epoch": 0.01660708107484719, "eval_GEN Loss": 0.5322163701057434, "eval_GEN top-5 accuracy": 0.9723805348531346, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5848449468612671, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1637018918991089, "eval_runtime": 56.2358, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 180 }, { "epoch": 0.01669934263637412, "grad_norm": 1.7479021559057548, "learning_rate": 5.628109452736319e-07, "loss": 1.1356, "step": 181 }, { "epoch": 0.016791604197901048, "grad_norm": 2.6506406095324624, "learning_rate": 5.659203980099502e-07, "loss": 1.0324, "step": 182 }, { "epoch": 0.016883865759427977, "grad_norm": 2.142269070565063, "learning_rate": 5.690298507462687e-07, "loss": 1.1757, "step": 183 }, { "epoch": 0.016976127320954906, "grad_norm": 1.392911091467902, "learning_rate": 5.721393034825871e-07, "loss": 1.1192, "step": 184 }, { "epoch": 0.017068388882481834, "grad_norm": 3.234694851702116, "learning_rate": 5.752487562189056e-07, "loss": 0.9247, "step": 185 }, { "epoch": 0.017068388882481834, "eval_GEN Loss": 0.5290143489837646, "eval_GEN top-5 accuracy": 0.9736957474791758, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5798476934432983, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1593749523162842, "eval_runtime": 55.7916, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 185 }, { "epoch": 0.017160650444008763, "grad_norm": 3.262504360848584, "learning_rate": 5.783582089552239e-07, "loss": 1.1936, "step": 186 }, { "epoch": 0.017252912005535692, "grad_norm": 1.2351033356893326, "learning_rate": 5.814676616915423e-07, "loss": 1.1101, "step": 187 }, { "epoch": 0.01734517356706262, "grad_norm": 2.9221099184657735, "learning_rate": 5.845771144278608e-07, "loss": 1.1287, "step": 188 }, { "epoch": 0.01743743512858955, "grad_norm": 1.2464805163577264, "learning_rate": 5.876865671641792e-07, "loss": 1.1525, "step": 189 }, { "epoch": 0.01752969669011648, "grad_norm": 1.719012479550381, "learning_rate": 5.907960199004975e-07, "loss": 1.2659, "step": 190 }, { "epoch": 0.01752969669011648, "eval_GEN Loss": 0.526759922504425, "eval_GEN top-5 accuracy": 0.972818939061815, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5763874650001526, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1551682949066162, "eval_runtime": 55.8238, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 190 }, { "epoch": 0.017621958251643408, "grad_norm": 2.036814904860174, "learning_rate": 5.93905472636816e-07, "loss": 1.1664, "step": 191 }, { "epoch": 0.017714219813170336, "grad_norm": 1.9093392405912946, "learning_rate": 5.970149253731343e-07, "loss": 1.0943, "step": 192 }, { "epoch": 0.017806481374697265, "grad_norm": 1.569505782183973, "learning_rate": 6.001243781094528e-07, "loss": 1.0698, "step": 193 }, { "epoch": 0.017898742936224194, "grad_norm": 1.5582990636644043, "learning_rate": 6.032338308457712e-07, "loss": 1.2057, "step": 194 }, { "epoch": 0.017991004497751123, "grad_norm": 1.8711371605271108, "learning_rate": 6.063432835820896e-07, "loss": 1.2447, "step": 195 }, { "epoch": 0.017991004497751123, "eval_GEN Loss": 0.5234596133232117, "eval_GEN top-5 accuracy": 0.9736957474791758, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5738641619682312, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1536058187484741, "eval_runtime": 56.0063, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 195 }, { "epoch": 0.018083266059278052, "grad_norm": 3.374081738855087, "learning_rate": 6.09452736318408e-07, "loss": 1.0396, "step": 196 }, { "epoch": 0.01817552762080498, "grad_norm": 2.2035285361727652, "learning_rate": 6.125621890547264e-07, "loss": 1.1203, "step": 197 }, { "epoch": 0.01826778918233191, "grad_norm": 2.467382046802569, "learning_rate": 6.156716417910448e-07, "loss": 1.0652, "step": 198 }, { "epoch": 0.01836005074385884, "grad_norm": 1.3431188681413289, "learning_rate": 6.187810945273633e-07, "loss": 1.1854, "step": 199 }, { "epoch": 0.018452312305385767, "grad_norm": 1.850275067257811, "learning_rate": 6.218905472636816e-07, "loss": 1.0531, "step": 200 }, { "epoch": 0.018452312305385767, "eval_GEN Loss": 0.5223154425621033, "eval_GEN top-5 accuracy": 0.9736957474791758, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5719572901725769, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1526442766189575, "eval_runtime": 55.998, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 200 }, { "epoch": 0.018544573866912696, "grad_norm": 1.8369164323211342, "learning_rate": 6.25e-07, "loss": 1.0348, "step": 201 }, { "epoch": 0.018636835428439625, "grad_norm": 4.042908754628373, "learning_rate": 6.281094527363185e-07, "loss": 1.2664, "step": 202 }, { "epoch": 0.018729096989966554, "grad_norm": 1.8835558742943022, "learning_rate": 6.312189054726368e-07, "loss": 1.1774, "step": 203 }, { "epoch": 0.018821358551493483, "grad_norm": 1.5364103259559745, "learning_rate": 6.343283582089553e-07, "loss": 1.2211, "step": 204 }, { "epoch": 0.01891362011302041, "grad_norm": 1.6463932144779783, "learning_rate": 6.374378109452736e-07, "loss": 1.2084, "step": 205 }, { "epoch": 0.01891362011302041, "eval_GEN Loss": 0.5205348134040833, "eval_GEN top-5 accuracy": 0.9754493643138974, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5690513849258423, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1484375, "eval_runtime": 56.0259, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 205 }, { "epoch": 0.01900588167454734, "grad_norm": 3.022050229054206, "learning_rate": 6.405472636815921e-07, "loss": 1.0556, "step": 206 }, { "epoch": 0.01909814323607427, "grad_norm": 3.5266726313156043, "learning_rate": 6.436567164179106e-07, "loss": 1.1038, "step": 207 }, { "epoch": 0.019190404797601198, "grad_norm": 1.2466144988035346, "learning_rate": 6.467661691542289e-07, "loss": 1.0974, "step": 208 }, { "epoch": 0.019282666359128127, "grad_norm": 1.962282295115707, "learning_rate": 6.498756218905473e-07, "loss": 1.0972, "step": 209 }, { "epoch": 0.019374927920655056, "grad_norm": 2.0357105644300755, "learning_rate": 6.529850746268657e-07, "loss": 1.1944, "step": 210 }, { "epoch": 0.019374927920655056, "eval_GEN Loss": 0.5192821025848389, "eval_GEN top-5 accuracy": 0.9736957474791758, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5659216046333313, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1461538076400757, "eval_runtime": 55.9503, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 210 }, { "epoch": 0.019467189482181985, "grad_norm": 2.506291963518388, "learning_rate": 6.560945273631841e-07, "loss": 1.1764, "step": 211 }, { "epoch": 0.019559451043708913, "grad_norm": 1.1739892120429067, "learning_rate": 6.592039800995026e-07, "loss": 1.1399, "step": 212 }, { "epoch": 0.019651712605235842, "grad_norm": 1.6811487213429959, "learning_rate": 6.623134328358209e-07, "loss": 1.1451, "step": 213 }, { "epoch": 0.01974397416676277, "grad_norm": 2.340710465050252, "learning_rate": 6.654228855721393e-07, "loss": 1.0598, "step": 214 }, { "epoch": 0.0198362357282897, "grad_norm": 2.8002553717549903, "learning_rate": 6.685323383084577e-07, "loss": 1.0842, "step": 215 }, { "epoch": 0.0198362357282897, "eval_GEN Loss": 0.5170443058013916, "eval_GEN top-5 accuracy": 0.9745725558965366, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5624172687530518, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.143990397453308, "eval_runtime": 55.9108, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 215 }, { "epoch": 0.01992849728981663, "grad_norm": 3.214947687116344, "learning_rate": 6.716417910447762e-07, "loss": 1.1459, "step": 216 }, { "epoch": 0.020020758851343558, "grad_norm": 3.029276370298952, "learning_rate": 6.747512437810946e-07, "loss": 1.0847, "step": 217 }, { "epoch": 0.020113020412870487, "grad_norm": 1.663984961233634, "learning_rate": 6.77860696517413e-07, "loss": 1.2899, "step": 218 }, { "epoch": 0.020205281974397415, "grad_norm": 1.4544759741871345, "learning_rate": 6.809701492537314e-07, "loss": 1.1231, "step": 219 }, { "epoch": 0.020297543535924344, "grad_norm": 2.203854407410451, "learning_rate": 6.840796019900498e-07, "loss": 1.1777, "step": 220 }, { "epoch": 0.020297543535924344, "eval_GEN Loss": 0.5135334730148315, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5585988163948059, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.137379765510559, "eval_runtime": 56.0845, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 220 }, { "epoch": 0.020389805097451273, "grad_norm": 2.0670558917920747, "learning_rate": 6.871890547263682e-07, "loss": 1.1395, "step": 221 }, { "epoch": 0.020482066658978202, "grad_norm": 2.8771722472921004, "learning_rate": 6.902985074626866e-07, "loss": 0.9456, "step": 222 }, { "epoch": 0.02057432822050513, "grad_norm": 1.3261488963028663, "learning_rate": 6.93407960199005e-07, "loss": 1.0876, "step": 223 }, { "epoch": 0.02066658978203206, "grad_norm": 1.5730855667159154, "learning_rate": 6.965174129353235e-07, "loss": 1.0239, "step": 224 }, { "epoch": 0.02075885134355899, "grad_norm": 3.621240004877932, "learning_rate": 6.996268656716417e-07, "loss": 0.8469, "step": 225 }, { "epoch": 0.02075885134355899, "eval_GEN Loss": 0.5120242834091187, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5553549528121948, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1325721740722656, "eval_runtime": 56.002, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 225 }, { "epoch": 0.020851112905085917, "grad_norm": 1.484888422594663, "learning_rate": 7.027363184079603e-07, "loss": 1.0099, "step": 226 }, { "epoch": 0.020943374466612846, "grad_norm": 1.3755576735455195, "learning_rate": 7.058457711442787e-07, "loss": 1.1258, "step": 227 }, { "epoch": 0.021035636028139775, "grad_norm": 1.2243039274674814, "learning_rate": 7.08955223880597e-07, "loss": 1.0561, "step": 228 }, { "epoch": 0.021127897589666704, "grad_norm": 2.2021697636941155, "learning_rate": 7.120646766169155e-07, "loss": 1.1327, "step": 229 }, { "epoch": 0.021220159151193633, "grad_norm": 3.22855391632117, "learning_rate": 7.151741293532338e-07, "loss": 1.088, "step": 230 }, { "epoch": 0.021220159151193633, "eval_GEN Loss": 0.5095731616020203, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5523665547370911, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1322115659713745, "eval_runtime": 55.9755, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 230 }, { "epoch": 0.02131242071272056, "grad_norm": 2.1624933493323497, "learning_rate": 7.182835820895523e-07, "loss": 0.9234, "step": 231 }, { "epoch": 0.02140468227424749, "grad_norm": 1.9286550194070369, "learning_rate": 7.213930348258707e-07, "loss": 1.1006, "step": 232 }, { "epoch": 0.02149694383577442, "grad_norm": 1.9879188571883055, "learning_rate": 7.24502487562189e-07, "loss": 1.0354, "step": 233 }, { "epoch": 0.02158920539730135, "grad_norm": 1.7033235635672739, "learning_rate": 7.276119402985076e-07, "loss": 1.1862, "step": 234 }, { "epoch": 0.021681466958828277, "grad_norm": 2.971431635426475, "learning_rate": 7.307213930348259e-07, "loss": 0.8153, "step": 235 }, { "epoch": 0.021681466958828277, "eval_GEN Loss": 0.5085355639457703, "eval_GEN top-5 accuracy": 0.9763261727312582, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5487057566642761, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.131009578704834, "eval_runtime": 56.2583, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 235 }, { "epoch": 0.021773728520355206, "grad_norm": 2.3170545130056195, "learning_rate": 7.338308457711443e-07, "loss": 0.9272, "step": 236 }, { "epoch": 0.021865990081882135, "grad_norm": 2.5063211979179623, "learning_rate": 7.369402985074628e-07, "loss": 1.1512, "step": 237 }, { "epoch": 0.021958251643409064, "grad_norm": 2.6050090210752845, "learning_rate": 7.400497512437811e-07, "loss": 1.1128, "step": 238 }, { "epoch": 0.022050513204935993, "grad_norm": 0.9438638212182147, "learning_rate": 7.431592039800996e-07, "loss": 1.0492, "step": 239 }, { "epoch": 0.02214277476646292, "grad_norm": 1.7367803016092296, "learning_rate": 7.462686567164179e-07, "loss": 1.0682, "step": 240 }, { "epoch": 0.02214277476646292, "eval_GEN Loss": 0.5049706697463989, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5450387001037598, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1257210969924927, "eval_runtime": 55.9463, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 240 }, { "epoch": 0.02223503632798985, "grad_norm": 1.0587270737449548, "learning_rate": 7.493781094527363e-07, "loss": 1.0032, "step": 241 }, { "epoch": 0.02232729788951678, "grad_norm": 1.5482171931689053, "learning_rate": 7.524875621890549e-07, "loss": 1.1029, "step": 242 }, { "epoch": 0.022419559451043708, "grad_norm": 1.5518736555259462, "learning_rate": 7.555970149253732e-07, "loss": 1.0056, "step": 243 }, { "epoch": 0.022511821012570637, "grad_norm": 2.8331292567857047, "learning_rate": 7.587064676616916e-07, "loss": 1.0184, "step": 244 }, { "epoch": 0.022604082574097566, "grad_norm": 2.549284096825949, "learning_rate": 7.6181592039801e-07, "loss": 0.9846, "step": 245 }, { "epoch": 0.022604082574097566, "eval_GEN Loss": 0.5028582215309143, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5410569310188293, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.126201868057251, "eval_runtime": 55.9978, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 245 }, { "epoch": 0.022696344135624495, "grad_norm": 2.7637017707401457, "learning_rate": 7.649253731343284e-07, "loss": 1.1036, "step": 246 }, { "epoch": 0.022788605697151423, "grad_norm": 1.7165914392239319, "learning_rate": 7.680348258706469e-07, "loss": 1.0846, "step": 247 }, { "epoch": 0.022880867258678352, "grad_norm": 1.7964868558424398, "learning_rate": 7.711442786069652e-07, "loss": 1.1794, "step": 248 }, { "epoch": 0.02297312882020528, "grad_norm": 1.5067101117393125, "learning_rate": 7.742537313432836e-07, "loss": 1.1901, "step": 249 }, { "epoch": 0.02306539038173221, "grad_norm": 1.885967326150524, "learning_rate": 7.77363184079602e-07, "loss": 1.1061, "step": 250 }, { "epoch": 0.02306539038173221, "eval_GEN Loss": 0.49827855825424194, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5379000902175903, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.120192289352417, "eval_runtime": 56.2878, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 250 }, { "epoch": 0.02315765194325914, "grad_norm": 1.7081726615257915, "learning_rate": 7.804726368159204e-07, "loss": 0.9803, "step": 251 }, { "epoch": 0.023249913504786068, "grad_norm": 1.962242829716037, "learning_rate": 7.835820895522389e-07, "loss": 1.1248, "step": 252 }, { "epoch": 0.023342175066312996, "grad_norm": 1.3568711442449137, "learning_rate": 7.866915422885573e-07, "loss": 1.1357, "step": 253 }, { "epoch": 0.023434436627839925, "grad_norm": 1.847285767372738, "learning_rate": 7.898009950248757e-07, "loss": 1.1333, "step": 254 }, { "epoch": 0.023526698189366854, "grad_norm": 2.2990666027216897, "learning_rate": 7.929104477611942e-07, "loss": 0.8898, "step": 255 }, { "epoch": 0.023526698189366854, "eval_GEN Loss": 0.49851059913635254, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5344753861427307, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1207932233810425, "eval_runtime": 55.867, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 255 }, { "epoch": 0.023618959750893783, "grad_norm": 1.9308137024234377, "learning_rate": 7.960199004975125e-07, "loss": 1.1893, "step": 256 }, { "epoch": 0.023711221312420712, "grad_norm": 2.4493692503226265, "learning_rate": 7.991293532338309e-07, "loss": 1.1574, "step": 257 }, { "epoch": 0.02380348287394764, "grad_norm": 1.553760673770195, "learning_rate": 8.022388059701493e-07, "loss": 1.0206, "step": 258 }, { "epoch": 0.02389574443547457, "grad_norm": 2.010889516326646, "learning_rate": 8.053482587064677e-07, "loss": 1.1219, "step": 259 }, { "epoch": 0.0239880059970015, "grad_norm": 2.2948511162812566, "learning_rate": 8.084577114427862e-07, "loss": 1.0648, "step": 260 }, { "epoch": 0.0239880059970015, "eval_GEN Loss": 0.499536395072937, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5314286947250366, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.123798131942749, "eval_runtime": 56.2249, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 260 }, { "epoch": 0.024080267558528427, "grad_norm": 1.3984976010614756, "learning_rate": 8.115671641791046e-07, "loss": 1.0773, "step": 261 }, { "epoch": 0.024172529120055356, "grad_norm": 2.7309847518077404, "learning_rate": 8.14676616915423e-07, "loss": 1.1736, "step": 262 }, { "epoch": 0.024264790681582285, "grad_norm": 1.3141521911071716, "learning_rate": 8.177860696517413e-07, "loss": 0.9211, "step": 263 }, { "epoch": 0.024357052243109214, "grad_norm": 2.1621667375131914, "learning_rate": 8.208955223880598e-07, "loss": 1.1967, "step": 264 }, { "epoch": 0.024449313804636143, "grad_norm": 1.65439325524114, "learning_rate": 8.240049751243782e-07, "loss": 0.9722, "step": 265 }, { "epoch": 0.024449313804636143, "eval_GEN Loss": 0.49999383091926575, "eval_GEN top-5 accuracy": 0.9763261727312582, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5308574438095093, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1251201629638672, "eval_runtime": 55.8955, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 265 }, { "epoch": 0.02454157536616307, "grad_norm": 2.623145414454357, "learning_rate": 8.271144278606966e-07, "loss": 1.1088, "step": 266 }, { "epoch": 0.02463383692769, "grad_norm": 2.288403387365106, "learning_rate": 8.30223880597015e-07, "loss": 1.0018, "step": 267 }, { "epoch": 0.02472609848921693, "grad_norm": 1.4482698240184462, "learning_rate": 8.333333333333333e-07, "loss": 1.0952, "step": 268 }, { "epoch": 0.024818360050743858, "grad_norm": 1.1600946139990198, "learning_rate": 8.364427860696518e-07, "loss": 0.9762, "step": 269 }, { "epoch": 0.024910621612270787, "grad_norm": 1.4967658760734532, "learning_rate": 8.395522388059703e-07, "loss": 1.2571, "step": 270 }, { "epoch": 0.024910621612270787, "eval_GEN Loss": 0.5007842779159546, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5283689498901367, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.125, "eval_runtime": 55.9944, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 270 }, { "epoch": 0.025002883173797716, "grad_norm": 2.328523158673554, "learning_rate": 8.426616915422886e-07, "loss": 1.0343, "step": 271 }, { "epoch": 0.025095144735324645, "grad_norm": 1.4909803648560656, "learning_rate": 8.457711442786071e-07, "loss": 1.104, "step": 272 }, { "epoch": 0.025187406296851574, "grad_norm": 1.8657451248588977, "learning_rate": 8.488805970149254e-07, "loss": 0.9584, "step": 273 }, { "epoch": 0.025279667858378502, "grad_norm": 1.0806269013565903, "learning_rate": 8.519900497512439e-07, "loss": 0.9994, "step": 274 }, { "epoch": 0.02537192941990543, "grad_norm": 1.8828202710100699, "learning_rate": 8.550995024875623e-07, "loss": 1.0252, "step": 275 }, { "epoch": 0.02537192941990543, "eval_GEN Loss": 0.4993970990180969, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5242939591407776, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1192307472229004, "eval_runtime": 55.9406, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 275 }, { "epoch": 0.02546419098143236, "grad_norm": 1.9910428682832662, "learning_rate": 8.582089552238806e-07, "loss": 0.9602, "step": 276 }, { "epoch": 0.02555645254295929, "grad_norm": 2.205952921717709, "learning_rate": 8.613184079601991e-07, "loss": 1.1484, "step": 277 }, { "epoch": 0.025648714104486218, "grad_norm": 1.6616398335829814, "learning_rate": 8.644278606965174e-07, "loss": 1.0244, "step": 278 }, { "epoch": 0.025740975666013147, "grad_norm": 1.6161884507818356, "learning_rate": 8.675373134328359e-07, "loss": 0.8702, "step": 279 }, { "epoch": 0.025833237227540076, "grad_norm": 1.1562188681419945, "learning_rate": 8.706467661691544e-07, "loss": 1.0532, "step": 280 }, { "epoch": 0.025833237227540076, "eval_GEN Loss": 0.49678125977516174, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5206115245819092, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.115625023841858, "eval_runtime": 55.937, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 280 }, { "epoch": 0.025925498789067004, "grad_norm": 1.9707863917005386, "learning_rate": 8.737562189054727e-07, "loss": 1.0873, "step": 281 }, { "epoch": 0.026017760350593933, "grad_norm": 4.278966152269661, "learning_rate": 8.768656716417912e-07, "loss": 1.277, "step": 282 }, { "epoch": 0.026110021912120862, "grad_norm": 1.2908293416193641, "learning_rate": 8.799751243781095e-07, "loss": 0.9749, "step": 283 }, { "epoch": 0.02620228347364779, "grad_norm": 1.2684817107225679, "learning_rate": 8.830845771144279e-07, "loss": 1.0421, "step": 284 }, { "epoch": 0.02629454503517472, "grad_norm": 1.5940989867178927, "learning_rate": 8.861940298507464e-07, "loss": 1.1096, "step": 285 }, { "epoch": 0.02629454503517472, "eval_GEN Loss": 0.4946899712085724, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5191790461540222, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1149038076400757, "eval_runtime": 56.0251, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 285 }, { "epoch": 0.02638680659670165, "grad_norm": 2.055428248373644, "learning_rate": 8.893034825870647e-07, "loss": 0.9623, "step": 286 }, { "epoch": 0.026479068158228578, "grad_norm": 1.9264725448015343, "learning_rate": 8.924129353233831e-07, "loss": 0.9619, "step": 287 }, { "epoch": 0.026571329719755506, "grad_norm": 2.4195160243952674, "learning_rate": 8.955223880597015e-07, "loss": 1.2104, "step": 288 }, { "epoch": 0.026663591281282435, "grad_norm": 1.9500252731013148, "learning_rate": 8.9863184079602e-07, "loss": 1.1173, "step": 289 }, { "epoch": 0.026755852842809364, "grad_norm": 1.1811091155512554, "learning_rate": 9.017412935323385e-07, "loss": 0.985, "step": 290 }, { "epoch": 0.026755852842809364, "eval_GEN Loss": 0.4933905303478241, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5175021290779114, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1144230365753174, "eval_runtime": 57.0475, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 290 }, { "epoch": 0.026848114404336293, "grad_norm": 1.2546086202256017, "learning_rate": 9.048507462686568e-07, "loss": 1.0852, "step": 291 }, { "epoch": 0.026940375965863222, "grad_norm": 3.1134612905257883, "learning_rate": 9.079601990049752e-07, "loss": 1.1482, "step": 292 }, { "epoch": 0.02703263752739015, "grad_norm": 1.400022154726557, "learning_rate": 9.110696517412936e-07, "loss": 1.0331, "step": 293 }, { "epoch": 0.02712489908891708, "grad_norm": 1.0246627685545686, "learning_rate": 9.14179104477612e-07, "loss": 1.0233, "step": 294 }, { "epoch": 0.02721716065044401, "grad_norm": 2.7396386216256223, "learning_rate": 9.172885572139304e-07, "loss": 1.1775, "step": 295 }, { "epoch": 0.02721716065044401, "eval_GEN Loss": 0.49512484669685364, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5191892385482788, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.118749976158142, "eval_runtime": 56.9037, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 295 }, { "epoch": 0.027309422211970937, "grad_norm": 1.5007117831839922, "learning_rate": 9.203980099502488e-07, "loss": 0.976, "step": 296 }, { "epoch": 0.027401683773497866, "grad_norm": 1.5792917701848133, "learning_rate": 9.235074626865673e-07, "loss": 1.2102, "step": 297 }, { "epoch": 0.027493945335024795, "grad_norm": 3.098253837116703, "learning_rate": 9.266169154228855e-07, "loss": 1.2062, "step": 298 }, { "epoch": 0.027586206896551724, "grad_norm": 2.44234681946125, "learning_rate": 9.297263681592041e-07, "loss": 1.1697, "step": 299 }, { "epoch": 0.027678468458078653, "grad_norm": 1.3977209211043808, "learning_rate": 9.328358208955225e-07, "loss": 1.0619, "step": 300 }, { "epoch": 0.027678468458078653, "eval_GEN Loss": 0.4945972263813019, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5235617756843567, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1182692050933838, "eval_runtime": 56.9471, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 300 }, { "epoch": 0.02777073001960558, "grad_norm": 1.7627879947578182, "learning_rate": 9.359452736318409e-07, "loss": 0.9506, "step": 301 }, { "epoch": 0.02786299158113251, "grad_norm": 2.5988992466232568, "learning_rate": 9.390547263681593e-07, "loss": 0.8767, "step": 302 }, { "epoch": 0.02795525314265944, "grad_norm": 4.085254431764655, "learning_rate": 9.421641791044776e-07, "loss": 1.1512, "step": 303 }, { "epoch": 0.028047514704186368, "grad_norm": 2.6136174838400663, "learning_rate": 9.452736318407961e-07, "loss": 1.103, "step": 304 }, { "epoch": 0.028139776265713297, "grad_norm": 2.108395179560001, "learning_rate": 9.483830845771146e-07, "loss": 1.1541, "step": 305 }, { "epoch": 0.028139776265713297, "eval_GEN Loss": 0.4926488697528839, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5267210006713867, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.113942265510559, "eval_runtime": 56.8595, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 305 }, { "epoch": 0.028232037827240226, "grad_norm": 2.495153869564682, "learning_rate": 9.514925373134328e-07, "loss": 0.9752, "step": 306 }, { "epoch": 0.028324299388767155, "grad_norm": 2.387247198562086, "learning_rate": 9.546019900497513e-07, "loss": 0.8936, "step": 307 }, { "epoch": 0.028416560950294083, "grad_norm": 1.460754878627914, "learning_rate": 9.577114427860696e-07, "loss": 0.9544, "step": 308 }, { "epoch": 0.028508822511821012, "grad_norm": 2.0395098214067002, "learning_rate": 9.608208955223882e-07, "loss": 0.9313, "step": 309 }, { "epoch": 0.02860108407334794, "grad_norm": 1.437449786362347, "learning_rate": 9.639303482587067e-07, "loss": 1.0574, "step": 310 }, { "epoch": 0.02860108407334794, "eval_GEN Loss": 0.49192938208580017, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.527777373790741, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1115384101867676, "eval_runtime": 56.9538, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 310 }, { "epoch": 0.02869334563487487, "grad_norm": 1.5733885494961437, "learning_rate": 9.670398009950248e-07, "loss": 0.9618, "step": 311 }, { "epoch": 0.0287856071964018, "grad_norm": 2.604042706490351, "learning_rate": 9.701492537313434e-07, "loss": 0.9865, "step": 312 }, { "epoch": 0.028877868757928728, "grad_norm": 2.1168350541971095, "learning_rate": 9.732587064676617e-07, "loss": 1.0898, "step": 313 }, { "epoch": 0.028970130319455657, "grad_norm": 1.3268050898742347, "learning_rate": 9.763681592039802e-07, "loss": 1.1057, "step": 314 }, { "epoch": 0.029062391880982585, "grad_norm": 1.9214658491996879, "learning_rate": 9.794776119402986e-07, "loss": 1.1069, "step": 315 }, { "epoch": 0.029062391880982585, "eval_GEN Loss": 0.4930776357650757, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5243564248085022, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1070913076400757, "eval_runtime": 56.8272, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 315 }, { "epoch": 0.029154653442509514, "grad_norm": 1.391531246930202, "learning_rate": 9.82587064676617e-07, "loss": 1.0834, "step": 316 }, { "epoch": 0.029246915004036443, "grad_norm": 1.7684232974539065, "learning_rate": 9.856965174129355e-07, "loss": 0.9377, "step": 317 }, { "epoch": 0.029339176565563372, "grad_norm": 1.394772844206612, "learning_rate": 9.888059701492538e-07, "loss": 1.0288, "step": 318 }, { "epoch": 0.0294314381270903, "grad_norm": 1.954988795164839, "learning_rate": 9.919154228855721e-07, "loss": 1.0052, "step": 319 }, { "epoch": 0.02952369968861723, "grad_norm": 2.2258500441193436, "learning_rate": 9.950248756218907e-07, "loss": 0.9812, "step": 320 }, { "epoch": 0.02952369968861723, "eval_GEN Loss": 0.49087533354759216, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5189715623855591, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.1018028259277344, "eval_runtime": 57.0008, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 320 }, { "epoch": 0.02961596125014416, "grad_norm": 2.3727144188815235, "learning_rate": 9.98134328358209e-07, "loss": 1.1373, "step": 321 }, { "epoch": 0.029708222811671087, "grad_norm": 1.8414136026249512, "learning_rate": 1.0012437810945275e-06, "loss": 1.0329, "step": 322 }, { "epoch": 0.029800484373198016, "grad_norm": 2.183721854667889, "learning_rate": 1.0043532338308459e-06, "loss": 1.1187, "step": 323 }, { "epoch": 0.029892745934724945, "grad_norm": 2.709076311722809, "learning_rate": 1.0074626865671642e-06, "loss": 1.0809, "step": 324 }, { "epoch": 0.029985007496251874, "grad_norm": 2.0096601825645157, "learning_rate": 1.0105721393034828e-06, "loss": 1.0652, "step": 325 }, { "epoch": 0.029985007496251874, "eval_GEN Loss": 0.4871484637260437, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.521902322769165, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.095312476158142, "eval_runtime": 56.9629, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 325 }, { "epoch": 0.030077269057778803, "grad_norm": 1.4424187514027385, "learning_rate": 1.013681592039801e-06, "loss": 0.978, "step": 326 }, { "epoch": 0.03016953061930573, "grad_norm": 2.009952390028351, "learning_rate": 1.0167910447761194e-06, "loss": 1.045, "step": 327 }, { "epoch": 0.03026179218083266, "grad_norm": 1.6533431602033455, "learning_rate": 1.0199004975124378e-06, "loss": 1.1309, "step": 328 }, { "epoch": 0.03035405374235959, "grad_norm": 1.1151714587863297, "learning_rate": 1.0230099502487563e-06, "loss": 1.0358, "step": 329 }, { "epoch": 0.030446315303886518, "grad_norm": 3.18926319432028, "learning_rate": 1.0261194029850748e-06, "loss": 1.2152, "step": 330 }, { "epoch": 0.030446315303886518, "eval_GEN Loss": 0.4860176146030426, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5272826552391052, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.092548131942749, "eval_runtime": 56.2808, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 330 }, { "epoch": 0.030538576865413447, "grad_norm": 2.5222962270206155, "learning_rate": 1.0292288557213932e-06, "loss": 0.913, "step": 331 }, { "epoch": 0.030630838426940376, "grad_norm": 2.71533521054579, "learning_rate": 1.0323383084577115e-06, "loss": 0.9796, "step": 332 }, { "epoch": 0.030723099988467305, "grad_norm": 1.4512743704884454, "learning_rate": 1.0354477611940298e-06, "loss": 1.0495, "step": 333 }, { "epoch": 0.030815361549994234, "grad_norm": 1.649164586450439, "learning_rate": 1.0385572139303484e-06, "loss": 1.1252, "step": 334 }, { "epoch": 0.030907623111521162, "grad_norm": 1.4892318199359345, "learning_rate": 1.0416666666666667e-06, "loss": 1.0085, "step": 335 }, { "epoch": 0.030907623111521162, "eval_GEN Loss": 0.4881289303302765, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5235222578048706, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.0868990421295166, "eval_runtime": 55.9602, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 335 }, { "epoch": 0.03099988467304809, "grad_norm": 1.532233030413437, "learning_rate": 1.044776119402985e-06, "loss": 1.1126, "step": 336 }, { "epoch": 0.03109214623457502, "grad_norm": 1.9975806321345762, "learning_rate": 1.0478855721393036e-06, "loss": 1.1373, "step": 337 }, { "epoch": 0.03118440779610195, "grad_norm": 1.922418107580109, "learning_rate": 1.050995024875622e-06, "loss": 1.1442, "step": 338 }, { "epoch": 0.03127666935762888, "grad_norm": 2.5195638644586813, "learning_rate": 1.0541044776119405e-06, "loss": 0.8737, "step": 339 }, { "epoch": 0.0313689309191558, "grad_norm": 1.935740382197344, "learning_rate": 1.0572139303482588e-06, "loss": 0.9634, "step": 340 }, { "epoch": 0.0313689309191558, "eval_GEN Loss": 0.4911785125732422, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.523034930229187, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.090504765510559, "eval_runtime": 55.9064, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 340 }, { "epoch": 0.031461192480682736, "grad_norm": 1.9486286152465724, "learning_rate": 1.0603233830845771e-06, "loss": 0.9855, "step": 341 }, { "epoch": 0.03155345404220966, "grad_norm": 1.8546603370864803, "learning_rate": 1.0634328358208957e-06, "loss": 0.9511, "step": 342 }, { "epoch": 0.03164571560373659, "grad_norm": 1.7799476055488155, "learning_rate": 1.066542288557214e-06, "loss": 1.2302, "step": 343 }, { "epoch": 0.03173797716526352, "grad_norm": 1.680439411630123, "learning_rate": 1.0696517412935323e-06, "loss": 1.0727, "step": 344 }, { "epoch": 0.03183023872679045, "grad_norm": 1.6792308304460757, "learning_rate": 1.0727611940298509e-06, "loss": 0.9026, "step": 345 }, { "epoch": 0.03183023872679045, "eval_GEN Loss": 0.49160081148147583, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.518447756767273, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.0872596502304077, "eval_runtime": 56.2021, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 345 }, { "epoch": 0.031922500288317376, "grad_norm": 2.1885529669090316, "learning_rate": 1.0758706467661692e-06, "loss": 0.995, "step": 346 }, { "epoch": 0.03201476184984431, "grad_norm": 2.742387418896271, "learning_rate": 1.0789800995024878e-06, "loss": 0.7945, "step": 347 }, { "epoch": 0.032107023411371234, "grad_norm": 1.4403393167685103, "learning_rate": 1.0820895522388059e-06, "loss": 1.0051, "step": 348 }, { "epoch": 0.032199284972898166, "grad_norm": 1.371955107543284, "learning_rate": 1.0851990049751244e-06, "loss": 1.1058, "step": 349 }, { "epoch": 0.03229154653442509, "grad_norm": 2.8464898439478494, "learning_rate": 1.088308457711443e-06, "loss": 0.8464, "step": 350 }, { "epoch": 0.03229154653442509, "eval_GEN Loss": 0.493305504322052, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.511089026927948, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.0890624523162842, "eval_runtime": 55.8793, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 350 }, { "epoch": 0.032383808095952024, "grad_norm": 1.5514112449284048, "learning_rate": 1.0914179104477613e-06, "loss": 1.0468, "step": 351 }, { "epoch": 0.03247606965747895, "grad_norm": 1.6275512940031138, "learning_rate": 1.0945273631840796e-06, "loss": 1.0689, "step": 352 }, { "epoch": 0.03256833121900588, "grad_norm": 1.8446916567920402, "learning_rate": 1.0976368159203982e-06, "loss": 1.0027, "step": 353 }, { "epoch": 0.03266059278053281, "grad_norm": 2.2633912193599217, "learning_rate": 1.1007462686567165e-06, "loss": 1.1833, "step": 354 }, { "epoch": 0.03275285434205974, "grad_norm": 1.8695264550249542, "learning_rate": 1.1038557213930349e-06, "loss": 1.0588, "step": 355 }, { "epoch": 0.03275285434205974, "eval_GEN Loss": 0.4953005909919739, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8783068783068783, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 Neg": 0.0, "eval_PRM Loss": 0.5123229026794434, "eval_PRM NPV": 0.0, "eval_PRM Precision": 0.7830188679245284, "eval_PRM Recall": 1.0, "eval_PRM Specificty": 0.0, "eval_loss": 1.087499976158142, "eval_runtime": 56.1679, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 355 }, { "epoch": 0.032845115903586665, "grad_norm": 1.8335053955860532, "learning_rate": 1.1069651741293532e-06, "loss": 1.037, "step": 356 }, { "epoch": 0.0329373774651136, "grad_norm": 1.6486659896008766, "learning_rate": 1.1100746268656717e-06, "loss": 1.1072, "step": 357 }, { "epoch": 0.03302963902664052, "grad_norm": 1.572195389553314, "learning_rate": 1.1131840796019903e-06, "loss": 0.9697, "step": 358 }, { "epoch": 0.033121900588167455, "grad_norm": 2.7687689049610777, "learning_rate": 1.1162935323383086e-06, "loss": 0.916, "step": 359 }, { "epoch": 0.03321416214969438, "grad_norm": 1.7728085056791567, "learning_rate": 1.119402985074627e-06, "loss": 1.0788, "step": 360 }, { "epoch": 0.03321416214969438, "eval_GEN Loss": 0.4948984682559967, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8839779005524862, "eval_PRM F1 AUC": 0.5906233630172866, "eval_PRM F1 Neg": 0.3225806451612903, "eval_PRM Loss": 0.5221074223518372, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8163265306122449, "eval_PRM Recall": 0.963855421686747, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.0902644395828247, "eval_runtime": 56.9761, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 360 }, { "epoch": 0.03330642371122131, "grad_norm": 1.5701375146458443, "learning_rate": 1.1225124378109453e-06, "loss": 1.0978, "step": 361 }, { "epoch": 0.03339868527274824, "grad_norm": 2.1204690039490304, "learning_rate": 1.1256218905472638e-06, "loss": 1.0687, "step": 362 }, { "epoch": 0.03349094683427517, "grad_norm": 1.601233790604872, "learning_rate": 1.1287313432835822e-06, "loss": 0.9983, "step": 363 }, { "epoch": 0.033583208395802096, "grad_norm": 1.8898677542781388, "learning_rate": 1.1318407960199005e-06, "loss": 0.9063, "step": 364 }, { "epoch": 0.03367546995732903, "grad_norm": 2.2649661149457727, "learning_rate": 1.134950248756219e-06, "loss": 0.9561, "step": 365 }, { "epoch": 0.03367546995732903, "eval_GEN Loss": 0.4931755065917969, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8839779005524862, "eval_PRM F1 AUC": 0.5906233630172866, "eval_PRM F1 Neg": 0.3225806451612903, "eval_PRM Loss": 0.5178951025009155, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8163265306122449, "eval_PRM Recall": 0.963855421686747, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.088641881942749, "eval_runtime": 56.9362, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 365 }, { "epoch": 0.033767731518855953, "grad_norm": 2.5696075162247354, "learning_rate": 1.1380597014925374e-06, "loss": 0.8822, "step": 366 }, { "epoch": 0.033859993080382886, "grad_norm": 1.4433836855901425, "learning_rate": 1.141169154228856e-06, "loss": 1.0123, "step": 367 }, { "epoch": 0.03395225464190981, "grad_norm": 1.4558018932634749, "learning_rate": 1.1442786069651742e-06, "loss": 1.0535, "step": 368 }, { "epoch": 0.034044516203436744, "grad_norm": 3.175675569714823, "learning_rate": 1.1473880597014926e-06, "loss": 1.2205, "step": 369 }, { "epoch": 0.03413677776496367, "grad_norm": 1.7693144783390349, "learning_rate": 1.1504975124378111e-06, "loss": 0.9804, "step": 370 }, { "epoch": 0.03413677776496367, "eval_GEN Loss": 0.4947631359100342, "eval_GEN top-5 accuracy": 0.9754493643138974, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8839779005524862, "eval_PRM F1 AUC": 0.5906233630172866, "eval_PRM F1 Neg": 0.3225806451612903, "eval_PRM Loss": 0.5144875645637512, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8163265306122449, "eval_PRM Recall": 0.963855421686747, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.0914663076400757, "eval_runtime": 56.9019, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 370 }, { "epoch": 0.0342290393264906, "grad_norm": 1.7432989957940266, "learning_rate": 1.1536069651741295e-06, "loss": 0.9745, "step": 371 }, { "epoch": 0.03432130088801753, "grad_norm": 1.62302846536514, "learning_rate": 1.1567164179104478e-06, "loss": 0.9044, "step": 372 }, { "epoch": 0.03441356244954446, "grad_norm": 2.1506916661651183, "learning_rate": 1.1598258706467663e-06, "loss": 1.1325, "step": 373 }, { "epoch": 0.034505824011071384, "grad_norm": 1.7935705697116229, "learning_rate": 1.1629353233830847e-06, "loss": 0.9483, "step": 374 }, { "epoch": 0.03459808557259832, "grad_norm": 1.763019620661752, "learning_rate": 1.1660447761194032e-06, "loss": 0.9373, "step": 375 }, { "epoch": 0.03459808557259832, "eval_GEN Loss": 0.4980253577232361, "eval_GEN top-5 accuracy": 0.9754493643138974, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8901098901098901, "eval_PRM F1 AUC": 0.5966474594028287, "eval_PRM F1 Neg": 0.3333333333333333, "eval_PRM Loss": 0.513366162776947, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.8181818181818182, "eval_PRM Recall": 0.9759036144578314, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.0947115421295166, "eval_runtime": 56.9597, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 375 }, { "epoch": 0.03469034713412524, "grad_norm": 1.768254678969684, "learning_rate": 1.1691542288557215e-06, "loss": 1.0563, "step": 376 }, { "epoch": 0.034782608695652174, "grad_norm": 1.8553706418639913, "learning_rate": 1.1722636815920399e-06, "loss": 1.2008, "step": 377 }, { "epoch": 0.0348748702571791, "grad_norm": 1.4481012889071891, "learning_rate": 1.1753731343283584e-06, "loss": 1.0245, "step": 378 }, { "epoch": 0.03496713181870603, "grad_norm": 1.7256487619893692, "learning_rate": 1.1784825870646768e-06, "loss": 1.002, "step": 379 }, { "epoch": 0.03505939338023296, "grad_norm": 2.5508092701959217, "learning_rate": 1.181592039800995e-06, "loss": 0.9065, "step": 380 }, { "epoch": 0.03505939338023296, "eval_GEN Loss": 0.495575875043869, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8839779005524862, "eval_PRM F1 AUC": 0.5906233630172866, "eval_PRM F1 Neg": 0.3225806451612903, "eval_PRM Loss": 0.5119543075561523, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8163265306122449, "eval_PRM Recall": 0.963855421686747, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.0922476053237915, "eval_runtime": 57.038, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 380 }, { "epoch": 0.03515165494175989, "grad_norm": 1.4722059115710762, "learning_rate": 1.1847014925373134e-06, "loss": 0.9706, "step": 381 }, { "epoch": 0.035243916503286815, "grad_norm": 1.536297412134017, "learning_rate": 1.187810945273632e-06, "loss": 0.9951, "step": 382 }, { "epoch": 0.03533617806481375, "grad_norm": 1.5079787215711309, "learning_rate": 1.1909203980099505e-06, "loss": 1.0306, "step": 383 }, { "epoch": 0.03542843962634067, "grad_norm": 1.5422442471822861, "learning_rate": 1.1940298507462686e-06, "loss": 1.0272, "step": 384 }, { "epoch": 0.035520701187867605, "grad_norm": 1.657448677437209, "learning_rate": 1.1971393034825872e-06, "loss": 0.838, "step": 385 }, { "epoch": 0.035520701187867605, "eval_GEN Loss": 0.49375835061073303, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8839779005524862, "eval_PRM F1 AUC": 0.5906233630172866, "eval_PRM F1 Neg": 0.3225806451612903, "eval_PRM Loss": 0.500721275806427, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8163265306122449, "eval_PRM Recall": 0.963855421686747, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.0851562023162842, "eval_runtime": 56.0198, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 385 }, { "epoch": 0.03561296274939453, "grad_norm": 2.249630661061084, "learning_rate": 1.2002487562189055e-06, "loss": 1.1123, "step": 386 }, { "epoch": 0.03570522431092146, "grad_norm": 1.5608366240192577, "learning_rate": 1.203358208955224e-06, "loss": 0.9374, "step": 387 }, { "epoch": 0.03579748587244839, "grad_norm": 2.726231550430038, "learning_rate": 1.2064676616915424e-06, "loss": 1.1078, "step": 388 }, { "epoch": 0.03588974743397532, "grad_norm": 1.358167054618328, "learning_rate": 1.2095771144278607e-06, "loss": 1.0385, "step": 389 }, { "epoch": 0.035982008995502246, "grad_norm": 1.4329854592023732, "learning_rate": 1.2126865671641793e-06, "loss": 0.9826, "step": 390 }, { "epoch": 0.035982008995502246, "eval_GEN Loss": 0.4905219078063965, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8839779005524862, "eval_PRM F1 AUC": 0.5906233630172866, "eval_PRM F1 Neg": 0.3225806451612903, "eval_PRM Loss": 0.4987432360649109, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8163265306122449, "eval_PRM Recall": 0.963855421686747, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 1.0786057710647583, "eval_runtime": 55.9471, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 390 }, { "epoch": 0.03607427055702918, "grad_norm": 1.8050566080096448, "learning_rate": 1.2157960199004976e-06, "loss": 0.8972, "step": 391 }, { "epoch": 0.036166532118556104, "grad_norm": 2.425921846861029, "learning_rate": 1.218905472636816e-06, "loss": 1.075, "step": 392 }, { "epoch": 0.036258793680083036, "grad_norm": 2.7081453428234146, "learning_rate": 1.2220149253731345e-06, "loss": 0.7915, "step": 393 }, { "epoch": 0.03635105524160996, "grad_norm": 1.4076303908682901, "learning_rate": 1.2251243781094528e-06, "loss": 0.9477, "step": 394 }, { "epoch": 0.036443316803136894, "grad_norm": 1.5556668203320005, "learning_rate": 1.2282338308457713e-06, "loss": 0.9539, "step": 395 }, { "epoch": 0.036443316803136894, "eval_GEN Loss": 0.4896683394908905, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8926553672316384, "eval_PRM F1 AUC": 0.6498166579360922, "eval_PRM F1 Neg": 0.45714285714285713, "eval_PRM Loss": 0.5040706396102905, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.8404255319148937, "eval_PRM Recall": 0.9518072289156626, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 1.0819711685180664, "eval_runtime": 56.9164, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 395 }, { "epoch": 0.03653557836466382, "grad_norm": 2.2235428048145374, "learning_rate": 1.2313432835820897e-06, "loss": 1.1407, "step": 396 }, { "epoch": 0.03662783992619075, "grad_norm": 1.77863726581506, "learning_rate": 1.234452736318408e-06, "loss": 1.0715, "step": 397 }, { "epoch": 0.03672010148771768, "grad_norm": 1.4604250196141944, "learning_rate": 1.2375621890547266e-06, "loss": 0.9055, "step": 398 }, { "epoch": 0.03681236304924461, "grad_norm": 2.200986884891539, "learning_rate": 1.2406716417910449e-06, "loss": 1.2049, "step": 399 }, { "epoch": 0.036904624610771534, "grad_norm": 1.1855948742026567, "learning_rate": 1.2437810945273632e-06, "loss": 0.9039, "step": 400 }, { "epoch": 0.036904624610771534, "eval_GEN Loss": 0.4911164343357086, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8914285714285715, "eval_PRM F1 AUC": 0.6655316919853327, "eval_PRM F1 Neg": 0.4864864864864865, "eval_PRM Loss": 0.5084080100059509, "eval_PRM NPV": 0.6428571428571429, "eval_PRM Precision": 0.8478260869565217, "eval_PRM Recall": 0.9397590361445783, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 1.0823317766189575, "eval_runtime": 56.9601, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 400 }, { "epoch": 0.03699688617229847, "grad_norm": 3.4674853596817603, "learning_rate": 1.2468905472636816e-06, "loss": 1.1359, "step": 401 }, { "epoch": 0.03708914773382539, "grad_norm": 2.0138986976213227, "learning_rate": 1.25e-06, "loss": 1.0893, "step": 402 }, { "epoch": 0.037181409295352325, "grad_norm": 1.7482583349421175, "learning_rate": 1.2499999716807582e-06, "loss": 0.9825, "step": 403 }, { "epoch": 0.03727367085687925, "grad_norm": 2.0783198737242836, "learning_rate": 1.249999886723035e-06, "loss": 0.9184, "step": 404 }, { "epoch": 0.03736593241840618, "grad_norm": 1.3697661624020034, "learning_rate": 1.2499997451268387e-06, "loss": 0.866, "step": 405 }, { "epoch": 0.03736593241840618, "eval_GEN Loss": 0.49147337675094604, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 Neg": 0.45, "eval_PRM Loss": 0.5320136547088623, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 1.0904446840286255, "eval_runtime": 56.9151, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 405 }, { "epoch": 0.03745819397993311, "grad_norm": 2.125000262304555, "learning_rate": 1.2499995468921814e-06, "loss": 1.1024, "step": 406 }, { "epoch": 0.03755045554146004, "grad_norm": 3.4249056948683068, "learning_rate": 1.2499992920190814e-06, "loss": 0.9481, "step": 407 }, { "epoch": 0.037642717102986965, "grad_norm": 1.7365912485637587, "learning_rate": 1.2499989805075618e-06, "loss": 0.9993, "step": 408 }, { "epoch": 0.0377349786645139, "grad_norm": 1.8287690837900874, "learning_rate": 1.249998612357651e-06, "loss": 0.9735, "step": 409 }, { "epoch": 0.03782724022604082, "grad_norm": 2.443614782953873, "learning_rate": 1.249998187569382e-06, "loss": 0.9865, "step": 410 }, { "epoch": 0.03782724022604082, "eval_GEN Loss": 0.48897504806518555, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8850574712643678, "eval_PRM F1 AUC": 0.6595075955997904, "eval_PRM F1 Neg": 0.47368421052631576, "eval_PRM Loss": 0.5099429488182068, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.8461538461538461, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 1.0731971263885498, "eval_runtime": 55.9536, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 410 }, { "epoch": 0.037919501787567755, "grad_norm": 3.4338451669618215, "learning_rate": 1.2499977061427935e-06, "loss": 1.1171, "step": 411 }, { "epoch": 0.03801176334909468, "grad_norm": 2.0289882614581076, "learning_rate": 1.2499971680779291e-06, "loss": 0.8247, "step": 412 }, { "epoch": 0.03810402491062161, "grad_norm": 2.298527207458775, "learning_rate": 1.2499965733748375e-06, "loss": 1.0174, "step": 413 }, { "epoch": 0.03819628647214854, "grad_norm": 1.3183253127786805, "learning_rate": 1.2499959220335727e-06, "loss": 0.8969, "step": 414 }, { "epoch": 0.03828854803367547, "grad_norm": 3.9704666165868616, "learning_rate": 1.249995214054194e-06, "loss": 1.1768, "step": 415 }, { "epoch": 0.03828854803367547, "eval_GEN Loss": 0.486381858587265, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8850574712643678, "eval_PRM F1 AUC": 0.6595075955997904, "eval_PRM F1 Neg": 0.47368421052631576, "eval_PRM Loss": 0.49420467019081116, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.8461538461538461, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 1.0578124523162842, "eval_runtime": 56.0141, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 415 }, { "epoch": 0.038380809595202396, "grad_norm": 1.6175496053472633, "learning_rate": 1.2499944494367649e-06, "loss": 0.9617, "step": 416 }, { "epoch": 0.03847307115672933, "grad_norm": 2.8215401472618398, "learning_rate": 1.2499936281813551e-06, "loss": 0.888, "step": 417 }, { "epoch": 0.038565332718256254, "grad_norm": 3.067168938139133, "learning_rate": 1.2499927502880391e-06, "loss": 0.9159, "step": 418 }, { "epoch": 0.038657594279783186, "grad_norm": 1.4636998556443914, "learning_rate": 1.249991815756896e-06, "loss": 0.9951, "step": 419 }, { "epoch": 0.03874985584131011, "grad_norm": 2.244478144941869, "learning_rate": 1.2499908245880114e-06, "loss": 1.071, "step": 420 }, { "epoch": 0.03874985584131011, "eval_GEN Loss": 0.4856526851654053, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8850574712643678, "eval_PRM F1 AUC": 0.6595075955997904, "eval_PRM F1 Neg": 0.47368421052631576, "eval_PRM Loss": 0.48444485664367676, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.8461538461538461, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 1.0461539030075073, "eval_runtime": 56.0607, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 420 }, { "epoch": 0.038842117402837044, "grad_norm": 1.986588212280402, "learning_rate": 1.249989776781474e-06, "loss": 0.9483, "step": 421 }, { "epoch": 0.03893437896436397, "grad_norm": 1.2109181066291579, "learning_rate": 1.2499886723373795e-06, "loss": 0.8441, "step": 422 }, { "epoch": 0.0390266405258909, "grad_norm": 1.7634910222087619, "learning_rate": 1.2499875112558277e-06, "loss": 0.9839, "step": 423 }, { "epoch": 0.03911890208741783, "grad_norm": 1.7202561747692766, "learning_rate": 1.2499862935369238e-06, "loss": 1.0435, "step": 424 }, { "epoch": 0.03921116364894476, "grad_norm": 1.394069525167447, "learning_rate": 1.2499850191807783e-06, "loss": 0.9949, "step": 425 }, { "epoch": 0.03921116364894476, "eval_GEN Loss": 0.48652511835098267, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM Loss": 0.4757426679134369, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 1.0393028259277344, "eval_runtime": 56.0661, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 425 }, { "epoch": 0.039303425210471685, "grad_norm": 1.7432266075385632, "learning_rate": 1.2499836881875066e-06, "loss": 0.9469, "step": 426 }, { "epoch": 0.03939568677199862, "grad_norm": 1.7296291983439422, "learning_rate": 1.2499823005572294e-06, "loss": 0.9209, "step": 427 }, { "epoch": 0.03948794833352554, "grad_norm": 2.2430648621312077, "learning_rate": 1.2499808562900723e-06, "loss": 1.1083, "step": 428 }, { "epoch": 0.039580209895052475, "grad_norm": 2.4839328433585277, "learning_rate": 1.2499793553861664e-06, "loss": 0.8595, "step": 429 }, { "epoch": 0.0396724714565794, "grad_norm": 1.5598120753532012, "learning_rate": 1.2499777978456475e-06, "loss": 0.9752, "step": 430 }, { "epoch": 0.0396724714565794, "eval_GEN Loss": 0.48572012782096863, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.6511262441068623, "eval_PRM F1 Neg": 0.45454545454545453, "eval_PRM Loss": 0.4870435893535614, "eval_PRM NPV": 0.47619047619047616, "eval_PRM Precision": 0.8470588235294118, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 1.043870210647583, "eval_runtime": 56.0713, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 430 }, { "epoch": 0.03976473301810633, "grad_norm": 2.1524630412012176, "learning_rate": 1.2499761836686567e-06, "loss": 1.2483, "step": 431 }, { "epoch": 0.03985699457963326, "grad_norm": 1.684216300151307, "learning_rate": 1.2499745128553406e-06, "loss": 0.9628, "step": 432 }, { "epoch": 0.03994925614116019, "grad_norm": 1.8621080525821148, "learning_rate": 1.2499727854058505e-06, "loss": 1.1252, "step": 433 }, { "epoch": 0.040041517702687116, "grad_norm": 1.5520774876746433, "learning_rate": 1.2499710013203426e-06, "loss": 1.1255, "step": 434 }, { "epoch": 0.04013377926421405, "grad_norm": 2.613192298018756, "learning_rate": 1.249969160598979e-06, "loss": 1.0245, "step": 435 }, { "epoch": 0.04013377926421405, "eval_GEN Loss": 0.48517999053001404, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.84472049689441, "eval_PRM F1 AUC": 0.6922472498690415, "eval_PRM F1 Neg": 0.5098039215686274, "eval_PRM Loss": 0.5124436616897583, "eval_PRM NPV": 0.4642857142857143, "eval_PRM Precision": 0.8717948717948718, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 1.0579928159713745, "eval_runtime": 55.9343, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 435 }, { "epoch": 0.04022604082574097, "grad_norm": 1.5090261556949027, "learning_rate": 1.2499672632419262e-06, "loss": 0.9561, "step": 436 }, { "epoch": 0.040318302387267906, "grad_norm": 1.7390946058193508, "learning_rate": 1.2499653092493567e-06, "loss": 0.9918, "step": 437 }, { "epoch": 0.04041056394879483, "grad_norm": 2.765509328605111, "learning_rate": 1.2499632986214468e-06, "loss": 0.9601, "step": 438 }, { "epoch": 0.04050282551032176, "grad_norm": 1.5586441018546473, "learning_rate": 1.249961231358379e-06, "loss": 0.9044, "step": 439 }, { "epoch": 0.04059508707184869, "grad_norm": 2.2748830104553357, "learning_rate": 1.249959107460341e-06, "loss": 0.9474, "step": 440 }, { "epoch": 0.04059508707184869, "eval_GEN Loss": 0.48855283856391907, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.47612351179122925, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 1.0473557710647583, "eval_runtime": 56.2396, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 440 }, { "epoch": 0.04068734863337562, "grad_norm": 1.8201253581714998, "learning_rate": 1.249956926927525e-06, "loss": 0.8294, "step": 441 }, { "epoch": 0.040779610194902546, "grad_norm": 1.9508496557784138, "learning_rate": 1.2499546897601284e-06, "loss": 0.8903, "step": 442 }, { "epoch": 0.04087187175642948, "grad_norm": 2.3625577338752297, "learning_rate": 1.249952395958354e-06, "loss": 0.7296, "step": 443 }, { "epoch": 0.040964133317956404, "grad_norm": 1.6663025871239967, "learning_rate": 1.24995004552241e-06, "loss": 0.9373, "step": 444 }, { "epoch": 0.041056394879483336, "grad_norm": 1.6603489043388613, "learning_rate": 1.2499476384525092e-06, "loss": 0.9188, "step": 445 }, { "epoch": 0.041056394879483336, "eval_GEN Loss": 0.4943142831325531, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8863636363636364, "eval_PRM F1 AUC": 0.6437925615505501, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM Loss": 0.43712368607521057, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.8387096774193549, "eval_PRM Recall": 0.9397590361445783, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 1.0341947078704834, "eval_runtime": 56.2179, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 445 }, { "epoch": 0.04114865644101026, "grad_norm": 2.9126230204462487, "learning_rate": 1.2499451747488695e-06, "loss": 1.0148, "step": 446 }, { "epoch": 0.041240918002537194, "grad_norm": 1.6767556924452518, "learning_rate": 1.2499426544117146e-06, "loss": 1.0057, "step": 447 }, { "epoch": 0.04133317956406412, "grad_norm": 1.2491079330246846, "learning_rate": 1.2499400774412725e-06, "loss": 0.9206, "step": 448 }, { "epoch": 0.04142544112559105, "grad_norm": 1.6211871447944266, "learning_rate": 1.249937443837777e-06, "loss": 0.8217, "step": 449 }, { "epoch": 0.04151770268711798, "grad_norm": 1.5443566788338265, "learning_rate": 1.2499347536014667e-06, "loss": 0.8358, "step": 450 }, { "epoch": 0.04151770268711798, "eval_GEN Loss": 0.48962274193763733, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM Loss": 0.4641878008842468, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 1.0381009578704834, "eval_runtime": 57.0011, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 450 }, { "epoch": 0.04160996424864491, "grad_norm": 1.4733450427095798, "learning_rate": 1.2499320067325854e-06, "loss": 0.9267, "step": 451 }, { "epoch": 0.041702225810171835, "grad_norm": 2.9303870595244903, "learning_rate": 1.249929203231382e-06, "loss": 0.8684, "step": 452 }, { "epoch": 0.04179448737169877, "grad_norm": 1.785876435180517, "learning_rate": 1.2499263430981106e-06, "loss": 0.9132, "step": 453 }, { "epoch": 0.04188674893322569, "grad_norm": 2.148315533111999, "learning_rate": 1.2499234263330302e-06, "loss": 0.8028, "step": 454 }, { "epoch": 0.041979010494752625, "grad_norm": 2.0582297728234127, "learning_rate": 1.2499204529364053e-06, "loss": 0.7296, "step": 455 }, { "epoch": 0.041979010494752625, "eval_GEN Loss": 0.48988714814186096, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8764044943820225, "eval_PRM F1 AUC": 0.6003143006809848, "eval_PRM F1 Neg": 0.35294117647058826, "eval_PRM Loss": 0.45193052291870117, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8210526315789474, "eval_PRM Recall": 0.9397590361445783, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 1.038401484489441, "eval_runtime": 56.9886, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 455 }, { "epoch": 0.04207127205627955, "grad_norm": 1.9190244382111306, "learning_rate": 1.2499174229085053e-06, "loss": 1.0398, "step": 456 }, { "epoch": 0.04216353361780648, "grad_norm": 1.8902843000632146, "learning_rate": 1.249914336249605e-06, "loss": 0.951, "step": 457 }, { "epoch": 0.04225579517933341, "grad_norm": 1.8539637597556553, "learning_rate": 1.2499111929599836e-06, "loss": 0.921, "step": 458 }, { "epoch": 0.04234805674086034, "grad_norm": 2.476016793580202, "learning_rate": 1.2499079930399266e-06, "loss": 0.8745, "step": 459 }, { "epoch": 0.042440318302387266, "grad_norm": 1.8361355698224726, "learning_rate": 1.2499047364897234e-06, "loss": 0.7503, "step": 460 }, { "epoch": 0.042440318302387266, "eval_GEN Loss": 0.4883134067058563, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8636363636363636, "eval_PRM F1 AUC": 0.5882661079099004, "eval_PRM F1 Neg": 0.3333333333333333, "eval_PRM Loss": 0.46063748002052307, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8172043010752689, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 1.0429086685180664, "eval_runtime": 56.9469, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 460 }, { "epoch": 0.0425325798639142, "grad_norm": 2.4697307017515753, "learning_rate": 1.2499014233096694e-06, "loss": 0.8739, "step": 461 }, { "epoch": 0.04262484142544112, "grad_norm": 2.1777696172759966, "learning_rate": 1.2498980535000649e-06, "loss": 1.0281, "step": 462 }, { "epoch": 0.042717102986968056, "grad_norm": 1.9585664156482705, "learning_rate": 1.249894627061215e-06, "loss": 0.8492, "step": 463 }, { "epoch": 0.04280936454849498, "grad_norm": 1.8737817400264731, "learning_rate": 1.2498911439934306e-06, "loss": 0.934, "step": 464 }, { "epoch": 0.04290162611002191, "grad_norm": 1.6298637608830269, "learning_rate": 1.249887604297027e-06, "loss": 0.8942, "step": 465 }, { "epoch": 0.04290162611002191, "eval_GEN Loss": 0.49040842056274414, "eval_GEN top-5 accuracy": 0.9758877685225779, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8681318681318682, "eval_PRM F1 AUC": 0.5411210057621791, "eval_PRM F1 Neg": 0.2, "eval_PRM Loss": 0.4450353980064392, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.797979797979798, "eval_PRM Recall": 0.9518072289156626, "eval_PRM Specificty": 0.13043478260869565, "eval_loss": 1.0331730842590332, "eval_runtime": 56.9373, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 465 }, { "epoch": 0.04299388767154884, "grad_norm": 3.533649562896908, "learning_rate": 1.2498840079723252e-06, "loss": 0.8994, "step": 466 }, { "epoch": 0.04308614923307577, "grad_norm": 1.8933966875151385, "learning_rate": 1.249880355019651e-06, "loss": 0.9002, "step": 467 }, { "epoch": 0.0431784107946027, "grad_norm": 1.6618181663533436, "learning_rate": 1.2498766454393354e-06, "loss": 0.8512, "step": 468 }, { "epoch": 0.04327067235612963, "grad_norm": 2.2357348374085952, "learning_rate": 1.2498728792317146e-06, "loss": 0.8073, "step": 469 }, { "epoch": 0.043362933917656554, "grad_norm": 1.9890022894412644, "learning_rate": 1.2498690563971302e-06, "loss": 0.6942, "step": 470 }, { "epoch": 0.043362933917656554, "eval_GEN Loss": 0.49270206689834595, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.474351167678833, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 1.0350961685180664, "eval_runtime": 56.9081, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 470 }, { "epoch": 0.04345519547918349, "grad_norm": 1.5430350756935, "learning_rate": 1.2498651769359282e-06, "loss": 0.9192, "step": 471 }, { "epoch": 0.04354745704071041, "grad_norm": 1.903783246574929, "learning_rate": 1.24986124084846e-06, "loss": 0.7874, "step": 472 }, { "epoch": 0.043639718602237344, "grad_norm": 2.5498924226341617, "learning_rate": 1.249857248135083e-06, "loss": 1.0717, "step": 473 }, { "epoch": 0.04373198016376427, "grad_norm": 1.7294727852998102, "learning_rate": 1.2498531987961584e-06, "loss": 0.9471, "step": 474 }, { "epoch": 0.0438242417252912, "grad_norm": 2.1361973305253974, "learning_rate": 1.2498490928320537e-06, "loss": 0.9701, "step": 475 }, { "epoch": 0.0438242417252912, "eval_GEN Loss": 0.4921441972255707, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.437370240688324, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9977163672447205, "eval_runtime": 56.8242, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 475 }, { "epoch": 0.04391650328681813, "grad_norm": 1.5290437108743213, "learning_rate": 1.2498449302431404e-06, "loss": 0.9156, "step": 476 }, { "epoch": 0.04400876484834506, "grad_norm": 3.9898809086088347, "learning_rate": 1.2498407110297961e-06, "loss": 1.045, "step": 477 }, { "epoch": 0.044101026409871985, "grad_norm": 1.713146486887783, "learning_rate": 1.249836435192403e-06, "loss": 1.0169, "step": 478 }, { "epoch": 0.04419328797139892, "grad_norm": 1.7998586465129913, "learning_rate": 1.2498321027313486e-06, "loss": 0.8223, "step": 479 }, { "epoch": 0.04428554953292584, "grad_norm": 2.3953689065770876, "learning_rate": 1.2498277136470255e-06, "loss": 0.7211, "step": 480 }, { "epoch": 0.04428554953292584, "eval_GEN Loss": 0.4898214042186737, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4590703248977661, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9987980723381042, "eval_runtime": 56.7968, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 480 }, { "epoch": 0.044377811094452775, "grad_norm": 2.392990239491769, "learning_rate": 1.2498232679398317e-06, "loss": 0.8219, "step": 481 }, { "epoch": 0.0444700726559797, "grad_norm": 1.6793203035636983, "learning_rate": 1.2498187656101698e-06, "loss": 0.8014, "step": 482 }, { "epoch": 0.04456233421750663, "grad_norm": 2.296906461119564, "learning_rate": 1.2498142066584478e-06, "loss": 0.8739, "step": 483 }, { "epoch": 0.04465459577903356, "grad_norm": 2.466338328508299, "learning_rate": 1.249809591085079e-06, "loss": 0.8223, "step": 484 }, { "epoch": 0.04474685734056049, "grad_norm": 2.2045465950681216, "learning_rate": 1.2498049188904814e-06, "loss": 0.873, "step": 485 }, { "epoch": 0.04474685734056049, "eval_GEN Loss": 0.490390807390213, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4337656497955322, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9806490540504456, "eval_runtime": 56.8854, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 485 }, { "epoch": 0.044839118902087416, "grad_norm": 1.8767930377025188, "learning_rate": 1.2498001900750788e-06, "loss": 0.7161, "step": 486 }, { "epoch": 0.04493138046361435, "grad_norm": 1.5220048281800544, "learning_rate": 1.2497954046392995e-06, "loss": 0.9338, "step": 487 }, { "epoch": 0.045023642025141274, "grad_norm": 2.5084112217548404, "learning_rate": 1.2497905625835773e-06, "loss": 0.9706, "step": 488 }, { "epoch": 0.045115903586668206, "grad_norm": 1.8840675032339782, "learning_rate": 1.2497856639083508e-06, "loss": 0.7622, "step": 489 }, { "epoch": 0.04520816514819513, "grad_norm": 1.6871894439217352, "learning_rate": 1.249780708614064e-06, "loss": 0.8241, "step": 490 }, { "epoch": 0.04520816514819513, "eval_GEN Loss": 0.4915316104888916, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.41830411553382874, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9688100814819336, "eval_runtime": 57.0794, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 490 }, { "epoch": 0.045300426709722064, "grad_norm": 1.7444544329434182, "learning_rate": 1.2497756967011658e-06, "loss": 0.7967, "step": 491 }, { "epoch": 0.04539268827124899, "grad_norm": 2.95337755170944, "learning_rate": 1.2497706281701107e-06, "loss": 1.0388, "step": 492 }, { "epoch": 0.04548494983277592, "grad_norm": 1.9349385229854092, "learning_rate": 1.249765503021358e-06, "loss": 0.8927, "step": 493 }, { "epoch": 0.04557721139430285, "grad_norm": 1.6823368055068961, "learning_rate": 1.2497603212553718e-06, "loss": 0.8645, "step": 494 }, { "epoch": 0.04566947295582978, "grad_norm": 1.1607320411290694, "learning_rate": 1.249755082872622e-06, "loss": 0.8193, "step": 495 }, { "epoch": 0.04566947295582978, "eval_GEN Loss": 0.48993173241615295, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4339875280857086, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9669471383094788, "eval_runtime": 57.1224, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 495 }, { "epoch": 0.045761734517356704, "grad_norm": 2.5211869469282977, "learning_rate": 1.2497497878735831e-06, "loss": 0.9542, "step": 496 }, { "epoch": 0.04585399607888364, "grad_norm": 1.8091471907694843, "learning_rate": 1.2497444362587352e-06, "loss": 0.7601, "step": 497 }, { "epoch": 0.04594625764041056, "grad_norm": 1.7687992668461012, "learning_rate": 1.249739028028563e-06, "loss": 0.7659, "step": 498 }, { "epoch": 0.046038519201937494, "grad_norm": 1.4396309371176, "learning_rate": 1.2497335631835569e-06, "loss": 0.878, "step": 499 }, { "epoch": 0.04613078076346442, "grad_norm": 1.9668782595980827, "learning_rate": 1.2497280417242117e-06, "loss": 0.8463, "step": 500 }, { "epoch": 0.04613078076346442, "eval_GEN Loss": 0.49217748641967773, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4544593095779419, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9750000238418579, "eval_runtime": 56.8259, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 500 }, { "epoch": 0.04622304232499135, "grad_norm": 2.6448659618140278, "learning_rate": 1.2497224636510282e-06, "loss": 0.9017, "step": 501 }, { "epoch": 0.04631530388651828, "grad_norm": 2.865230099490025, "learning_rate": 1.2497168289645117e-06, "loss": 0.5919, "step": 502 }, { "epoch": 0.04640756544804521, "grad_norm": 3.5435121302194768, "learning_rate": 1.2497111376651728e-06, "loss": 1.0819, "step": 503 }, { "epoch": 0.046499827009572135, "grad_norm": 2.1265478178651334, "learning_rate": 1.2497053897535275e-06, "loss": 0.9577, "step": 504 }, { "epoch": 0.04659208857109907, "grad_norm": 2.3646329293378567, "learning_rate": 1.249699585230096e-06, "loss": 0.7973, "step": 505 }, { "epoch": 0.04659208857109907, "eval_GEN Loss": 0.49786898493766785, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.4246281087398529, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9762019515037537, "eval_runtime": 55.8521, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 505 }, { "epoch": 0.04668435013262599, "grad_norm": 1.7789669025076071, "learning_rate": 1.2496937240954053e-06, "loss": 0.9174, "step": 506 }, { "epoch": 0.046776611694152925, "grad_norm": 1.4940974641561018, "learning_rate": 1.2496878063499859e-06, "loss": 0.7763, "step": 507 }, { "epoch": 0.04686887325567985, "grad_norm": 2.240464981910987, "learning_rate": 1.249681831994374e-06, "loss": 0.9162, "step": 508 }, { "epoch": 0.04696113481720678, "grad_norm": 1.7331241048782036, "learning_rate": 1.2496758010291115e-06, "loss": 0.7101, "step": 509 }, { "epoch": 0.04705339637873371, "grad_norm": 2.1776111323371206, "learning_rate": 1.2496697134547445e-06, "loss": 0.9251, "step": 510 }, { "epoch": 0.04705339637873371, "eval_GEN Loss": 0.5021944642066956, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.42142724990844727, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9699519276618958, "eval_runtime": 55.9135, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 510 }, { "epoch": 0.04714565794026064, "grad_norm": 1.8149877200200812, "learning_rate": 1.249663569271825e-06, "loss": 0.8276, "step": 511 }, { "epoch": 0.047237919501787566, "grad_norm": 2.311685094068292, "learning_rate": 1.2496573684809093e-06, "loss": 1.0577, "step": 512 }, { "epoch": 0.0473301810633145, "grad_norm": 1.8430300506162633, "learning_rate": 1.24965111108256e-06, "loss": 1.0098, "step": 513 }, { "epoch": 0.047422442624841424, "grad_norm": 1.7150755345180988, "learning_rate": 1.2496447970773435e-06, "loss": 0.8558, "step": 514 }, { "epoch": 0.047514704186368356, "grad_norm": 2.322171852550018, "learning_rate": 1.2496384264658322e-06, "loss": 1.1605, "step": 515 }, { "epoch": 0.047514704186368356, "eval_GEN Loss": 0.5072044730186462, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7169811320754716, "eval_PRM F1": 0.7945205479452054, "eval_PRM F1 AUC": 0.7407019381875328, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.5061312317848206, "eval_PRM NPV": 0.4186046511627907, "eval_PRM Precision": 0.9206349206349206, "eval_PRM Recall": 0.6987951807228916, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 1.0418870449066162, "eval_runtime": 56.1244, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 515 }, { "epoch": 0.04760696574789528, "grad_norm": 2.376452841356278, "learning_rate": 1.249631999248604e-06, "loss": 0.8696, "step": 516 }, { "epoch": 0.047699227309422214, "grad_norm": 2.1697200720346226, "learning_rate": 1.2496255154262405e-06, "loss": 0.7282, "step": 517 }, { "epoch": 0.04779148887094914, "grad_norm": 2.231618573506481, "learning_rate": 1.2496189749993296e-06, "loss": 1.0144, "step": 518 }, { "epoch": 0.04788375043247607, "grad_norm": 1.4477856564989626, "learning_rate": 1.249612377968464e-06, "loss": 0.7972, "step": 519 }, { "epoch": 0.047976011994003, "grad_norm": 2.522904308533631, "learning_rate": 1.2496057243342416e-06, "loss": 0.9651, "step": 520 }, { "epoch": 0.047976011994003, "eval_GEN Loss": 0.5013367533683777, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.44258493185043335, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9829326868057251, "eval_runtime": 56.1787, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 520 }, { "epoch": 0.04806827355552993, "grad_norm": 1.3827215268108803, "learning_rate": 1.2495990140972653e-06, "loss": 0.9284, "step": 521 }, { "epoch": 0.048160535117056855, "grad_norm": 1.9755875110206902, "learning_rate": 1.2495922472581435e-06, "loss": 0.8925, "step": 522 }, { "epoch": 0.04825279667858379, "grad_norm": 2.0814499114539373, "learning_rate": 1.2495854238174887e-06, "loss": 1.1083, "step": 523 }, { "epoch": 0.04834505824011071, "grad_norm": 2.5417062148450147, "learning_rate": 1.24957854377592e-06, "loss": 1.0285, "step": 524 }, { "epoch": 0.048437319801637645, "grad_norm": 1.4908946062519384, "learning_rate": 1.2495716071340602e-06, "loss": 0.8482, "step": 525 }, { "epoch": 0.048437319801637645, "eval_GEN Loss": 0.4994891285896301, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.44036853313446045, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9760817289352417, "eval_runtime": 55.9269, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 525 }, { "epoch": 0.04852958136316457, "grad_norm": 1.5067261309429942, "learning_rate": 1.2495646138925384e-06, "loss": 0.863, "step": 526 }, { "epoch": 0.0486218429246915, "grad_norm": 1.7909389832906948, "learning_rate": 1.2495575640519886e-06, "loss": 0.8381, "step": 527 }, { "epoch": 0.04871410448621843, "grad_norm": 1.603287958124817, "learning_rate": 1.2495504576130488e-06, "loss": 0.8497, "step": 528 }, { "epoch": 0.04880636604774536, "grad_norm": 2.4102436997096057, "learning_rate": 1.2495432945763638e-06, "loss": 0.8235, "step": 529 }, { "epoch": 0.048898627609272285, "grad_norm": 1.6308890605210715, "learning_rate": 1.2495360749425821e-06, "loss": 0.9034, "step": 530 }, { "epoch": 0.048898627609272285, "eval_GEN Loss": 0.49671459197998047, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM Loss": 0.4215235710144043, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9649639129638672, "eval_runtime": 55.754, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 530 }, { "epoch": 0.04899088917079922, "grad_norm": 1.6207713329635076, "learning_rate": 1.2495287987123587e-06, "loss": 0.9246, "step": 531 }, { "epoch": 0.04908315073232614, "grad_norm": 2.137962559846118, "learning_rate": 1.2495214658863521e-06, "loss": 1.0508, "step": 532 }, { "epoch": 0.049175412293853075, "grad_norm": 3.0740623866229284, "learning_rate": 1.2495140764652274e-06, "loss": 0.9697, "step": 533 }, { "epoch": 0.04926767385538, "grad_norm": 1.915824797340991, "learning_rate": 1.2495066304496542e-06, "loss": 0.7938, "step": 534 }, { "epoch": 0.04935993541690693, "grad_norm": 2.0017572967949744, "learning_rate": 1.2494991278403068e-06, "loss": 0.8639, "step": 535 }, { "epoch": 0.04935993541690693, "eval_GEN Loss": 0.49528592824935913, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM Loss": 0.4145190715789795, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9653846025466919, "eval_runtime": 55.8675, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 535 }, { "epoch": 0.04945219697843386, "grad_norm": 1.7101567064092154, "learning_rate": 1.2494915686378658e-06, "loss": 0.7717, "step": 536 }, { "epoch": 0.04954445853996079, "grad_norm": 1.8633417800502488, "learning_rate": 1.2494839528430158e-06, "loss": 0.9391, "step": 537 }, { "epoch": 0.049636720101487716, "grad_norm": 2.255765287910322, "learning_rate": 1.2494762804564472e-06, "loss": 0.9261, "step": 538 }, { "epoch": 0.04972898166301465, "grad_norm": 2.097067196958236, "learning_rate": 1.2494685514788548e-06, "loss": 0.8661, "step": 539 }, { "epoch": 0.049821243224541574, "grad_norm": 1.8120378173288358, "learning_rate": 1.2494607659109396e-06, "loss": 0.9078, "step": 540 }, { "epoch": 0.049821243224541574, "eval_GEN Loss": 0.500647246837616, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8789808917197452, "eval_PRM F1 AUC": 0.8069669984284967, "eval_PRM F1 Neg": 0.6545454545454545, "eval_PRM Loss": 0.44509997963905334, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.9324324324324325, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9778845906257629, "eval_runtime": 55.9283, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 540 }, { "epoch": 0.049913504786068506, "grad_norm": 1.9209686059123097, "learning_rate": 1.2494529237534067e-06, "loss": 0.9968, "step": 541 }, { "epoch": 0.05000576634759543, "grad_norm": 2.791385333364772, "learning_rate": 1.249445025006967e-06, "loss": 0.7469, "step": 542 }, { "epoch": 0.050098027909122364, "grad_norm": 2.070234368370357, "learning_rate": 1.2494370696723362e-06, "loss": 0.9128, "step": 543 }, { "epoch": 0.05019028947064929, "grad_norm": 1.8867484348866532, "learning_rate": 1.2494290577502354e-06, "loss": 0.8872, "step": 544 }, { "epoch": 0.05028255103217622, "grad_norm": 2.5572474728796784, "learning_rate": 1.2494209892413905e-06, "loss": 0.8109, "step": 545 }, { "epoch": 0.05028255103217622, "eval_GEN Loss": 0.5057682394981384, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8627450980392157, "eval_PRM F1 AUC": 0.8106338397066527, "eval_PRM F1 Neg": 0.6440677966101694, "eval_PRM Loss": 0.4570285379886627, "eval_PRM NPV": 0.5277777777777778, "eval_PRM Precision": 0.9428571428571428, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 0.9915865659713745, "eval_runtime": 55.772, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 545 }, { "epoch": 0.05037481259370315, "grad_norm": 1.5454658736067963, "learning_rate": 1.2494128641465328e-06, "loss": 0.9491, "step": 546 }, { "epoch": 0.05046707415523008, "grad_norm": 2.0036633039639886, "learning_rate": 1.2494046824663983e-06, "loss": 0.8376, "step": 547 }, { "epoch": 0.050559335716757005, "grad_norm": 1.4598488584859581, "learning_rate": 1.2493964442017286e-06, "loss": 0.8602, "step": 548 }, { "epoch": 0.05065159727828394, "grad_norm": 2.1035556200520196, "learning_rate": 1.2493881493532705e-06, "loss": 0.9633, "step": 549 }, { "epoch": 0.05074385883981086, "grad_norm": 2.1527492930053396, "learning_rate": 1.2493797979217755e-06, "loss": 0.8665, "step": 550 }, { "epoch": 0.05074385883981086, "eval_GEN Loss": 0.5002301931381226, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.4020197093486786, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9468749761581421, "eval_runtime": 56.4, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 550 }, { "epoch": 0.050836120401337795, "grad_norm": 1.833646828545211, "learning_rate": 1.2493713899080004e-06, "loss": 0.821, "step": 551 }, { "epoch": 0.05092838196286472, "grad_norm": 1.30148826318895, "learning_rate": 1.2493629253127071e-06, "loss": 0.8375, "step": 552 }, { "epoch": 0.05102064352439165, "grad_norm": 1.4962814588034477, "learning_rate": 1.2493544041366627e-06, "loss": 0.868, "step": 553 }, { "epoch": 0.05111290508591858, "grad_norm": 1.1764107105303518, "learning_rate": 1.2493458263806397e-06, "loss": 0.8314, "step": 554 }, { "epoch": 0.05120516664744551, "grad_norm": 1.8363744781281612, "learning_rate": 1.2493371920454148e-06, "loss": 0.7943, "step": 555 }, { "epoch": 0.05120516664744551, "eval_GEN Loss": 0.5007193684577942, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM Loss": 0.4065876603126526, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9555288553237915, "eval_runtime": 55.9094, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 555 }, { "epoch": 0.051297428208972436, "grad_norm": 1.550613414062432, "learning_rate": 1.249328501131771e-06, "loss": 0.8468, "step": 556 }, { "epoch": 0.05138968977049937, "grad_norm": 2.7132984825720463, "learning_rate": 1.2493197536404958e-06, "loss": 0.8685, "step": 557 }, { "epoch": 0.05148195133202629, "grad_norm": 1.942546454934521, "learning_rate": 1.2493109495723817e-06, "loss": 0.929, "step": 558 }, { "epoch": 0.051574212893553226, "grad_norm": 1.747050475065823, "learning_rate": 1.249302088928227e-06, "loss": 0.8059, "step": 559 }, { "epoch": 0.05166647445508015, "grad_norm": 2.179161275340723, "learning_rate": 1.2492931717088338e-06, "loss": 0.8583, "step": 560 }, { "epoch": 0.05166647445508015, "eval_GEN Loss": 0.4996907711029053, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4268765449523926, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9620192050933838, "eval_runtime": 56.3711, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 560 }, { "epoch": 0.05175873601660708, "grad_norm": 3.458615325297117, "learning_rate": 1.2492841979150112e-06, "loss": 1.1285, "step": 561 }, { "epoch": 0.05185099757813401, "grad_norm": 1.580788882347539, "learning_rate": 1.2492751675475717e-06, "loss": 0.9045, "step": 562 }, { "epoch": 0.05194325913966094, "grad_norm": 1.7784183829994715, "learning_rate": 1.2492660806073339e-06, "loss": 0.9334, "step": 563 }, { "epoch": 0.052035520701187866, "grad_norm": 2.05324686189782, "learning_rate": 1.2492569370951214e-06, "loss": 0.9087, "step": 564 }, { "epoch": 0.0521277822627148, "grad_norm": 2.1872773094388736, "learning_rate": 1.2492477370117626e-06, "loss": 0.9456, "step": 565 }, { "epoch": 0.0521277822627148, "eval_GEN Loss": 0.5036789178848267, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8289473684210527, "eval_PRM F1 AUC": 0.749083289680461, "eval_PRM F1 Neg": 0.5666666666666667, "eval_PRM Loss": 0.47351765632629395, "eval_PRM NPV": 0.4594594594594595, "eval_PRM Precision": 0.9130434782608695, "eval_PRM Recall": 0.7590361445783133, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9850360751152039, "eval_runtime": 56.0195, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 565 }, { "epoch": 0.052220043824241724, "grad_norm": 2.250551754667014, "learning_rate": 1.2492384803580913e-06, "loss": 1.0084, "step": 566 }, { "epoch": 0.052312305385768657, "grad_norm": 1.796614062913743, "learning_rate": 1.2492291671349464e-06, "loss": 0.8762, "step": 567 }, { "epoch": 0.05240456694729558, "grad_norm": 2.4404571448323558, "learning_rate": 1.2492197973431716e-06, "loss": 0.9033, "step": 568 }, { "epoch": 0.052496828508822514, "grad_norm": 2.0002215859856256, "learning_rate": 1.2492103709836166e-06, "loss": 0.8474, "step": 569 }, { "epoch": 0.05258909007034944, "grad_norm": 2.031138317769336, "learning_rate": 1.249200888057135e-06, "loss": 0.8613, "step": 570 }, { "epoch": 0.05258909007034944, "eval_GEN Loss": 0.5067321062088013, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8535031847133758, "eval_PRM F1 AUC": 0.751440544787847, "eval_PRM F1 Neg": 0.5818181818181818, "eval_PRM Loss": 0.45650914311408997, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9054054054054054, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9834134578704834, "eval_runtime": 55.9727, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 570 }, { "epoch": 0.05268135163187637, "grad_norm": 1.2268314366957531, "learning_rate": 1.2491913485645862e-06, "loss": 0.8199, "step": 571 }, { "epoch": 0.0527736131934033, "grad_norm": 2.776007518800226, "learning_rate": 1.2491817525068354e-06, "loss": 0.7782, "step": 572 }, { "epoch": 0.05286587475493023, "grad_norm": 1.7140385408739764, "learning_rate": 1.2491720998847515e-06, "loss": 0.8507, "step": 573 }, { "epoch": 0.052958136316457155, "grad_norm": 1.504065091867208, "learning_rate": 1.2491623906992092e-06, "loss": 0.7926, "step": 574 }, { "epoch": 0.05305039787798409, "grad_norm": 3.8341411486065207, "learning_rate": 1.2491526249510887e-06, "loss": 1.2054, "step": 575 }, { "epoch": 0.05305039787798409, "eval_GEN Loss": 0.5083337426185608, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.4059189558029175, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 1.0139423608779907, "eval_runtime": 55.9813, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 575 }, { "epoch": 0.05314265943951101, "grad_norm": 2.428060017967457, "learning_rate": 1.2491428026412752e-06, "loss": 0.8207, "step": 576 }, { "epoch": 0.053234921001037945, "grad_norm": 1.6934940756786587, "learning_rate": 1.2491329237706585e-06, "loss": 0.7227, "step": 577 }, { "epoch": 0.05332718256256487, "grad_norm": 2.866311618541313, "learning_rate": 1.2491229883401335e-06, "loss": 0.755, "step": 578 }, { "epoch": 0.0534194441240918, "grad_norm": 1.4945832523138576, "learning_rate": 1.249112996350601e-06, "loss": 0.8642, "step": 579 }, { "epoch": 0.05351170568561873, "grad_norm": 2.2047133714725686, "learning_rate": 1.2491029478029667e-06, "loss": 0.7895, "step": 580 }, { "epoch": 0.05351170568561873, "eval_GEN Loss": 0.5080254673957825, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.40413254499435425, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9838341474533081, "eval_runtime": 57.004, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 580 }, { "epoch": 0.05360396724714566, "grad_norm": 3.386791216845856, "learning_rate": 1.2490928426981406e-06, "loss": 1.0675, "step": 581 }, { "epoch": 0.053696228808672586, "grad_norm": 1.8008239620645539, "learning_rate": 1.2490826810370388e-06, "loss": 0.8744, "step": 582 }, { "epoch": 0.05378849037019952, "grad_norm": 2.1841412190942178, "learning_rate": 1.249072462820582e-06, "loss": 0.7634, "step": 583 }, { "epoch": 0.053880751931726444, "grad_norm": 1.8399717770459827, "learning_rate": 1.2490621880496968e-06, "loss": 0.953, "step": 584 }, { "epoch": 0.053973013493253376, "grad_norm": 1.8292775229199802, "learning_rate": 1.2490518567253136e-06, "loss": 0.9233, "step": 585 }, { "epoch": 0.053973013493253376, "eval_GEN Loss": 0.5101640820503235, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7264150943396226, "eval_PRM F1": 0.8053691275167785, "eval_PRM F1 AUC": 0.7310110005238345, "eval_PRM F1 Neg": 0.5396825396825397, "eval_PRM Loss": 0.48764801025390625, "eval_PRM NPV": 0.425, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.7228915662650602, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 1.0290865898132324, "eval_runtime": 55.8138, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 585 }, { "epoch": 0.0540652750547803, "grad_norm": 2.3623630200412364, "learning_rate": 1.2490414688483688e-06, "loss": 0.8771, "step": 586 }, { "epoch": 0.054157536616307234, "grad_norm": 2.680394664733209, "learning_rate": 1.2490310244198036e-06, "loss": 0.9148, "step": 587 }, { "epoch": 0.05424979817783416, "grad_norm": 2.3588791333181307, "learning_rate": 1.2490205234405652e-06, "loss": 0.8595, "step": 588 }, { "epoch": 0.05434205973936109, "grad_norm": 2.099221453060737, "learning_rate": 1.2490099659116045e-06, "loss": 0.88, "step": 589 }, { "epoch": 0.05443432130088802, "grad_norm": 1.8877239678915219, "learning_rate": 1.2489993518338784e-06, "loss": 0.7525, "step": 590 }, { "epoch": 0.05443432130088802, "eval_GEN Loss": 0.5080305337905884, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7169811320754716, "eval_PRM F1": 0.7945205479452054, "eval_PRM F1 AUC": 0.7407019381875328, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.5066564083099365, "eval_PRM NPV": 0.4186046511627907, "eval_PRM Precision": 0.9206349206349206, "eval_PRM Recall": 0.6987951807228916, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 1.0357571840286255, "eval_runtime": 55.6673, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 590 }, { "epoch": 0.05452658286241495, "grad_norm": 2.0831530454994596, "learning_rate": 1.248988681208349e-06, "loss": 0.8641, "step": 591 }, { "epoch": 0.054618844423941874, "grad_norm": 2.434562035432444, "learning_rate": 1.2489779540359831e-06, "loss": 0.9395, "step": 592 }, { "epoch": 0.05471110598546881, "grad_norm": 1.9821337764100029, "learning_rate": 1.2489671703177527e-06, "loss": 0.9168, "step": 593 }, { "epoch": 0.05480336754699573, "grad_norm": 1.6688384237423188, "learning_rate": 1.2489563300546353e-06, "loss": 0.9708, "step": 594 }, { "epoch": 0.054895629108522664, "grad_norm": 2.071824994069014, "learning_rate": 1.2489454332476133e-06, "loss": 1.0497, "step": 595 }, { "epoch": 0.054895629108522664, "eval_GEN Loss": 0.5029069185256958, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.45642784237861633, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9888221025466919, "eval_runtime": 55.781, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 595 }, { "epoch": 0.05498789067004959, "grad_norm": 1.5930169744134677, "learning_rate": 1.2489344798976737e-06, "loss": 0.8281, "step": 596 }, { "epoch": 0.05508015223157652, "grad_norm": 1.6643989876991003, "learning_rate": 1.2489234700058098e-06, "loss": 0.9325, "step": 597 }, { "epoch": 0.05517241379310345, "grad_norm": 2.053707907675361, "learning_rate": 1.2489124035730189e-06, "loss": 0.8368, "step": 598 }, { "epoch": 0.05526467535463038, "grad_norm": 1.3682926993227886, "learning_rate": 1.248901280600304e-06, "loss": 0.7565, "step": 599 }, { "epoch": 0.055356936916157305, "grad_norm": 1.3096687655332433, "learning_rate": 1.2488901010886727e-06, "loss": 0.8928, "step": 600 }, { "epoch": 0.055356936916157305, "eval_GEN Loss": 0.5018876194953918, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4348255693912506, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9718149304389954, "eval_runtime": 55.8031, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 600 }, { "epoch": 0.05544919847768424, "grad_norm": 1.6840601316309256, "learning_rate": 1.2488788650391388e-06, "loss": 0.9862, "step": 601 }, { "epoch": 0.05554146003921116, "grad_norm": 1.6312387559443748, "learning_rate": 1.2488675724527198e-06, "loss": 0.7968, "step": 602 }, { "epoch": 0.055633721600738095, "grad_norm": 2.4815635062361445, "learning_rate": 1.2488562233304396e-06, "loss": 0.9873, "step": 603 }, { "epoch": 0.05572598316226502, "grad_norm": 2.0552191331719247, "learning_rate": 1.2488448176733262e-06, "loss": 0.8915, "step": 604 }, { "epoch": 0.05581824472379195, "grad_norm": 2.117906169476475, "learning_rate": 1.2488333554824138e-06, "loss": 0.9145, "step": 605 }, { "epoch": 0.05581824472379195, "eval_GEN Loss": 0.5006439685821533, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.44969943165779114, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9799278974533081, "eval_runtime": 55.7109, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 605 }, { "epoch": 0.05591050628531888, "grad_norm": 2.038318905132651, "learning_rate": 1.2488218367587406e-06, "loss": 0.8549, "step": 606 }, { "epoch": 0.05600276784684581, "grad_norm": 1.778697446036608, "learning_rate": 1.2488102615033509e-06, "loss": 0.7878, "step": 607 }, { "epoch": 0.056095029408372736, "grad_norm": 1.8828030591591378, "learning_rate": 1.2487986297172933e-06, "loss": 0.7999, "step": 608 }, { "epoch": 0.05618729096989967, "grad_norm": 2.1397135575934847, "learning_rate": 1.248786941401622e-06, "loss": 0.9599, "step": 609 }, { "epoch": 0.056279552531426594, "grad_norm": 2.161450949773939, "learning_rate": 1.248775196557396e-06, "loss": 0.7918, "step": 610 }, { "epoch": 0.056279552531426594, "eval_GEN Loss": 0.49783971905708313, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.43421003222465515, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9634615182876587, "eval_runtime": 55.7168, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 610 }, { "epoch": 0.056371814092953526, "grad_norm": 1.7052262220432919, "learning_rate": 1.24876339518568e-06, "loss": 0.785, "step": 611 }, { "epoch": 0.05646407565448045, "grad_norm": 1.844819283964889, "learning_rate": 1.2487515372875434e-06, "loss": 0.8631, "step": 612 }, { "epoch": 0.056556337216007384, "grad_norm": 2.002989390981208, "learning_rate": 1.2487396228640606e-06, "loss": 0.7582, "step": 613 }, { "epoch": 0.05664859877753431, "grad_norm": 3.118346437681846, "learning_rate": 1.2487276519163114e-06, "loss": 0.9991, "step": 614 }, { "epoch": 0.05674086033906124, "grad_norm": 2.5488199308499677, "learning_rate": 1.2487156244453807e-06, "loss": 0.9039, "step": 615 }, { "epoch": 0.05674086033906124, "eval_GEN Loss": 0.4985102713108063, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.4201836884021759, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9504807591438293, "eval_runtime": 55.8043, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 615 }, { "epoch": 0.05683312190058817, "grad_norm": 3.8890403160471334, "learning_rate": 1.2487035404523583e-06, "loss": 1.1244, "step": 616 }, { "epoch": 0.0569253834621151, "grad_norm": 2.0172657598100177, "learning_rate": 1.2486913999383393e-06, "loss": 0.8988, "step": 617 }, { "epoch": 0.057017645023642025, "grad_norm": 1.4561923092029698, "learning_rate": 1.248679202904424e-06, "loss": 0.7902, "step": 618 }, { "epoch": 0.05710990658516896, "grad_norm": 2.702825562484095, "learning_rate": 1.2486669493517176e-06, "loss": 0.993, "step": 619 }, { "epoch": 0.05720216814669588, "grad_norm": 2.2481441663700052, "learning_rate": 1.2486546392813307e-06, "loss": 0.8837, "step": 620 }, { "epoch": 0.05720216814669588, "eval_GEN Loss": 0.4994538128376007, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM Loss": 0.45006895065307617, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9386418461799622, "eval_runtime": 55.781, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 620 }, { "epoch": 0.057294429708222815, "grad_norm": 1.5164571122984896, "learning_rate": 1.2486422726943786e-06, "loss": 0.8415, "step": 621 }, { "epoch": 0.05738669126974974, "grad_norm": 1.770771183189257, "learning_rate": 1.2486298495919822e-06, "loss": 0.8257, "step": 622 }, { "epoch": 0.05747895283127667, "grad_norm": 1.6682291902578132, "learning_rate": 1.2486173699752672e-06, "loss": 0.821, "step": 623 }, { "epoch": 0.0575712143928036, "grad_norm": 2.108982914483475, "learning_rate": 1.2486048338453646e-06, "loss": 0.9856, "step": 624 }, { "epoch": 0.05766347595433053, "grad_norm": 1.810862754522022, "learning_rate": 1.2485922412034102e-06, "loss": 0.786, "step": 625 }, { "epoch": 0.05766347595433053, "eval_GEN Loss": 0.5000378489494324, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.43361374735832214, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.932812511920929, "eval_runtime": 55.7417, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 625 }, { "epoch": 0.057755737515857455, "grad_norm": 1.772217409354434, "learning_rate": 1.2485795920505455e-06, "loss": 0.6705, "step": 626 }, { "epoch": 0.05784799907738439, "grad_norm": 2.001067166174967, "learning_rate": 1.2485668863879167e-06, "loss": 1.0233, "step": 627 }, { "epoch": 0.05794026063891131, "grad_norm": 1.4840923781348787, "learning_rate": 1.248554124216675e-06, "loss": 0.9001, "step": 628 }, { "epoch": 0.058032522200438245, "grad_norm": 1.8101679414620182, "learning_rate": 1.248541305537977e-06, "loss": 0.7187, "step": 629 }, { "epoch": 0.05812478376196517, "grad_norm": 2.073748668928117, "learning_rate": 1.2485284303529847e-06, "loss": 0.8885, "step": 630 }, { "epoch": 0.05812478376196517, "eval_GEN Loss": 0.501082181930542, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM Loss": 0.41623395681381226, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9604567289352417, "eval_runtime": 55.9232, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 630 }, { "epoch": 0.0582170453234921, "grad_norm": 1.993221305531676, "learning_rate": 1.2485154986628646e-06, "loss": 0.8211, "step": 631 }, { "epoch": 0.05830930688501903, "grad_norm": 1.6783005576180885, "learning_rate": 1.2485025104687885e-06, "loss": 0.8251, "step": 632 }, { "epoch": 0.05840156844654596, "grad_norm": 1.7378727446242044, "learning_rate": 1.248489465771933e-06, "loss": 0.8405, "step": 633 }, { "epoch": 0.058493830008072886, "grad_norm": 1.9168838737841298, "learning_rate": 1.2484763645734816e-06, "loss": 0.913, "step": 634 }, { "epoch": 0.05858609156959982, "grad_norm": 1.5552224413451192, "learning_rate": 1.24846320687462e-06, "loss": 0.9587, "step": 635 }, { "epoch": 0.05858609156959982, "eval_GEN Loss": 0.49984222650527954, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 Neg": 0.5, "eval_PRM Loss": 0.40613850951194763, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9527644515037537, "eval_runtime": 56.0062, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 635 }, { "epoch": 0.058678353131126744, "grad_norm": 2.752900272064645, "learning_rate": 1.2484499926765416e-06, "loss": 1.0392, "step": 636 }, { "epoch": 0.058770614692653676, "grad_norm": 2.478031843513477, "learning_rate": 1.2484367219804435e-06, "loss": 0.7721, "step": 637 }, { "epoch": 0.0588628762541806, "grad_norm": 1.750905595546406, "learning_rate": 1.2484233947875282e-06, "loss": 0.8989, "step": 638 }, { "epoch": 0.058955137815707534, "grad_norm": 1.7510339767346743, "learning_rate": 1.2484100110990035e-06, "loss": 0.9025, "step": 639 }, { "epoch": 0.05904739937723446, "grad_norm": 2.2048689696788135, "learning_rate": 1.2483965709160827e-06, "loss": 0.8448, "step": 640 }, { "epoch": 0.05904739937723446, "eval_GEN Loss": 0.5029840469360352, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM Loss": 0.39927953481674194, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9294471144676208, "eval_runtime": 55.8663, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 640 }, { "epoch": 0.05913966093876139, "grad_norm": 1.5209893142275832, "learning_rate": 1.248383074239983e-06, "loss": 0.7128, "step": 641 }, { "epoch": 0.05923192250028832, "grad_norm": 1.843063551533251, "learning_rate": 1.2483695210719282e-06, "loss": 0.792, "step": 642 }, { "epoch": 0.05932418406181525, "grad_norm": 1.4352538619861959, "learning_rate": 1.248355911413146e-06, "loss": 0.6026, "step": 643 }, { "epoch": 0.059416445623342175, "grad_norm": 3.812000845948826, "learning_rate": 1.2483422452648702e-06, "loss": 1.0718, "step": 644 }, { "epoch": 0.05950870718486911, "grad_norm": 3.590813734052817, "learning_rate": 1.2483285226283387e-06, "loss": 0.9815, "step": 645 }, { "epoch": 0.05950870718486911, "eval_GEN Loss": 0.502841591835022, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM Loss": 0.39608943462371826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9320913553237915, "eval_runtime": 55.9501, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 645 }, { "epoch": 0.05960096874639603, "grad_norm": 1.9928220967621102, "learning_rate": 1.2483147435047954e-06, "loss": 0.7131, "step": 646 }, { "epoch": 0.059693230307922965, "grad_norm": 1.9365920045835188, "learning_rate": 1.248300907895489e-06, "loss": 0.9459, "step": 647 }, { "epoch": 0.05978549186944989, "grad_norm": 2.6623701009527387, "learning_rate": 1.2482870158016733e-06, "loss": 0.7441, "step": 648 }, { "epoch": 0.05987775343097682, "grad_norm": 2.6690979217425994, "learning_rate": 1.2482730672246069e-06, "loss": 0.8438, "step": 649 }, { "epoch": 0.05997001499250375, "grad_norm": 1.74071030127736, "learning_rate": 1.2482590621655544e-06, "loss": 0.8071, "step": 650 }, { "epoch": 0.05997001499250375, "eval_GEN Loss": 0.5032788515090942, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4073921740055084, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9045072197914124, "eval_runtime": 55.6871, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 650 }, { "epoch": 0.06006227655403068, "grad_norm": 1.867697574685573, "learning_rate": 1.2482450006257845e-06, "loss": 0.7068, "step": 651 }, { "epoch": 0.060154538115557606, "grad_norm": 3.150656478669109, "learning_rate": 1.2482308826065717e-06, "loss": 1.0362, "step": 652 }, { "epoch": 0.06024679967708454, "grad_norm": 2.0723154529102277, "learning_rate": 1.2482167081091953e-06, "loss": 0.8605, "step": 653 }, { "epoch": 0.06033906123861146, "grad_norm": 1.5733706218276544, "learning_rate": 1.24820247713494e-06, "loss": 0.8048, "step": 654 }, { "epoch": 0.060431322800138396, "grad_norm": 1.9533228833495297, "learning_rate": 1.248188189685095e-06, "loss": 0.8584, "step": 655 }, { "epoch": 0.060431322800138396, "eval_GEN Loss": 0.5047159194946289, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.864516129032258, "eval_PRM F1 AUC": 0.7949188056574124, "eval_PRM F1 Neg": 0.631578947368421, "eval_PRM Loss": 0.43611615896224976, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.9305555555555556, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.907932698726654, "eval_runtime": 55.742, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 655 }, { "epoch": 0.06052358436166532, "grad_norm": 1.8164491320202634, "learning_rate": 1.2481738457609554e-06, "loss": 0.7616, "step": 656 }, { "epoch": 0.06061584592319225, "grad_norm": 2.9805106768035183, "learning_rate": 1.2481594453638213e-06, "loss": 1.0346, "step": 657 }, { "epoch": 0.06070810748471918, "grad_norm": 2.198359986050082, "learning_rate": 1.248144988494997e-06, "loss": 0.9404, "step": 658 }, { "epoch": 0.06080036904624611, "grad_norm": 1.7843818714451314, "learning_rate": 1.2481304751557932e-06, "loss": 0.7976, "step": 659 }, { "epoch": 0.060892630607773036, "grad_norm": 1.852373355865221, "learning_rate": 1.248115905347525e-06, "loss": 0.6315, "step": 660 }, { "epoch": 0.060892630607773036, "eval_GEN Loss": 0.5038718581199646, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.379349946975708, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.887620210647583, "eval_runtime": 55.8929, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 660 }, { "epoch": 0.06098489216929997, "grad_norm": 2.5190164743513677, "learning_rate": 1.2481012790715125e-06, "loss": 0.9121, "step": 661 }, { "epoch": 0.061077153730826894, "grad_norm": 2.1642822732493094, "learning_rate": 1.2480865963290814e-06, "loss": 0.9153, "step": 662 }, { "epoch": 0.061169415292353826, "grad_norm": 2.4869822741610736, "learning_rate": 1.2480718571215622e-06, "loss": 0.8426, "step": 663 }, { "epoch": 0.06126167685388075, "grad_norm": 1.4804113543475204, "learning_rate": 1.2480570614502905e-06, "loss": 0.7338, "step": 664 }, { "epoch": 0.061353938415407684, "grad_norm": 2.5825031570366948, "learning_rate": 1.2480422093166072e-06, "loss": 0.988, "step": 665 }, { "epoch": 0.061353938415407684, "eval_GEN Loss": 0.5030157566070557, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3597264587879181, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.891406238079071, "eval_runtime": 55.8048, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 665 }, { "epoch": 0.06144619997693461, "grad_norm": 2.4865553091482386, "learning_rate": 1.2480273007218583e-06, "loss": 0.7469, "step": 666 }, { "epoch": 0.06153846153846154, "grad_norm": 1.4962681330808214, "learning_rate": 1.2480123356673947e-06, "loss": 0.7616, "step": 667 }, { "epoch": 0.06163072309998847, "grad_norm": 3.3098298083873035, "learning_rate": 1.2479973141545727e-06, "loss": 1.007, "step": 668 }, { "epoch": 0.0617229846615154, "grad_norm": 1.9786754768724968, "learning_rate": 1.2479822361847532e-06, "loss": 0.9201, "step": 669 }, { "epoch": 0.061815246223042325, "grad_norm": 2.2883225948352206, "learning_rate": 1.2479671017593031e-06, "loss": 0.9133, "step": 670 }, { "epoch": 0.061815246223042325, "eval_GEN Loss": 0.5008916258811951, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8717948717948718, "eval_PRM F1 AUC": 0.8009429020429545, "eval_PRM F1 Neg": 0.6428571428571429, "eval_PRM Loss": 0.388599693775177, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.9315068493150684, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8749399185180664, "eval_runtime": 55.8347, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 670 }, { "epoch": 0.06190750778456926, "grad_norm": 1.6824160258294973, "learning_rate": 1.2479519108795937e-06, "loss": 0.8843, "step": 671 }, { "epoch": 0.06199976934609618, "grad_norm": 1.8734800223296395, "learning_rate": 1.2479366635470014e-06, "loss": 0.9205, "step": 672 }, { "epoch": 0.06209203090762311, "grad_norm": 2.410707480946803, "learning_rate": 1.2479213597629084e-06, "loss": 1.0086, "step": 673 }, { "epoch": 0.06218429246915004, "grad_norm": 2.0368417016154154, "learning_rate": 1.247905999528701e-06, "loss": 1.0038, "step": 674 }, { "epoch": 0.062276554030676966, "grad_norm": 1.6606314268932567, "learning_rate": 1.2478905828457716e-06, "loss": 0.9871, "step": 675 }, { "epoch": 0.062276554030676966, "eval_GEN Loss": 0.5003483295440674, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8533333333333334, "eval_PRM F1 AUC": 0.8203247773703509, "eval_PRM F1 Neg": 0.6451612903225806, "eval_PRM Loss": 0.4477854371070862, "eval_PRM NPV": 0.5128205128205128, "eval_PRM Precision": 0.9552238805970149, "eval_PRM Recall": 0.7710843373493976, "eval_PRM Specificty": 0.8695652173913043, "eval_loss": 0.9173076748847961, "eval_runtime": 55.7039, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 675 }, { "epoch": 0.0623688155922039, "grad_norm": 2.4488961881294107, "learning_rate": 1.247875109715517e-06, "loss": 0.9534, "step": 676 }, { "epoch": 0.062461077153730823, "grad_norm": 2.0301141579032165, "learning_rate": 1.2478595801393397e-06, "loss": 0.9554, "step": 677 }, { "epoch": 0.06255333871525776, "grad_norm": 1.7484711809717781, "learning_rate": 1.247843994118647e-06, "loss": 0.9209, "step": 678 }, { "epoch": 0.06264560027678469, "grad_norm": 2.031267928666826, "learning_rate": 1.2478283516548509e-06, "loss": 0.9142, "step": 679 }, { "epoch": 0.0627378618383116, "grad_norm": 1.884594680835046, "learning_rate": 1.2478126527493695e-06, "loss": 0.7914, "step": 680 }, { "epoch": 0.0627378618383116, "eval_GEN Loss": 0.49689099192619324, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8860759493670886, "eval_PRM F1 AUC": 0.8129910948140389, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3846823275089264, "eval_PRM NPV": 0.5806451612903226, "eval_PRM Precision": 0.9333333333333333, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.879687488079071, "eval_runtime": 56.6869, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 680 }, { "epoch": 0.06283012339983854, "grad_norm": 2.353693418975392, "learning_rate": 1.247796897403625e-06, "loss": 0.7576, "step": 681 }, { "epoch": 0.06292238496136547, "grad_norm": 2.459026074737489, "learning_rate": 1.2477810856190454e-06, "loss": 0.9668, "step": 682 }, { "epoch": 0.0630146465228924, "grad_norm": 1.5088873303678316, "learning_rate": 1.2477652173970633e-06, "loss": 0.7493, "step": 683 }, { "epoch": 0.06310690808441932, "grad_norm": 2.066196603628531, "learning_rate": 1.2477492927391172e-06, "loss": 0.996, "step": 684 }, { "epoch": 0.06319916964594625, "grad_norm": 2.563516949224603, "learning_rate": 1.2477333116466501e-06, "loss": 1.1314, "step": 685 }, { "epoch": 0.06319916964594625, "eval_GEN Loss": 0.49459177255630493, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.35469162464141846, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9004807472229004, "eval_runtime": 56.8087, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 685 }, { "epoch": 0.06329143120747319, "grad_norm": 1.7918439395513766, "learning_rate": 1.2477172741211097e-06, "loss": 0.7747, "step": 686 }, { "epoch": 0.06338369276900012, "grad_norm": 1.6754035191224634, "learning_rate": 1.2477011801639502e-06, "loss": 0.8361, "step": 687 }, { "epoch": 0.06347595433052704, "grad_norm": 2.9061349298415404, "learning_rate": 1.2476850297766294e-06, "loss": 0.9363, "step": 688 }, { "epoch": 0.06356821589205397, "grad_norm": 1.8680575195107672, "learning_rate": 1.247668822960611e-06, "loss": 0.7602, "step": 689 }, { "epoch": 0.0636604774535809, "grad_norm": 2.0860233465747173, "learning_rate": 1.247652559717364e-06, "loss": 0.7808, "step": 690 }, { "epoch": 0.0636604774535809, "eval_GEN Loss": 0.4925038814544678, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.35282284021377563, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.884495198726654, "eval_runtime": 56.5919, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 690 }, { "epoch": 0.06375273901510783, "grad_norm": 1.8577118351161288, "learning_rate": 1.2476362400483617e-06, "loss": 0.8205, "step": 691 }, { "epoch": 0.06384500057663475, "grad_norm": 1.4626529248849887, "learning_rate": 1.2476198639550833e-06, "loss": 0.7822, "step": 692 }, { "epoch": 0.06393726213816169, "grad_norm": 2.315929103420837, "learning_rate": 1.247603431439013e-06, "loss": 0.8778, "step": 693 }, { "epoch": 0.06402952369968862, "grad_norm": 1.4148957871947343, "learning_rate": 1.2475869425016396e-06, "loss": 0.7385, "step": 694 }, { "epoch": 0.06412178526121555, "grad_norm": 1.9927127988576974, "learning_rate": 1.2475703971444575e-06, "loss": 0.7152, "step": 695 }, { "epoch": 0.06412178526121555, "eval_GEN Loss": 0.49013301730155945, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.36663177609443665, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8553485870361328, "eval_runtime": 56.8218, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 695 }, { "epoch": 0.06421404682274247, "grad_norm": 2.207444043712501, "learning_rate": 1.2475537953689662e-06, "loss": 0.713, "step": 696 }, { "epoch": 0.0643063083842694, "grad_norm": 1.886201426859166, "learning_rate": 1.2475371371766702e-06, "loss": 0.8012, "step": 697 }, { "epoch": 0.06439856994579633, "grad_norm": 2.5680702309053136, "learning_rate": 1.2475204225690785e-06, "loss": 0.9574, "step": 698 }, { "epoch": 0.06449083150732327, "grad_norm": 2.658370152428033, "learning_rate": 1.2475036515477065e-06, "loss": 1.0898, "step": 699 }, { "epoch": 0.06458309306885018, "grad_norm": 2.197277787521508, "learning_rate": 1.2474868241140737e-06, "loss": 0.928, "step": 700 }, { "epoch": 0.06458309306885018, "eval_GEN Loss": 0.4897848963737488, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34977298974990845, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8474759459495544, "eval_runtime": 55.9244, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 700 }, { "epoch": 0.06467535463037712, "grad_norm": 2.42990179685859, "learning_rate": 1.2474699402697052e-06, "loss": 0.8279, "step": 701 }, { "epoch": 0.06476761619190405, "grad_norm": 2.472823147937655, "learning_rate": 1.2474530000161308e-06, "loss": 0.9482, "step": 702 }, { "epoch": 0.06485987775343098, "grad_norm": 2.446117329514279, "learning_rate": 1.2474360033548858e-06, "loss": 0.7692, "step": 703 }, { "epoch": 0.0649521393149579, "grad_norm": 1.973986088568778, "learning_rate": 1.2474189502875105e-06, "loss": 0.8697, "step": 704 }, { "epoch": 0.06504440087648483, "grad_norm": 2.7409896385756114, "learning_rate": 1.2474018408155502e-06, "loss": 0.8734, "step": 705 }, { "epoch": 0.06504440087648483, "eval_GEN Loss": 0.49004632234573364, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.3554302752017975, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8493990302085876, "eval_runtime": 56.0916, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 705 }, { "epoch": 0.06513666243801176, "grad_norm": 2.219226330814617, "learning_rate": 1.2473846749405556e-06, "loss": 1.0019, "step": 706 }, { "epoch": 0.0652289239995387, "grad_norm": 1.8740037144485404, "learning_rate": 1.2473674526640817e-06, "loss": 0.8388, "step": 707 }, { "epoch": 0.06532118556106561, "grad_norm": 2.2348521337067724, "learning_rate": 1.2473501739876899e-06, "loss": 1.0764, "step": 708 }, { "epoch": 0.06541344712259255, "grad_norm": 1.9185201204998532, "learning_rate": 1.2473328389129457e-06, "loss": 0.8188, "step": 709 }, { "epoch": 0.06550570868411948, "grad_norm": 1.7479011149182606, "learning_rate": 1.2473154474414201e-06, "loss": 0.8953, "step": 710 }, { "epoch": 0.06550570868411948, "eval_GEN Loss": 0.4939427077770233, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8789808917197452, "eval_PRM F1 AUC": 0.8069669984284967, "eval_PRM F1 Neg": 0.6545454545454545, "eval_PRM Loss": 0.3669225573539734, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.9324324324324325, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8590745329856873, "eval_runtime": 55.7164, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 710 }, { "epoch": 0.06559797024564641, "grad_norm": 1.9154297915300535, "learning_rate": 1.247297999574689e-06, "loss": 0.8618, "step": 711 }, { "epoch": 0.06569023180717333, "grad_norm": 2.020703353307214, "learning_rate": 1.2472804953143337e-06, "loss": 0.8877, "step": 712 }, { "epoch": 0.06578249336870026, "grad_norm": 1.8524179286156006, "learning_rate": 1.2472629346619405e-06, "loss": 0.7848, "step": 713 }, { "epoch": 0.0658747549302272, "grad_norm": 1.9779243978117849, "learning_rate": 1.2472453176191007e-06, "loss": 0.8378, "step": 714 }, { "epoch": 0.06596701649175413, "grad_norm": 2.1877741410284397, "learning_rate": 1.2472276441874107e-06, "loss": 0.8562, "step": 715 }, { "epoch": 0.06596701649175413, "eval_GEN Loss": 0.49638262391090393, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3564877510070801, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.859375, "eval_runtime": 55.895, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 715 }, { "epoch": 0.06605927805328105, "grad_norm": 2.4350153073154597, "learning_rate": 1.2472099143684723e-06, "loss": 0.8768, "step": 716 }, { "epoch": 0.06615153961480798, "grad_norm": 1.4549457216393873, "learning_rate": 1.247192128163892e-06, "loss": 0.7692, "step": 717 }, { "epoch": 0.06624380117633491, "grad_norm": 2.505367115067907, "learning_rate": 1.2471742855752816e-06, "loss": 0.8329, "step": 718 }, { "epoch": 0.06633606273786184, "grad_norm": 1.8190506564213158, "learning_rate": 1.2471563866042583e-06, "loss": 0.9022, "step": 719 }, { "epoch": 0.06642832429938876, "grad_norm": 1.7817688080675171, "learning_rate": 1.247138431252444e-06, "loss": 0.9805, "step": 720 }, { "epoch": 0.06642832429938876, "eval_GEN Loss": 0.4984198212623596, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34813085198402405, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8671875, "eval_runtime": 55.8061, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 720 }, { "epoch": 0.06652058586091569, "grad_norm": 2.7336873193573243, "learning_rate": 1.2471204195214656e-06, "loss": 0.8606, "step": 721 }, { "epoch": 0.06661284742244263, "grad_norm": 2.3306084563214933, "learning_rate": 1.2471023514129557e-06, "loss": 0.7781, "step": 722 }, { "epoch": 0.06670510898396956, "grad_norm": 1.7219822318993079, "learning_rate": 1.2470842269285517e-06, "loss": 0.8055, "step": 723 }, { "epoch": 0.06679737054549648, "grad_norm": 1.9205101088879777, "learning_rate": 1.2470660460698954e-06, "loss": 0.9165, "step": 724 }, { "epoch": 0.06688963210702341, "grad_norm": 2.9798148380574, "learning_rate": 1.2470478088386351e-06, "loss": 0.9771, "step": 725 }, { "epoch": 0.06688963210702341, "eval_GEN Loss": 0.49796873331069946, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34290528297424316, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8899038434028625, "eval_runtime": 56.1946, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 725 }, { "epoch": 0.06698189366855034, "grad_norm": 2.662186811434316, "learning_rate": 1.2470295152364233e-06, "loss": 0.9973, "step": 726 }, { "epoch": 0.06707415523007727, "grad_norm": 2.2845077888095373, "learning_rate": 1.2470111652649179e-06, "loss": 0.9237, "step": 727 }, { "epoch": 0.06716641679160419, "grad_norm": 2.720090139434416, "learning_rate": 1.2469927589257813e-06, "loss": 0.7501, "step": 728 }, { "epoch": 0.06725867835313112, "grad_norm": 1.522941660785064, "learning_rate": 1.2469742962206818e-06, "loss": 0.8071, "step": 729 }, { "epoch": 0.06735093991465806, "grad_norm": 1.4019671017176252, "learning_rate": 1.2469557771512929e-06, "loss": 0.7039, "step": 730 }, { "epoch": 0.06735093991465806, "eval_GEN Loss": 0.4958108067512512, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.36516496539115906, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8774639368057251, "eval_runtime": 55.7974, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 730 }, { "epoch": 0.06744320147618499, "grad_norm": 1.1680217200435885, "learning_rate": 1.2469372017192924e-06, "loss": 0.8015, "step": 731 }, { "epoch": 0.06753546303771191, "grad_norm": 1.5781252944765307, "learning_rate": 1.2469185699263637e-06, "loss": 0.8491, "step": 732 }, { "epoch": 0.06762772459923884, "grad_norm": 1.8145479068747337, "learning_rate": 1.2468998817741953e-06, "loss": 0.7989, "step": 733 }, { "epoch": 0.06771998616076577, "grad_norm": 1.6535751360344864, "learning_rate": 1.2468811372644807e-06, "loss": 0.9262, "step": 734 }, { "epoch": 0.0678122477222927, "grad_norm": 1.9278342852110244, "learning_rate": 1.2468623363989185e-06, "loss": 1.0176, "step": 735 }, { "epoch": 0.0678122477222927, "eval_GEN Loss": 0.49498119950294495, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8481012658227848, "eval_PRM F1 AUC": 0.7297014143530645, "eval_PRM F1 Neg": 0.5555555555555556, "eval_PRM Loss": 0.4146951138973236, "eval_PRM NPV": 0.4838709677419355, "eval_PRM Precision": 0.8933333333333333, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8856971263885498, "eval_runtime": 55.6896, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 735 }, { "epoch": 0.06790450928381962, "grad_norm": 1.6121518007170748, "learning_rate": 1.2468434791792128e-06, "loss": 0.9168, "step": 736 }, { "epoch": 0.06799677084534655, "grad_norm": 2.38794987956524, "learning_rate": 1.246824565607072e-06, "loss": 0.9095, "step": 737 }, { "epoch": 0.06808903240687349, "grad_norm": 1.813456431482765, "learning_rate": 1.2468055956842105e-06, "loss": 0.9157, "step": 738 }, { "epoch": 0.06818129396840042, "grad_norm": 1.4495805711914043, "learning_rate": 1.2467865694123468e-06, "loss": 0.5399, "step": 739 }, { "epoch": 0.06827355552992734, "grad_norm": 2.3167972690740153, "learning_rate": 1.2467674867932058e-06, "loss": 0.7926, "step": 740 }, { "epoch": 0.06827355552992734, "eval_GEN Loss": 0.49450138211250305, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8407643312101911, "eval_PRM F1 AUC": 0.7236773179675223, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.43435630202293396, "eval_PRM NPV": 0.46875, "eval_PRM Precision": 0.8918918918918919, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8999999761581421, "eval_runtime": 55.9371, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 740 }, { "epoch": 0.06836581709145427, "grad_norm": 1.5071480108442745, "learning_rate": 1.2467483478285164e-06, "loss": 0.7966, "step": 741 }, { "epoch": 0.0684580786529812, "grad_norm": 2.702874301518555, "learning_rate": 1.2467291525200132e-06, "loss": 1.0614, "step": 742 }, { "epoch": 0.06855034021450813, "grad_norm": 2.365685824108943, "learning_rate": 1.2467099008694353e-06, "loss": 0.9154, "step": 743 }, { "epoch": 0.06864260177603505, "grad_norm": 2.95301854010953, "learning_rate": 1.2466905928785278e-06, "loss": 0.8738, "step": 744 }, { "epoch": 0.06873486333756199, "grad_norm": 1.5476261126743078, "learning_rate": 1.24667122854904e-06, "loss": 0.6732, "step": 745 }, { "epoch": 0.06873486333756199, "eval_GEN Loss": 0.4933946132659912, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM Loss": 0.4207013249397278, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9192307591438293, "eval_runtime": 55.8318, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 745 }, { "epoch": 0.06882712489908892, "grad_norm": 2.3640495382258315, "learning_rate": 1.2466518078827272e-06, "loss": 0.9631, "step": 746 }, { "epoch": 0.06891938646061585, "grad_norm": 2.8018933198562173, "learning_rate": 1.246632330881349e-06, "loss": 0.859, "step": 747 }, { "epoch": 0.06901164802214277, "grad_norm": 1.8883189644042988, "learning_rate": 1.2466127975466704e-06, "loss": 0.9006, "step": 748 }, { "epoch": 0.0691039095836697, "grad_norm": 1.6165626373161106, "learning_rate": 1.2465932078804618e-06, "loss": 0.6278, "step": 749 }, { "epoch": 0.06919617114519663, "grad_norm": 2.5763895171342583, "learning_rate": 1.2465735618844982e-06, "loss": 0.7422, "step": 750 }, { "epoch": 0.06919617114519663, "eval_GEN Loss": 0.4946337640285492, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8407643312101911, "eval_PRM F1 AUC": 0.7236773179675223, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.4318975508213043, "eval_PRM NPV": 0.46875, "eval_PRM Precision": 0.8918918918918919, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9271033406257629, "eval_runtime": 55.804, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 750 }, { "epoch": 0.06928843270672357, "grad_norm": 1.6546090660530792, "learning_rate": 1.2465538595605603e-06, "loss": 0.8247, "step": 751 }, { "epoch": 0.06938069426825048, "grad_norm": 2.1096823021207367, "learning_rate": 1.2465341009104332e-06, "loss": 0.8506, "step": 752 }, { "epoch": 0.06947295582977742, "grad_norm": 2.1639271288843616, "learning_rate": 1.2465142859359071e-06, "loss": 1.0005, "step": 753 }, { "epoch": 0.06956521739130435, "grad_norm": 2.036608387513846, "learning_rate": 1.2464944146387788e-06, "loss": 0.7255, "step": 754 }, { "epoch": 0.06965747895283128, "grad_norm": 2.231108365933131, "learning_rate": 1.2464744870208482e-06, "loss": 0.8253, "step": 755 }, { "epoch": 0.06965747895283128, "eval_GEN Loss": 0.49510422348976135, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8481012658227848, "eval_PRM F1 AUC": 0.7297014143530645, "eval_PRM F1 Neg": 0.5555555555555556, "eval_PRM Loss": 0.42670556902885437, "eval_PRM NPV": 0.4838709677419355, "eval_PRM Precision": 0.8933333333333333, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9216346144676208, "eval_runtime": 55.7729, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 755 }, { "epoch": 0.0697497405143582, "grad_norm": 2.458747699242366, "learning_rate": 1.2464545030839211e-06, "loss": 0.88, "step": 756 }, { "epoch": 0.06984200207588513, "grad_norm": 1.7411311492077937, "learning_rate": 1.2464344628298089e-06, "loss": 0.779, "step": 757 }, { "epoch": 0.06993426363741206, "grad_norm": 1.7288453764623393, "learning_rate": 1.2464143662603276e-06, "loss": 0.7594, "step": 758 }, { "epoch": 0.070026525198939, "grad_norm": 1.8324765053708996, "learning_rate": 1.2463942133772982e-06, "loss": 0.7864, "step": 759 }, { "epoch": 0.07011878676046591, "grad_norm": 2.4382269154942757, "learning_rate": 1.2463740041825472e-06, "loss": 0.8951, "step": 760 }, { "epoch": 0.07011878676046591, "eval_GEN Loss": 0.4967345595359802, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.4055047035217285, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9228966236114502, "eval_runtime": 55.7798, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 760 }, { "epoch": 0.07021104832199285, "grad_norm": 1.8272948263291933, "learning_rate": 1.2463537386779058e-06, "loss": 0.949, "step": 761 }, { "epoch": 0.07030330988351978, "grad_norm": 1.7831105003221732, "learning_rate": 1.2463334168652106e-06, "loss": 0.9366, "step": 762 }, { "epoch": 0.07039557144504671, "grad_norm": 1.4386035838480709, "learning_rate": 1.2463130387463033e-06, "loss": 0.7774, "step": 763 }, { "epoch": 0.07048783300657363, "grad_norm": 2.5212138362814307, "learning_rate": 1.2462926043230303e-06, "loss": 0.9012, "step": 764 }, { "epoch": 0.07058009456810056, "grad_norm": 1.7618420271161546, "learning_rate": 1.2462721135972436e-06, "loss": 0.8087, "step": 765 }, { "epoch": 0.07058009456810056, "eval_GEN Loss": 0.4948992133140564, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM Loss": 0.3998696208000183, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.901562511920929, "eval_runtime": 55.6741, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 765 }, { "epoch": 0.0706723561296275, "grad_norm": 1.9743598065521322, "learning_rate": 1.2462515665708e-06, "loss": 0.6323, "step": 766 }, { "epoch": 0.07076461769115443, "grad_norm": 1.8900912865651107, "learning_rate": 1.2462309632455616e-06, "loss": 0.8452, "step": 767 }, { "epoch": 0.07085687925268135, "grad_norm": 1.9386372731860115, "learning_rate": 1.2462103036233957e-06, "loss": 0.8129, "step": 768 }, { "epoch": 0.07094914081420828, "grad_norm": 1.5221375336860836, "learning_rate": 1.246189587706174e-06, "loss": 0.7972, "step": 769 }, { "epoch": 0.07104140237573521, "grad_norm": 1.946764142267064, "learning_rate": 1.2461688154957744e-06, "loss": 0.759, "step": 770 }, { "epoch": 0.07104140237573521, "eval_GEN Loss": 0.4942178428173065, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.39047446846961975, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8980769515037537, "eval_runtime": 55.8653, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 770 }, { "epoch": 0.07113366393726214, "grad_norm": 2.1233654864649485, "learning_rate": 1.2461479869940787e-06, "loss": 0.8307, "step": 771 }, { "epoch": 0.07122592549878906, "grad_norm": 2.017896776743582, "learning_rate": 1.2461271022029748e-06, "loss": 1.0371, "step": 772 }, { "epoch": 0.071318187060316, "grad_norm": 1.7703832595630926, "learning_rate": 1.2461061611243553e-06, "loss": 0.9259, "step": 773 }, { "epoch": 0.07141044862184293, "grad_norm": 2.8705218440160527, "learning_rate": 1.246085163760118e-06, "loss": 0.8962, "step": 774 }, { "epoch": 0.07150271018336986, "grad_norm": 2.6644405002345675, "learning_rate": 1.246064110112165e-06, "loss": 0.9875, "step": 775 }, { "epoch": 0.07150271018336986, "eval_GEN Loss": 0.4935784339904785, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.3880944550037384, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8998197317123413, "eval_runtime": 55.8179, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 775 }, { "epoch": 0.07159497174489678, "grad_norm": 2.039120209572376, "learning_rate": 1.2460430001824053e-06, "loss": 0.8678, "step": 776 }, { "epoch": 0.07168723330642371, "grad_norm": 1.8770441809021905, "learning_rate": 1.2460218339727512e-06, "loss": 0.7401, "step": 777 }, { "epoch": 0.07177949486795064, "grad_norm": 2.367333899626303, "learning_rate": 1.2460006114851212e-06, "loss": 1.145, "step": 778 }, { "epoch": 0.07187175642947757, "grad_norm": 1.5591185213212513, "learning_rate": 1.245979332721438e-06, "loss": 0.9962, "step": 779 }, { "epoch": 0.07196401799100449, "grad_norm": 2.1569361671091802, "learning_rate": 1.2459579976836303e-06, "loss": 0.9726, "step": 780 }, { "epoch": 0.07196401799100449, "eval_GEN Loss": 0.49650710821151733, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.3951421082019806, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9027644395828247, "eval_runtime": 56.9022, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 780 }, { "epoch": 0.07205627955253142, "grad_norm": 1.8591473145629258, "learning_rate": 1.2459366063736318e-06, "loss": 0.8798, "step": 781 }, { "epoch": 0.07214854111405836, "grad_norm": 2.414556386299106, "learning_rate": 1.2459151587933801e-06, "loss": 0.7836, "step": 782 }, { "epoch": 0.07224080267558529, "grad_norm": 1.7918474384343825, "learning_rate": 1.2458936549448198e-06, "loss": 0.7399, "step": 783 }, { "epoch": 0.07233306423711221, "grad_norm": 1.9349954353770182, "learning_rate": 1.2458720948298992e-06, "loss": 0.8301, "step": 784 }, { "epoch": 0.07242532579863914, "grad_norm": 2.243189487230969, "learning_rate": 1.2458504784505717e-06, "loss": 0.8181, "step": 785 }, { "epoch": 0.07242532579863914, "eval_GEN Loss": 0.49928420782089233, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.37937721610069275, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9114182591438293, "eval_runtime": 56.9808, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 785 }, { "epoch": 0.07251758736016607, "grad_norm": 2.163418551734592, "learning_rate": 1.245828805808797e-06, "loss": 0.5935, "step": 786 }, { "epoch": 0.072609848921693, "grad_norm": 2.1430336298179045, "learning_rate": 1.2458070769065385e-06, "loss": 0.9858, "step": 787 }, { "epoch": 0.07270211048321992, "grad_norm": 2.756131543633587, "learning_rate": 1.2457852917457656e-06, "loss": 0.919, "step": 788 }, { "epoch": 0.07279437204474686, "grad_norm": 3.10291318997362, "learning_rate": 1.2457634503284525e-06, "loss": 0.7908, "step": 789 }, { "epoch": 0.07288663360627379, "grad_norm": 1.9828118890125443, "learning_rate": 1.2457415526565784e-06, "loss": 0.9122, "step": 790 }, { "epoch": 0.07288663360627379, "eval_GEN Loss": 0.4999357759952545, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37910550832748413, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9312499761581421, "eval_runtime": 56.6552, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 790 }, { "epoch": 0.07297889516780072, "grad_norm": 1.8759492012191048, "learning_rate": 1.2457195987321278e-06, "loss": 1.0204, "step": 791 }, { "epoch": 0.07307115672932764, "grad_norm": 1.7356039772475023, "learning_rate": 1.2456975885570899e-06, "loss": 0.8332, "step": 792 }, { "epoch": 0.07316341829085457, "grad_norm": 2.2456585233178714, "learning_rate": 1.2456755221334597e-06, "loss": 0.8643, "step": 793 }, { "epoch": 0.0732556798523815, "grad_norm": 1.6329985065250308, "learning_rate": 1.2456533994632366e-06, "loss": 0.5548, "step": 794 }, { "epoch": 0.07334794141390844, "grad_norm": 2.2492550574621477, "learning_rate": 1.2456312205484256e-06, "loss": 0.8706, "step": 795 }, { "epoch": 0.07334794141390844, "eval_GEN Loss": 0.4971840977668762, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.39162924885749817, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9308894276618958, "eval_runtime": 57.1847, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 795 }, { "epoch": 0.07344020297543535, "grad_norm": 2.33775263480178, "learning_rate": 1.2456089853910366e-06, "loss": 0.8396, "step": 796 }, { "epoch": 0.07353246453696229, "grad_norm": 1.9459634424275452, "learning_rate": 1.2455866939930844e-06, "loss": 0.924, "step": 797 }, { "epoch": 0.07362472609848922, "grad_norm": 2.163106136718416, "learning_rate": 1.2455643463565893e-06, "loss": 0.6806, "step": 798 }, { "epoch": 0.07371698766001615, "grad_norm": 1.5412218241088955, "learning_rate": 1.245541942483576e-06, "loss": 0.8529, "step": 799 }, { "epoch": 0.07380924922154307, "grad_norm": 2.0771376002130038, "learning_rate": 1.2455194823760756e-06, "loss": 0.9164, "step": 800 }, { "epoch": 0.07380924922154307, "eval_GEN Loss": 0.4945929944515228, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.4143304228782654, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9093149304389954, "eval_runtime": 57.0837, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 800 }, { "epoch": 0.07390151078307, "grad_norm": 2.203026010894973, "learning_rate": 1.2454969660361228e-06, "loss": 0.912, "step": 801 }, { "epoch": 0.07399377234459693, "grad_norm": 1.6362508475412942, "learning_rate": 1.2454743934657582e-06, "loss": 0.6309, "step": 802 }, { "epoch": 0.07408603390612387, "grad_norm": 1.8245987540417024, "learning_rate": 1.2454517646670273e-06, "loss": 0.9523, "step": 803 }, { "epoch": 0.07417829546765078, "grad_norm": 2.565586744284615, "learning_rate": 1.245429079641981e-06, "loss": 0.7819, "step": 804 }, { "epoch": 0.07427055702917772, "grad_norm": 1.4786286126417236, "learning_rate": 1.245406338392675e-06, "loss": 0.8991, "step": 805 }, { "epoch": 0.07427055702917772, "eval_GEN Loss": 0.4920736849308014, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4271751940250397, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.90234375, "eval_runtime": 56.8199, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 805 }, { "epoch": 0.07436281859070465, "grad_norm": 2.533897967555276, "learning_rate": 1.2453835409211701e-06, "loss": 0.7043, "step": 806 }, { "epoch": 0.07445508015223158, "grad_norm": 1.8240446733405726, "learning_rate": 1.2453606872295321e-06, "loss": 0.9383, "step": 807 }, { "epoch": 0.0745473417137585, "grad_norm": 2.5124258386859206, "learning_rate": 1.2453377773198321e-06, "loss": 0.8692, "step": 808 }, { "epoch": 0.07463960327528543, "grad_norm": 2.7066494905774383, "learning_rate": 1.2453148111941465e-06, "loss": 0.9071, "step": 809 }, { "epoch": 0.07473186483681236, "grad_norm": 1.408810146832989, "learning_rate": 1.2452917888545563e-06, "loss": 0.7177, "step": 810 }, { "epoch": 0.07473186483681236, "eval_GEN Loss": 0.4875481426715851, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.3897683620452881, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9242788553237915, "eval_runtime": 56.6804, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 810 }, { "epoch": 0.0748241263983393, "grad_norm": 1.8834786631308178, "learning_rate": 1.2452687103031478e-06, "loss": 0.875, "step": 811 }, { "epoch": 0.07491638795986622, "grad_norm": 1.5732525514551252, "learning_rate": 1.2452455755420124e-06, "loss": 0.6362, "step": 812 }, { "epoch": 0.07500864952139315, "grad_norm": 2.282625772188802, "learning_rate": 1.2452223845732467e-06, "loss": 1.0403, "step": 813 }, { "epoch": 0.07510091108292008, "grad_norm": 2.104306217863785, "learning_rate": 1.2451991373989522e-06, "loss": 0.7805, "step": 814 }, { "epoch": 0.07519317264444701, "grad_norm": 1.633308231347707, "learning_rate": 1.245175834021236e-06, "loss": 0.7325, "step": 815 }, { "epoch": 0.07519317264444701, "eval_GEN Loss": 0.4881250858306885, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM Loss": 0.3997836709022522, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9693509340286255, "eval_runtime": 56.7256, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 815 }, { "epoch": 0.07528543420597393, "grad_norm": 2.0255801243871656, "learning_rate": 1.2451524744422091e-06, "loss": 0.9489, "step": 816 }, { "epoch": 0.07537769576750086, "grad_norm": 2.9147138178744822, "learning_rate": 1.245129058663989e-06, "loss": 1.0011, "step": 817 }, { "epoch": 0.0754699573290278, "grad_norm": 1.4163130766664815, "learning_rate": 1.2451055866886974e-06, "loss": 0.6281, "step": 818 }, { "epoch": 0.07556221889055473, "grad_norm": 1.5326618856461074, "learning_rate": 1.2450820585184618e-06, "loss": 0.861, "step": 819 }, { "epoch": 0.07565448045208165, "grad_norm": 2.2389560997418094, "learning_rate": 1.2450584741554137e-06, "loss": 0.9153, "step": 820 }, { "epoch": 0.07565448045208165, "eval_GEN Loss": 0.48855963349342346, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM Loss": 0.4276357591152191, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9779447317123413, "eval_runtime": 56.9661, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 820 }, { "epoch": 0.07574674201360858, "grad_norm": 2.416810091664023, "learning_rate": 1.2450348336016907e-06, "loss": 0.8267, "step": 821 }, { "epoch": 0.07583900357513551, "grad_norm": 2.376343332622679, "learning_rate": 1.2450111368594353e-06, "loss": 0.9099, "step": 822 }, { "epoch": 0.07593126513666244, "grad_norm": 1.5609925923787278, "learning_rate": 1.2449873839307946e-06, "loss": 0.7421, "step": 823 }, { "epoch": 0.07602352669818936, "grad_norm": 2.0250215905922775, "learning_rate": 1.2449635748179214e-06, "loss": 0.7673, "step": 824 }, { "epoch": 0.0761157882597163, "grad_norm": 2.381198063048954, "learning_rate": 1.2449397095229733e-06, "loss": 0.8431, "step": 825 }, { "epoch": 0.0761157882597163, "eval_GEN Loss": 0.48923951387405396, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM Loss": 0.4137907922267914, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9695913195610046, "eval_runtime": 56.8733, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 825 }, { "epoch": 0.07620804982124323, "grad_norm": 2.3543419232709706, "learning_rate": 1.2449157880481128e-06, "loss": 0.7274, "step": 826 }, { "epoch": 0.07630031138277016, "grad_norm": 1.5937985167746698, "learning_rate": 1.244891810395508e-06, "loss": 0.8499, "step": 827 }, { "epoch": 0.07639257294429708, "grad_norm": 1.944719113741731, "learning_rate": 1.2448677765673314e-06, "loss": 0.8374, "step": 828 }, { "epoch": 0.07648483450582401, "grad_norm": 2.5598233470175784, "learning_rate": 1.2448436865657613e-06, "loss": 0.8337, "step": 829 }, { "epoch": 0.07657709606735094, "grad_norm": 1.9857330422071102, "learning_rate": 1.2448195403929806e-06, "loss": 0.8968, "step": 830 }, { "epoch": 0.07657709606735094, "eval_GEN Loss": 0.4866617023944855, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM Loss": 0.40177038311958313, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9986177682876587, "eval_runtime": 56.8728, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 830 }, { "epoch": 0.07666935762887787, "grad_norm": 2.135657820144189, "learning_rate": 1.2447953380511777e-06, "loss": 0.7917, "step": 831 }, { "epoch": 0.07676161919040479, "grad_norm": 2.611450488338792, "learning_rate": 1.2447710795425455e-06, "loss": 0.9619, "step": 832 }, { "epoch": 0.07685388075193172, "grad_norm": 1.8469631495600116, "learning_rate": 1.2447467648692827e-06, "loss": 0.747, "step": 833 }, { "epoch": 0.07694614231345866, "grad_norm": 1.6536962967012152, "learning_rate": 1.2447223940335923e-06, "loss": 0.6887, "step": 834 }, { "epoch": 0.07703840387498559, "grad_norm": 2.2203734977559035, "learning_rate": 1.2446979670376833e-06, "loss": 1.023, "step": 835 }, { "epoch": 0.07703840387498559, "eval_GEN Loss": 0.4862686097621918, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.4109131097793579, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9471153616905212, "eval_runtime": 56.6381, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 835 }, { "epoch": 0.07713066543651251, "grad_norm": 1.8404547050667157, "learning_rate": 1.244673483883769e-06, "loss": 0.8868, "step": 836 }, { "epoch": 0.07722292699803944, "grad_norm": 1.6246090485457525, "learning_rate": 1.2446489445740683e-06, "loss": 0.7601, "step": 837 }, { "epoch": 0.07731518855956637, "grad_norm": 1.585357583735492, "learning_rate": 1.244624349110805e-06, "loss": 0.8628, "step": 838 }, { "epoch": 0.0774074501210933, "grad_norm": 2.995908072129442, "learning_rate": 1.2445996974962078e-06, "loss": 0.8864, "step": 839 }, { "epoch": 0.07749971168262022, "grad_norm": 2.71225165118734, "learning_rate": 1.2445749897325106e-06, "loss": 0.8182, "step": 840 }, { "epoch": 0.07749971168262022, "eval_GEN Loss": 0.4852362275123596, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8407643312101911, "eval_PRM F1 AUC": 0.7236773179675223, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.4437427222728729, "eval_PRM NPV": 0.46875, "eval_PRM Precision": 0.8918918918918919, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9168870449066162, "eval_runtime": 56.7321, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 840 }, { "epoch": 0.07759197324414716, "grad_norm": 2.4546522919332583, "learning_rate": 1.2445502258219528e-06, "loss": 0.8936, "step": 841 }, { "epoch": 0.07768423480567409, "grad_norm": 1.7161177572020176, "learning_rate": 1.2445254057667783e-06, "loss": 0.8069, "step": 842 }, { "epoch": 0.07777649636720102, "grad_norm": 1.5790672985944891, "learning_rate": 1.2445005295692364e-06, "loss": 0.7169, "step": 843 }, { "epoch": 0.07786875792872794, "grad_norm": 2.013552860185453, "learning_rate": 1.2444755972315813e-06, "loss": 0.8245, "step": 844 }, { "epoch": 0.07796101949025487, "grad_norm": 2.1417414885459904, "learning_rate": 1.2444506087560725e-06, "loss": 0.8883, "step": 845 }, { "epoch": 0.07796101949025487, "eval_GEN Loss": 0.4868348240852356, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8280254777070064, "eval_PRM F1 AUC": 0.6959140911471975, "eval_PRM F1 Neg": 0.509090909090909, "eval_PRM Loss": 0.4720483124256134, "eval_PRM NPV": 0.4375, "eval_PRM Precision": 0.8783783783783784, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9293269515037537, "eval_runtime": 56.9438, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 845 }, { "epoch": 0.0780532810517818, "grad_norm": 1.8469790639648116, "learning_rate": 1.2444255641449746e-06, "loss": 0.8698, "step": 846 }, { "epoch": 0.07814554261330874, "grad_norm": 2.755446596183262, "learning_rate": 1.2444004634005572e-06, "loss": 0.7381, "step": 847 }, { "epoch": 0.07823780417483565, "grad_norm": 2.007426586044603, "learning_rate": 1.2443753065250947e-06, "loss": 0.696, "step": 848 }, { "epoch": 0.07833006573636259, "grad_norm": 1.6971518291669285, "learning_rate": 1.2443500935208673e-06, "loss": 0.7656, "step": 849 }, { "epoch": 0.07842232729788952, "grad_norm": 1.9358908564041117, "learning_rate": 1.244324824390159e-06, "loss": 0.8341, "step": 850 }, { "epoch": 0.07842232729788952, "eval_GEN Loss": 0.4880904257297516, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM Loss": 0.4468076825141907, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.943088948726654, "eval_runtime": 56.6384, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 850 }, { "epoch": 0.07851458885941645, "grad_norm": 1.9723772554221473, "learning_rate": 1.2442994991352604e-06, "loss": 0.7479, "step": 851 }, { "epoch": 0.07860685042094337, "grad_norm": 1.5806776439548738, "learning_rate": 1.2442741177584669e-06, "loss": 0.7837, "step": 852 }, { "epoch": 0.0786991119824703, "grad_norm": 3.5942277704877754, "learning_rate": 1.2442486802620776e-06, "loss": 0.8349, "step": 853 }, { "epoch": 0.07879137354399723, "grad_norm": 1.9765224349151842, "learning_rate": 1.2442231866483983e-06, "loss": 0.6078, "step": 854 }, { "epoch": 0.07888363510552417, "grad_norm": 3.481110541921185, "learning_rate": 1.2441976369197393e-06, "loss": 1.1207, "step": 855 }, { "epoch": 0.07888363510552417, "eval_GEN Loss": 0.4901587963104248, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.4273208677768707, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9876201748847961, "eval_runtime": 56.9564, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 855 }, { "epoch": 0.07897589666705108, "grad_norm": 1.5284528662332821, "learning_rate": 1.2441720310784157e-06, "loss": 0.7793, "step": 856 }, { "epoch": 0.07906815822857802, "grad_norm": 1.5133521433785049, "learning_rate": 1.244146369126748e-06, "loss": 0.6137, "step": 857 }, { "epoch": 0.07916041979010495, "grad_norm": 2.130285114985017, "learning_rate": 1.244120651067062e-06, "loss": 0.7553, "step": 858 }, { "epoch": 0.07925268135163188, "grad_norm": 2.0300028976770537, "learning_rate": 1.2440948769016879e-06, "loss": 0.6827, "step": 859 }, { "epoch": 0.0793449429131588, "grad_norm": 1.6635017425255172, "learning_rate": 1.2440690466329617e-06, "loss": 0.7518, "step": 860 }, { "epoch": 0.0793449429131588, "eval_GEN Loss": 0.490712970495224, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 Neg": 0.52, "eval_PRM Loss": 0.4272684156894684, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9701322317123413, "eval_runtime": 56.7977, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 860 }, { "epoch": 0.07943720447468573, "grad_norm": 2.504983146550541, "learning_rate": 1.244043160263224e-06, "loss": 0.7125, "step": 861 }, { "epoch": 0.07952946603621266, "grad_norm": 1.4474241072175298, "learning_rate": 1.2440172177948207e-06, "loss": 0.5333, "step": 862 }, { "epoch": 0.0796217275977396, "grad_norm": 1.6976002637301968, "learning_rate": 1.2439912192301027e-06, "loss": 0.7309, "step": 863 }, { "epoch": 0.07971398915926652, "grad_norm": 2.610885285690451, "learning_rate": 1.2439651645714263e-06, "loss": 0.9831, "step": 864 }, { "epoch": 0.07980625072079345, "grad_norm": 2.2277261457261646, "learning_rate": 1.2439390538211522e-06, "loss": 0.8019, "step": 865 }, { "epoch": 0.07980625072079345, "eval_GEN Loss": 0.49128982424736023, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.43341773748397827, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9430288672447205, "eval_runtime": 56.5487, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 865 }, { "epoch": 0.07989851228232038, "grad_norm": 2.0245463264697907, "learning_rate": 1.2439128869816468e-06, "loss": 0.8017, "step": 866 }, { "epoch": 0.07999077384384731, "grad_norm": 1.6616743102186426, "learning_rate": 1.2438866640552816e-06, "loss": 0.8502, "step": 867 }, { "epoch": 0.08008303540537423, "grad_norm": 1.9057241421259494, "learning_rate": 1.2438603850444328e-06, "loss": 0.8247, "step": 868 }, { "epoch": 0.08017529696690116, "grad_norm": 2.440056653745764, "learning_rate": 1.2438340499514817e-06, "loss": 0.8581, "step": 869 }, { "epoch": 0.0802675585284281, "grad_norm": 2.0871783888188493, "learning_rate": 1.243807658778815e-06, "loss": 0.8389, "step": 870 }, { "epoch": 0.0802675585284281, "eval_GEN Loss": 0.4900650382041931, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.42185112833976746, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.939723551273346, "eval_runtime": 56.657, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 870 }, { "epoch": 0.08035982008995503, "grad_norm": 2.167709794516737, "learning_rate": 1.243781211528824e-06, "loss": 0.8505, "step": 871 }, { "epoch": 0.08045208165148195, "grad_norm": 2.6216805950295323, "learning_rate": 1.243754708203906e-06, "loss": 0.9081, "step": 872 }, { "epoch": 0.08054434321300888, "grad_norm": 1.5561520009829226, "learning_rate": 1.243728148806462e-06, "loss": 0.8009, "step": 873 }, { "epoch": 0.08063660477453581, "grad_norm": 1.7864929931020381, "learning_rate": 1.2437015333388996e-06, "loss": 0.7929, "step": 874 }, { "epoch": 0.08072886633606274, "grad_norm": 2.4580123714254465, "learning_rate": 1.2436748618036302e-06, "loss": 0.8353, "step": 875 }, { "epoch": 0.08072886633606274, "eval_GEN Loss": 0.49164655804634094, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8427672955974843, "eval_PRM F1 AUC": 0.707962283918282, "eval_PRM F1 Neg": 0.5283018867924528, "eval_PRM Loss": 0.44592949748039246, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.881578947368421, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9358773827552795, "eval_runtime": 56.9863, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 875 }, { "epoch": 0.08082112789758966, "grad_norm": 1.8016659935710604, "learning_rate": 1.2436481342030712e-06, "loss": 0.6954, "step": 876 }, { "epoch": 0.0809133894591166, "grad_norm": 1.6708701334542464, "learning_rate": 1.2436213505396445e-06, "loss": 0.8919, "step": 877 }, { "epoch": 0.08100565102064353, "grad_norm": 1.5697716770569945, "learning_rate": 1.243594510815777e-06, "loss": 0.9492, "step": 878 }, { "epoch": 0.08109791258217046, "grad_norm": 1.7560814536415021, "learning_rate": 1.2435676150339016e-06, "loss": 0.8383, "step": 879 }, { "epoch": 0.08119017414369738, "grad_norm": 2.2993878777535506, "learning_rate": 1.243540663196455e-06, "loss": 0.7426, "step": 880 }, { "epoch": 0.08119017414369738, "eval_GEN Loss": 0.4915597438812256, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8427672955974843, "eval_PRM F1 AUC": 0.707962283918282, "eval_PRM F1 Neg": 0.5283018867924528, "eval_PRM Loss": 0.45518842339515686, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.881578947368421, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9466345906257629, "eval_runtime": 56.7621, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 880 }, { "epoch": 0.08128243570522431, "grad_norm": 2.425938989001129, "learning_rate": 1.2435136553058802e-06, "loss": 0.9346, "step": 881 }, { "epoch": 0.08137469726675124, "grad_norm": 2.1066464670940035, "learning_rate": 1.2434865913646242e-06, "loss": 0.957, "step": 882 }, { "epoch": 0.08146695882827817, "grad_norm": 2.2420383948380653, "learning_rate": 1.2434594713751398e-06, "loss": 1.0105, "step": 883 }, { "epoch": 0.08155922038980509, "grad_norm": 2.1763898304110336, "learning_rate": 1.2434322953398846e-06, "loss": 0.6929, "step": 884 }, { "epoch": 0.08165148195133203, "grad_norm": 1.790863741197223, "learning_rate": 1.2434050632613214e-06, "loss": 0.6883, "step": 885 }, { "epoch": 0.08165148195133203, "eval_GEN Loss": 0.49333953857421875, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8427672955974843, "eval_PRM F1 AUC": 0.707962283918282, "eval_PRM F1 Neg": 0.5283018867924528, "eval_PRM Loss": 0.4510464668273926, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.881578947368421, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9476562738418579, "eval_runtime": 55.8007, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 885 }, { "epoch": 0.08174374351285896, "grad_norm": 1.6524067640391467, "learning_rate": 1.243377775141918e-06, "loss": 0.7504, "step": 886 }, { "epoch": 0.08183600507438589, "grad_norm": 1.7549163735268902, "learning_rate": 1.2433504309841475e-06, "loss": 0.8734, "step": 887 }, { "epoch": 0.08192826663591281, "grad_norm": 1.887443067589934, "learning_rate": 1.2433230307904873e-06, "loss": 0.6943, "step": 888 }, { "epoch": 0.08202052819743974, "grad_norm": 1.5869128030746127, "learning_rate": 1.243295574563421e-06, "loss": 0.7765, "step": 889 }, { "epoch": 0.08211278975896667, "grad_norm": 1.5400141425545875, "learning_rate": 1.2432680623054363e-06, "loss": 0.7727, "step": 890 }, { "epoch": 0.08211278975896667, "eval_GEN Loss": 0.4944790005683899, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4337035119533539, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9912259578704834, "eval_runtime": 55.9741, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 890 }, { "epoch": 0.0822050513204936, "grad_norm": 1.979917657565039, "learning_rate": 1.2432404940190268e-06, "loss": 0.7471, "step": 891 }, { "epoch": 0.08229731288202052, "grad_norm": 3.301646440722295, "learning_rate": 1.2432128697066906e-06, "loss": 0.9991, "step": 892 }, { "epoch": 0.08238957444354746, "grad_norm": 1.6350141598657844, "learning_rate": 1.243185189370931e-06, "loss": 0.722, "step": 893 }, { "epoch": 0.08248183600507439, "grad_norm": 3.8710426053518883, "learning_rate": 1.2431574530142566e-06, "loss": 0.8502, "step": 894 }, { "epoch": 0.08257409756660132, "grad_norm": 1.7868172321055178, "learning_rate": 1.2431296606391808e-06, "loss": 0.64, "step": 895 }, { "epoch": 0.08257409756660132, "eval_GEN Loss": 0.4964035153388977, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM Loss": 0.43730512261390686, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 1.0329326391220093, "eval_runtime": 56.2022, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 895 }, { "epoch": 0.08266635912812824, "grad_norm": 2.8442898880016956, "learning_rate": 1.243101812248222e-06, "loss": 0.7484, "step": 896 }, { "epoch": 0.08275862068965517, "grad_norm": 1.9643221892455205, "learning_rate": 1.2430739078439043e-06, "loss": 0.6905, "step": 897 }, { "epoch": 0.0828508822511821, "grad_norm": 1.9929314050835263, "learning_rate": 1.2430459474287561e-06, "loss": 0.9033, "step": 898 }, { "epoch": 0.08294314381270904, "grad_norm": 2.12943498187798, "learning_rate": 1.2430179310053115e-06, "loss": 0.9438, "step": 899 }, { "epoch": 0.08303540537423595, "grad_norm": 2.636941537564535, "learning_rate": 1.2429898585761089e-06, "loss": 0.8624, "step": 900 }, { "epoch": 0.08303540537423595, "eval_GEN Loss": 0.49784040451049805, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.43831467628479004, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9543870091438293, "eval_runtime": 55.8343, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 900 }, { "epoch": 0.08312766693576289, "grad_norm": 2.4751278736954565, "learning_rate": 1.2429617301436927e-06, "loss": 0.8424, "step": 901 }, { "epoch": 0.08321992849728982, "grad_norm": 2.4505556014641576, "learning_rate": 1.242933545710612e-06, "loss": 0.9397, "step": 902 }, { "epoch": 0.08331219005881675, "grad_norm": 2.168359211408005, "learning_rate": 1.2429053052794208e-06, "loss": 0.9011, "step": 903 }, { "epoch": 0.08340445162034367, "grad_norm": 1.8215197239340088, "learning_rate": 1.2428770088526778e-06, "loss": 0.8597, "step": 904 }, { "epoch": 0.0834967131818706, "grad_norm": 1.4998595951461988, "learning_rate": 1.242848656432948e-06, "loss": 0.7586, "step": 905 }, { "epoch": 0.0834967131818706, "eval_GEN Loss": 0.4991404116153717, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.442852646112442, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9323317408561707, "eval_runtime": 55.809, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 905 }, { "epoch": 0.08358897474339753, "grad_norm": 2.448892605638469, "learning_rate": 1.2428202480228004e-06, "loss": 0.7082, "step": 906 }, { "epoch": 0.08368123630492447, "grad_norm": 2.0823511958510625, "learning_rate": 1.2427917836248095e-06, "loss": 0.8262, "step": 907 }, { "epoch": 0.08377349786645139, "grad_norm": 2.4923033408350985, "learning_rate": 1.2427632632415548e-06, "loss": 0.897, "step": 908 }, { "epoch": 0.08386575942797832, "grad_norm": 1.9198283211883294, "learning_rate": 1.2427346868756207e-06, "loss": 0.6094, "step": 909 }, { "epoch": 0.08395802098950525, "grad_norm": 2.0695183395171526, "learning_rate": 1.242706054529597e-06, "loss": 0.8529, "step": 910 }, { "epoch": 0.08395802098950525, "eval_GEN Loss": 0.4996287524700165, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.42069101333618164, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9454928040504456, "eval_runtime": 55.8764, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 910 }, { "epoch": 0.08405028255103218, "grad_norm": 1.778329862058544, "learning_rate": 1.2426773662060785e-06, "loss": 0.9364, "step": 911 }, { "epoch": 0.0841425441125591, "grad_norm": 1.4975012988149345, "learning_rate": 1.2426486219076647e-06, "loss": 0.7888, "step": 912 }, { "epoch": 0.08423480567408603, "grad_norm": 3.5460235175487056, "learning_rate": 1.2426198216369605e-06, "loss": 0.9086, "step": 913 }, { "epoch": 0.08432706723561297, "grad_norm": 1.4721525607859052, "learning_rate": 1.2425909653965759e-06, "loss": 0.7795, "step": 914 }, { "epoch": 0.0844193287971399, "grad_norm": 2.1330276691274728, "learning_rate": 1.242562053189126e-06, "loss": 0.7734, "step": 915 }, { "epoch": 0.0844193287971399, "eval_GEN Loss": 0.4994935095310211, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.4029008150100708, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9498196840286255, "eval_runtime": 55.8242, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 915 }, { "epoch": 0.08451159035866682, "grad_norm": 1.4857650700445841, "learning_rate": 1.2425330850172308e-06, "loss": 0.5915, "step": 916 }, { "epoch": 0.08460385192019375, "grad_norm": 2.5305604505637347, "learning_rate": 1.2425040608835154e-06, "loss": 0.8846, "step": 917 }, { "epoch": 0.08469611348172068, "grad_norm": 1.6612318143106672, "learning_rate": 1.24247498079061e-06, "loss": 0.7023, "step": 918 }, { "epoch": 0.08478837504324761, "grad_norm": 1.7376350497879325, "learning_rate": 1.24244584474115e-06, "loss": 0.8275, "step": 919 }, { "epoch": 0.08488063660477453, "grad_norm": 1.540593975695022, "learning_rate": 1.2424166527377757e-06, "loss": 0.7477, "step": 920 }, { "epoch": 0.08488063660477453, "eval_GEN Loss": 0.500395655632019, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.39217761158943176, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9426081776618958, "eval_runtime": 55.8493, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 920 }, { "epoch": 0.08497289816630146, "grad_norm": 2.9010946783351184, "learning_rate": 1.2423874047831326e-06, "loss": 0.9336, "step": 921 }, { "epoch": 0.0850651597278284, "grad_norm": 2.4788366402222763, "learning_rate": 1.2423581008798707e-06, "loss": 0.8536, "step": 922 }, { "epoch": 0.08515742128935533, "grad_norm": 1.7633558621672578, "learning_rate": 1.2423287410306462e-06, "loss": 0.7852, "step": 923 }, { "epoch": 0.08524968285088225, "grad_norm": 1.5975516766632853, "learning_rate": 1.2422993252381195e-06, "loss": 0.8795, "step": 924 }, { "epoch": 0.08534194441240918, "grad_norm": 1.9115089431244583, "learning_rate": 1.2422698535049563e-06, "loss": 0.8315, "step": 925 }, { "epoch": 0.08534194441240918, "eval_GEN Loss": 0.49908775091171265, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.39852482080459595, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9270432591438293, "eval_runtime": 55.8449, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 925 }, { "epoch": 0.08543420597393611, "grad_norm": 2.376237572356329, "learning_rate": 1.2422403258338275e-06, "loss": 0.9664, "step": 926 }, { "epoch": 0.08552646753546304, "grad_norm": 1.7224706922713144, "learning_rate": 1.2422107422274086e-06, "loss": 0.9022, "step": 927 }, { "epoch": 0.08561872909698996, "grad_norm": 1.7754361881681706, "learning_rate": 1.242181102688381e-06, "loss": 0.9474, "step": 928 }, { "epoch": 0.0857109906585169, "grad_norm": 2.44837687350161, "learning_rate": 1.2421514072194302e-06, "loss": 0.914, "step": 929 }, { "epoch": 0.08580325222004383, "grad_norm": 2.06445320624774, "learning_rate": 1.2421216558232474e-06, "loss": 0.9022, "step": 930 }, { "epoch": 0.08580325222004383, "eval_GEN Loss": 0.49789413809776306, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4136628806591034, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9203726053237915, "eval_runtime": 55.885, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 930 }, { "epoch": 0.08589551378157076, "grad_norm": 2.694014836265426, "learning_rate": 1.242091848502529e-06, "loss": 0.8918, "step": 931 }, { "epoch": 0.08598777534309768, "grad_norm": 1.6161159496644908, "learning_rate": 1.2420619852599758e-06, "loss": 0.9424, "step": 932 }, { "epoch": 0.08608003690462461, "grad_norm": 2.2565358418890367, "learning_rate": 1.2420320660982944e-06, "loss": 0.7794, "step": 933 }, { "epoch": 0.08617229846615154, "grad_norm": 2.1082931556063547, "learning_rate": 1.2420020910201958e-06, "loss": 0.8659, "step": 934 }, { "epoch": 0.08626456002767847, "grad_norm": 1.616588521436696, "learning_rate": 1.2419720600283966e-06, "loss": 0.8662, "step": 935 }, { "epoch": 0.08626456002767847, "eval_GEN Loss": 0.4949224293231964, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.864516129032258, "eval_PRM F1 AUC": 0.7949188056574124, "eval_PRM F1 Neg": 0.631578947368421, "eval_PRM Loss": 0.42087623476982117, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.9305555555555556, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9172475934028625, "eval_runtime": 55.6459, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 935 }, { "epoch": 0.0863568215892054, "grad_norm": 2.2089355564102737, "learning_rate": 1.2419419731256182e-06, "loss": 0.753, "step": 936 }, { "epoch": 0.08644908315073233, "grad_norm": 1.693462533837462, "learning_rate": 1.241911830314587e-06, "loss": 0.636, "step": 937 }, { "epoch": 0.08654134471225926, "grad_norm": 2.3068665088424654, "learning_rate": 1.2418816315980348e-06, "loss": 0.6942, "step": 938 }, { "epoch": 0.08663360627378619, "grad_norm": 1.5593779345836822, "learning_rate": 1.2418513769786982e-06, "loss": 0.8544, "step": 939 }, { "epoch": 0.08672586783531311, "grad_norm": 2.0972921187878755, "learning_rate": 1.241821066459319e-06, "loss": 0.817, "step": 940 }, { "epoch": 0.08672586783531311, "eval_GEN Loss": 0.49334296584129333, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.40967661142349243, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9105167984962463, "eval_runtime": 55.8201, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 940 }, { "epoch": 0.08681812939684004, "grad_norm": 3.396534800564875, "learning_rate": 1.2417907000426435e-06, "loss": 1.0753, "step": 941 }, { "epoch": 0.08691039095836697, "grad_norm": 1.4537018426734836, "learning_rate": 1.241760277731424e-06, "loss": 0.8919, "step": 942 }, { "epoch": 0.0870026525198939, "grad_norm": 2.1880471890812188, "learning_rate": 1.2417297995284176e-06, "loss": 0.9027, "step": 943 }, { "epoch": 0.08709491408142082, "grad_norm": 2.1748698411085376, "learning_rate": 1.241699265436386e-06, "loss": 0.9034, "step": 944 }, { "epoch": 0.08718717564294776, "grad_norm": 2.0742997899946753, "learning_rate": 1.241668675458096e-06, "loss": 0.9607, "step": 945 }, { "epoch": 0.08718717564294776, "eval_GEN Loss": 0.49398431181907654, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.40069958567619324, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9083533883094788, "eval_runtime": 55.8051, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 945 }, { "epoch": 0.08727943720447469, "grad_norm": 1.68528997969868, "learning_rate": 1.2416380295963202e-06, "loss": 0.7965, "step": 946 }, { "epoch": 0.08737169876600162, "grad_norm": 1.6895554469366851, "learning_rate": 1.2416073278538354e-06, "loss": 0.6948, "step": 947 }, { "epoch": 0.08746396032752854, "grad_norm": 1.863158177970021, "learning_rate": 1.2415765702334239e-06, "loss": 0.8556, "step": 948 }, { "epoch": 0.08755622188905547, "grad_norm": 1.8045272780669495, "learning_rate": 1.2415457567378735e-06, "loss": 0.7606, "step": 949 }, { "epoch": 0.0876484834505824, "grad_norm": 2.46053200857306, "learning_rate": 1.241514887369976e-06, "loss": 0.6749, "step": 950 }, { "epoch": 0.0876484834505824, "eval_GEN Loss": 0.4946034848690033, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.40132224559783936, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9060096144676208, "eval_runtime": 55.8463, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 950 }, { "epoch": 0.08774074501210934, "grad_norm": 1.7453560866782651, "learning_rate": 1.2414839621325288e-06, "loss": 0.8106, "step": 951 }, { "epoch": 0.08783300657363625, "grad_norm": 2.327415032945926, "learning_rate": 1.2414529810283348e-06, "loss": 1.0471, "step": 952 }, { "epoch": 0.08792526813516319, "grad_norm": 1.5499009356140918, "learning_rate": 1.2414219440602012e-06, "loss": 0.7972, "step": 953 }, { "epoch": 0.08801752969669012, "grad_norm": 2.675616280773306, "learning_rate": 1.2413908512309408e-06, "loss": 0.8065, "step": 954 }, { "epoch": 0.08810979125821705, "grad_norm": 2.68357802713316, "learning_rate": 1.2413597025433712e-06, "loss": 0.9762, "step": 955 }, { "epoch": 0.08810979125821705, "eval_GEN Loss": 0.49337396025657654, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.405143678188324, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9100961685180664, "eval_runtime": 55.9096, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 955 }, { "epoch": 0.08820205281974397, "grad_norm": 1.704720640234973, "learning_rate": 1.2413284980003154e-06, "loss": 0.7031, "step": 956 }, { "epoch": 0.0882943143812709, "grad_norm": 2.1369641797328924, "learning_rate": 1.241297237604601e-06, "loss": 1.029, "step": 957 }, { "epoch": 0.08838657594279783, "grad_norm": 2.0579810955328384, "learning_rate": 1.2412659213590607e-06, "loss": 0.9636, "step": 958 }, { "epoch": 0.08847883750432477, "grad_norm": 1.2458359657878737, "learning_rate": 1.2412345492665326e-06, "loss": 0.582, "step": 959 }, { "epoch": 0.08857109906585169, "grad_norm": 1.906453396979652, "learning_rate": 1.2412031213298597e-06, "loss": 0.9057, "step": 960 }, { "epoch": 0.08857109906585169, "eval_GEN Loss": 0.49197861552238464, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4226519763469696, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.914843738079071, "eval_runtime": 55.9482, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 960 }, { "epoch": 0.08866336062737862, "grad_norm": 2.544046625569359, "learning_rate": 1.24117163755189e-06, "loss": 0.7873, "step": 961 }, { "epoch": 0.08875562218890555, "grad_norm": 2.315145397439504, "learning_rate": 1.2411400979354769e-06, "loss": 0.8408, "step": 962 }, { "epoch": 0.08884788375043248, "grad_norm": 1.4001561441990045, "learning_rate": 1.241108502483478e-06, "loss": 0.6308, "step": 963 }, { "epoch": 0.0889401453119594, "grad_norm": 2.018304603971791, "learning_rate": 1.2410768511987568e-06, "loss": 0.654, "step": 964 }, { "epoch": 0.08903240687348633, "grad_norm": 1.914867302083205, "learning_rate": 1.2410451440841817e-06, "loss": 0.7151, "step": 965 }, { "epoch": 0.08903240687348633, "eval_GEN Loss": 0.493167906999588, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4310265779495239, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.926682710647583, "eval_runtime": 55.9206, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 965 }, { "epoch": 0.08912466843501327, "grad_norm": 1.5606454945037835, "learning_rate": 1.241013381142626e-06, "loss": 0.8283, "step": 966 }, { "epoch": 0.0892169299965402, "grad_norm": 5.223071926553168, "learning_rate": 1.240981562376968e-06, "loss": 0.7292, "step": 967 }, { "epoch": 0.08930919155806712, "grad_norm": 1.5113562039472168, "learning_rate": 1.2409496877900914e-06, "loss": 0.7259, "step": 968 }, { "epoch": 0.08940145311959405, "grad_norm": 2.5214760068160142, "learning_rate": 1.2409177573848846e-06, "loss": 0.8092, "step": 969 }, { "epoch": 0.08949371468112098, "grad_norm": 2.0447430483082933, "learning_rate": 1.2408857711642412e-06, "loss": 0.9398, "step": 970 }, { "epoch": 0.08949371468112098, "eval_GEN Loss": 0.49091872572898865, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.42805832624435425, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9384615421295166, "eval_runtime": 55.9109, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 970 }, { "epoch": 0.08958597624264791, "grad_norm": 1.570560978823499, "learning_rate": 1.2408537291310595e-06, "loss": 0.7814, "step": 971 }, { "epoch": 0.08967823780417483, "grad_norm": 2.2696024022161714, "learning_rate": 1.2408216312882437e-06, "loss": 0.9953, "step": 972 }, { "epoch": 0.08977049936570176, "grad_norm": 1.4593275503611438, "learning_rate": 1.2407894776387023e-06, "loss": 0.7604, "step": 973 }, { "epoch": 0.0898627609272287, "grad_norm": 2.3007610096129274, "learning_rate": 1.240757268185349e-06, "loss": 0.9001, "step": 974 }, { "epoch": 0.08995502248875563, "grad_norm": 2.2448516620611816, "learning_rate": 1.2407250029311032e-06, "loss": 1.0175, "step": 975 }, { "epoch": 0.08995502248875563, "eval_GEN Loss": 0.49143147468566895, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8461538461538461, "eval_PRM F1 AUC": 0.7454164484023049, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.46443119645118713, "eval_PRM NPV": 0.48484848484848486, "eval_PRM Precision": 0.9041095890410958, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9454326629638672, "eval_runtime": 55.7019, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 975 }, { "epoch": 0.09004728405028255, "grad_norm": 2.210950991950348, "learning_rate": 1.2406926818788884e-06, "loss": 0.8523, "step": 976 }, { "epoch": 0.09013954561180948, "grad_norm": 1.6662669941233985, "learning_rate": 1.2406603050316334e-06, "loss": 0.7193, "step": 977 }, { "epoch": 0.09023180717333641, "grad_norm": 2.6173364182712073, "learning_rate": 1.2406278723922727e-06, "loss": 0.9668, "step": 978 }, { "epoch": 0.09032406873486334, "grad_norm": 2.578586937335509, "learning_rate": 1.2405953839637453e-06, "loss": 0.9479, "step": 979 }, { "epoch": 0.09041633029639026, "grad_norm": 3.7347857967613374, "learning_rate": 1.240562839748995e-06, "loss": 0.8276, "step": 980 }, { "epoch": 0.09041633029639026, "eval_GEN Loss": 0.4923248887062073, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8461538461538461, "eval_PRM F1 AUC": 0.7454164484023049, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4941073954105377, "eval_PRM NPV": 0.48484848484848486, "eval_PRM Precision": 0.9041095890410958, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.96484375, "eval_runtime": 56.725, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 980 }, { "epoch": 0.0905085918579172, "grad_norm": 2.638901943907216, "learning_rate": 1.2405302397509713e-06, "loss": 0.7783, "step": 981 }, { "epoch": 0.09060085341944413, "grad_norm": 2.1376484634956294, "learning_rate": 1.2404975839726285e-06, "loss": 0.9446, "step": 982 }, { "epoch": 0.09069311498097106, "grad_norm": 1.9396715223441883, "learning_rate": 1.2404648724169258e-06, "loss": 0.9514, "step": 983 }, { "epoch": 0.09078537654249798, "grad_norm": 1.7578422227243191, "learning_rate": 1.2404321050868276e-06, "loss": 0.7279, "step": 984 }, { "epoch": 0.09087763810402491, "grad_norm": 1.8642313172315839, "learning_rate": 1.2403992819853033e-06, "loss": 0.7766, "step": 985 }, { "epoch": 0.09087763810402491, "eval_GEN Loss": 0.4914352297782898, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.45686113834381104, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9616586565971375, "eval_runtime": 56.8705, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 985 }, { "epoch": 0.09096989966555184, "grad_norm": 1.9382213328481714, "learning_rate": 1.2403664031153274e-06, "loss": 0.9468, "step": 986 }, { "epoch": 0.09106216122707878, "grad_norm": 1.7634110586373042, "learning_rate": 1.2403334684798796e-06, "loss": 0.9205, "step": 987 }, { "epoch": 0.0911544227886057, "grad_norm": 1.533406115187923, "learning_rate": 1.2403004780819441e-06, "loss": 0.8005, "step": 988 }, { "epoch": 0.09124668435013263, "grad_norm": 2.0331736276058496, "learning_rate": 1.240267431924511e-06, "loss": 0.8553, "step": 989 }, { "epoch": 0.09133894591165956, "grad_norm": 1.5357846151003822, "learning_rate": 1.2402343300105746e-06, "loss": 0.7107, "step": 990 }, { "epoch": 0.09133894591165956, "eval_GEN Loss": 0.49173447489738464, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4222582280635834, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9712740182876587, "eval_runtime": 56.771, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 990 }, { "epoch": 0.09143120747318649, "grad_norm": 1.786324163487861, "learning_rate": 1.2402011723431348e-06, "loss": 0.7631, "step": 991 }, { "epoch": 0.09152346903471341, "grad_norm": 1.2584966725554103, "learning_rate": 1.2401679589251967e-06, "loss": 0.7694, "step": 992 }, { "epoch": 0.09161573059624034, "grad_norm": 1.7125418298951514, "learning_rate": 1.2401346897597696e-06, "loss": 0.7168, "step": 993 }, { "epoch": 0.09170799215776727, "grad_norm": 4.6677885891605255, "learning_rate": 1.2401013648498687e-06, "loss": 1.0056, "step": 994 }, { "epoch": 0.0918002537192942, "grad_norm": 2.096807475712761, "learning_rate": 1.240067984198514e-06, "loss": 1.0276, "step": 995 }, { "epoch": 0.0918002537192942, "eval_GEN Loss": 0.494640052318573, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4195377826690674, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9857572317123413, "eval_runtime": 56.692, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 995 }, { "epoch": 0.09189251528082112, "grad_norm": 1.3429032844712543, "learning_rate": 1.2400345478087306e-06, "loss": 0.736, "step": 996 }, { "epoch": 0.09198477684234806, "grad_norm": 1.5727366523808957, "learning_rate": 1.240001055683548e-06, "loss": 0.7833, "step": 997 }, { "epoch": 0.09207703840387499, "grad_norm": 1.3380310355741822, "learning_rate": 1.2399675078260021e-06, "loss": 0.6486, "step": 998 }, { "epoch": 0.09216929996540192, "grad_norm": 1.6976269992176125, "learning_rate": 1.2399339042391326e-06, "loss": 0.8231, "step": 999 }, { "epoch": 0.09226156152692884, "grad_norm": 1.3615470809281198, "learning_rate": 1.2399002449259845e-06, "loss": 0.7108, "step": 1000 }, { "epoch": 0.09226156152692884, "eval_GEN Loss": 0.49521714448928833, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM Loss": 0.42610013484954834, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9921875, "eval_runtime": 56.8655, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1000 }, { "epoch": 0.09235382308845577, "grad_norm": 3.1917917311136788, "learning_rate": 1.2398665298896086e-06, "loss": 0.9791, "step": 1001 }, { "epoch": 0.0924460846499827, "grad_norm": 1.2435109862977927, "learning_rate": 1.2398327591330599e-06, "loss": 0.6088, "step": 1002 }, { "epoch": 0.09253834621150964, "grad_norm": 1.6375665664287087, "learning_rate": 1.2397989326593988e-06, "loss": 0.7379, "step": 1003 }, { "epoch": 0.09263060777303656, "grad_norm": 1.8619757019705074, "learning_rate": 1.2397650504716907e-06, "loss": 0.9372, "step": 1004 }, { "epoch": 0.09272286933456349, "grad_norm": 2.0115412373645825, "learning_rate": 1.239731112573006e-06, "loss": 0.8765, "step": 1005 }, { "epoch": 0.09272286933456349, "eval_GEN Loss": 0.4953429698944092, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4615454077720642, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9923076629638672, "eval_runtime": 56.4484, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 1005 }, { "epoch": 0.09281513089609042, "grad_norm": 1.8999889847203806, "learning_rate": 1.2396971189664202e-06, "loss": 0.8761, "step": 1006 }, { "epoch": 0.09290739245761735, "grad_norm": 1.5805870123343921, "learning_rate": 1.2396630696550143e-06, "loss": 0.5916, "step": 1007 }, { "epoch": 0.09299965401914427, "grad_norm": 1.7449783247013633, "learning_rate": 1.2396289646418733e-06, "loss": 0.7875, "step": 1008 }, { "epoch": 0.0930919155806712, "grad_norm": 1.6141993052024273, "learning_rate": 1.2395948039300882e-06, "loss": 0.7338, "step": 1009 }, { "epoch": 0.09318417714219814, "grad_norm": 1.8277815860684463, "learning_rate": 1.2395605875227542e-06, "loss": 0.7331, "step": 1010 }, { "epoch": 0.09318417714219814, "eval_GEN Loss": 0.4921077489852905, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8407643312101911, "eval_PRM F1 AUC": 0.7236773179675223, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.46621182560920715, "eval_PRM NPV": 0.46875, "eval_PRM Precision": 0.8918918918918919, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9893629550933838, "eval_runtime": 55.7417, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 1010 }, { "epoch": 0.09327643870372505, "grad_norm": 1.856528550567078, "learning_rate": 1.239526315422973e-06, "loss": 0.744, "step": 1011 }, { "epoch": 0.09336870026525199, "grad_norm": 1.5903192366250005, "learning_rate": 1.2394919876338494e-06, "loss": 0.8565, "step": 1012 }, { "epoch": 0.09346096182677892, "grad_norm": 2.241953738337567, "learning_rate": 1.2394576041584946e-06, "loss": 0.8878, "step": 1013 }, { "epoch": 0.09355322338830585, "grad_norm": 1.701638442750919, "learning_rate": 1.239423165000025e-06, "loss": 0.8068, "step": 1014 }, { "epoch": 0.09364548494983277, "grad_norm": 2.8186542530982095, "learning_rate": 1.2393886701615607e-06, "loss": 0.8443, "step": 1015 }, { "epoch": 0.09364548494983277, "eval_GEN Loss": 0.4892708659172058, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.46163588762283325, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9852163195610046, "eval_runtime": 55.7734, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 1015 }, { "epoch": 0.0937377465113597, "grad_norm": 1.7717725144662118, "learning_rate": 1.239354119646228e-06, "loss": 0.8047, "step": 1016 }, { "epoch": 0.09383000807288663, "grad_norm": 1.8512229970673009, "learning_rate": 1.2393195134571582e-06, "loss": 0.6764, "step": 1017 }, { "epoch": 0.09392226963441357, "grad_norm": 2.54185236358672, "learning_rate": 1.239284851597487e-06, "loss": 1.0241, "step": 1018 }, { "epoch": 0.09401453119594048, "grad_norm": 2.8263319126756703, "learning_rate": 1.2392501340703557e-06, "loss": 0.8761, "step": 1019 }, { "epoch": 0.09410679275746742, "grad_norm": 2.0255142275269042, "learning_rate": 1.2392153608789103e-06, "loss": 0.9198, "step": 1020 }, { "epoch": 0.09410679275746742, "eval_GEN Loss": 0.4873213768005371, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.46061861515045166, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9809495210647583, "eval_runtime": 55.9561, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1020 }, { "epoch": 0.09419905431899435, "grad_norm": 2.6503757314184373, "learning_rate": 1.2391805320263023e-06, "loss": 0.7316, "step": 1021 }, { "epoch": 0.09429131588052128, "grad_norm": 1.7216110902862465, "learning_rate": 1.2391456475156876e-06, "loss": 0.8213, "step": 1022 }, { "epoch": 0.0943835774420482, "grad_norm": 1.9917097770601746, "learning_rate": 1.239110707350228e-06, "loss": 0.5839, "step": 1023 }, { "epoch": 0.09447583900357513, "grad_norm": 2.115845903684835, "learning_rate": 1.2390757115330889e-06, "loss": 0.8723, "step": 1024 }, { "epoch": 0.09456810056510206, "grad_norm": 1.985374323924196, "learning_rate": 1.2390406600674427e-06, "loss": 0.76, "step": 1025 }, { "epoch": 0.09456810056510206, "eval_GEN Loss": 0.4882165491580963, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.45601755380630493, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9912259578704834, "eval_runtime": 55.8091, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 1025 }, { "epoch": 0.094660362126629, "grad_norm": 2.0338184228229776, "learning_rate": 1.239005552956465e-06, "loss": 0.7357, "step": 1026 }, { "epoch": 0.09475262368815592, "grad_norm": 1.6369499769315794, "learning_rate": 1.238970390203338e-06, "loss": 0.8611, "step": 1027 }, { "epoch": 0.09484488524968285, "grad_norm": 2.3335893973512776, "learning_rate": 1.2389351718112476e-06, "loss": 1.027, "step": 1028 }, { "epoch": 0.09493714681120978, "grad_norm": 2.1131556795739788, "learning_rate": 1.2388998977833857e-06, "loss": 0.6919, "step": 1029 }, { "epoch": 0.09502940837273671, "grad_norm": 3.9803852639076336, "learning_rate": 1.2388645681229486e-06, "loss": 0.9372, "step": 1030 }, { "epoch": 0.09502940837273671, "eval_GEN Loss": 0.4888576865196228, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.45159152150154114, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9866586327552795, "eval_runtime": 55.8556, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1030 }, { "epoch": 0.09512166993426363, "grad_norm": 2.674260347679863, "learning_rate": 1.2388291828331383e-06, "loss": 0.6835, "step": 1031 }, { "epoch": 0.09521393149579056, "grad_norm": 1.4120791571535167, "learning_rate": 1.238793741917161e-06, "loss": 0.7706, "step": 1032 }, { "epoch": 0.0953061930573175, "grad_norm": 1.7594840517952317, "learning_rate": 1.238758245378229e-06, "loss": 0.7101, "step": 1033 }, { "epoch": 0.09539845461884443, "grad_norm": 2.4218671387046653, "learning_rate": 1.2387226932195587e-06, "loss": 0.8659, "step": 1034 }, { "epoch": 0.09549071618037135, "grad_norm": 1.7849933037963401, "learning_rate": 1.2386870854443719e-06, "loss": 0.8784, "step": 1035 }, { "epoch": 0.09549071618037135, "eval_GEN Loss": 0.48858630657196045, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.46425315737724304, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9759014248847961, "eval_runtime": 55.7373, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 1035 }, { "epoch": 0.09558297774189828, "grad_norm": 2.115845187930869, "learning_rate": 1.2386514220558953e-06, "loss": 0.6927, "step": 1036 }, { "epoch": 0.09567523930342521, "grad_norm": 1.6759229154986803, "learning_rate": 1.2386157030573608e-06, "loss": 0.7528, "step": 1037 }, { "epoch": 0.09576750086495214, "grad_norm": 1.7471625660255927, "learning_rate": 1.238579928452006e-06, "loss": 0.8052, "step": 1038 }, { "epoch": 0.09585976242647906, "grad_norm": 1.8974624367917863, "learning_rate": 1.238544098243072e-06, "loss": 0.8325, "step": 1039 }, { "epoch": 0.095952023988006, "grad_norm": 2.272234491171637, "learning_rate": 1.2385082124338058e-06, "loss": 0.8701, "step": 1040 }, { "epoch": 0.095952023988006, "eval_GEN Loss": 0.4879036843776703, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.46317258477211, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9808894395828247, "eval_runtime": 55.8278, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1040 }, { "epoch": 0.09604428554953293, "grad_norm": 1.9479029261980405, "learning_rate": 1.23847227102746e-06, "loss": 0.8885, "step": 1041 }, { "epoch": 0.09613654711105986, "grad_norm": 1.5555454438192333, "learning_rate": 1.2384362740272913e-06, "loss": 0.6559, "step": 1042 }, { "epoch": 0.09622880867258678, "grad_norm": 1.5042057654066376, "learning_rate": 1.238400221436562e-06, "loss": 0.7191, "step": 1043 }, { "epoch": 0.09632107023411371, "grad_norm": 1.897573278510063, "learning_rate": 1.238364113258539e-06, "loss": 0.8611, "step": 1044 }, { "epoch": 0.09641333179564064, "grad_norm": 1.6709830910703745, "learning_rate": 1.2383279494964948e-06, "loss": 0.746, "step": 1045 }, { "epoch": 0.09641333179564064, "eval_GEN Loss": 0.4869081974029541, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM Loss": 0.4486120343208313, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9861778616905212, "eval_runtime": 55.9687, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1045 }, { "epoch": 0.09650559335716757, "grad_norm": 1.7310991194741818, "learning_rate": 1.2382917301537061e-06, "loss": 0.7717, "step": 1046 }, { "epoch": 0.09659785491869449, "grad_norm": 1.5023268924529263, "learning_rate": 1.2382554552334558e-06, "loss": 0.6981, "step": 1047 }, { "epoch": 0.09669011648022142, "grad_norm": 3.330774683342622, "learning_rate": 1.2382191247390307e-06, "loss": 0.945, "step": 1048 }, { "epoch": 0.09678237804174836, "grad_norm": 1.3849945323861854, "learning_rate": 1.2381827386737234e-06, "loss": 0.75, "step": 1049 }, { "epoch": 0.09687463960327529, "grad_norm": 2.560950054271451, "learning_rate": 1.238146297040831e-06, "loss": 0.8057, "step": 1050 }, { "epoch": 0.09687463960327529, "eval_GEN Loss": 0.4846045970916748, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM Loss": 0.4420788288116455, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 1.0069711208343506, "eval_runtime": 56.3492, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 1050 }, { "epoch": 0.09696690116480221, "grad_norm": 1.2051478050447069, "learning_rate": 1.2381097998436562e-06, "loss": 0.7035, "step": 1051 }, { "epoch": 0.09705916272632914, "grad_norm": 1.6971767462504381, "learning_rate": 1.2380732470855062e-06, "loss": 0.7376, "step": 1052 }, { "epoch": 0.09715142428785607, "grad_norm": 2.5051400000537924, "learning_rate": 1.2380366387696935e-06, "loss": 0.9175, "step": 1053 }, { "epoch": 0.097243685849383, "grad_norm": 1.9790729909551097, "learning_rate": 1.2379999748995358e-06, "loss": 0.7782, "step": 1054 }, { "epoch": 0.09733594741090992, "grad_norm": 1.5143617905400066, "learning_rate": 1.2379632554783553e-06, "loss": 0.5763, "step": 1055 }, { "epoch": 0.09733594741090992, "eval_GEN Loss": 0.4831518232822418, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM Loss": 0.4305679500102997, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9697115421295166, "eval_runtime": 56.2017, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 1055 }, { "epoch": 0.09742820897243686, "grad_norm": 2.1927628921543154, "learning_rate": 1.23792648050948e-06, "loss": 0.9713, "step": 1056 }, { "epoch": 0.09752047053396379, "grad_norm": 1.7522898262035198, "learning_rate": 1.2378896499962423e-06, "loss": 0.7826, "step": 1057 }, { "epoch": 0.09761273209549072, "grad_norm": 2.464980681638915, "learning_rate": 1.2378527639419795e-06, "loss": 0.9874, "step": 1058 }, { "epoch": 0.09770499365701764, "grad_norm": 2.5801590379761583, "learning_rate": 1.237815822350035e-06, "loss": 0.8722, "step": 1059 }, { "epoch": 0.09779725521854457, "grad_norm": 1.6227529227120872, "learning_rate": 1.2377788252237558e-06, "loss": 0.7129, "step": 1060 }, { "epoch": 0.09779725521854457, "eval_GEN Loss": 0.48260170221328735, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4441496431827545, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9358773827552795, "eval_runtime": 56.0349, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1060 }, { "epoch": 0.0978895167800715, "grad_norm": 2.0915950164198045, "learning_rate": 1.237741772566495e-06, "loss": 0.8365, "step": 1061 }, { "epoch": 0.09798177834159844, "grad_norm": 2.209002448171688, "learning_rate": 1.2377046643816104e-06, "loss": 0.879, "step": 1062 }, { "epoch": 0.09807403990312535, "grad_norm": 2.0767325247321, "learning_rate": 1.2376675006724644e-06, "loss": 0.8205, "step": 1063 }, { "epoch": 0.09816630146465229, "grad_norm": 1.6383269233868047, "learning_rate": 1.2376302814424255e-06, "loss": 0.7769, "step": 1064 }, { "epoch": 0.09825856302617922, "grad_norm": 1.335123538600553, "learning_rate": 1.237593006694866e-06, "loss": 0.7526, "step": 1065 }, { "epoch": 0.09825856302617922, "eval_GEN Loss": 0.4857008755207062, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.864516129032258, "eval_PRM F1 AUC": 0.7949188056574124, "eval_PRM F1 Neg": 0.631578947368421, "eval_PRM Loss": 0.48533496260643005, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.9305555555555556, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.954026460647583, "eval_runtime": 55.9249, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1065 }, { "epoch": 0.09835082458770615, "grad_norm": 1.5668643122578736, "learning_rate": 1.2375556764331641e-06, "loss": 0.6694, "step": 1066 }, { "epoch": 0.09844308614923307, "grad_norm": 2.265192148242357, "learning_rate": 1.2375182906607025e-06, "loss": 0.8344, "step": 1067 }, { "epoch": 0.09853534771076, "grad_norm": 3.331332787875964, "learning_rate": 1.2374808493808693e-06, "loss": 0.914, "step": 1068 }, { "epoch": 0.09862760927228693, "grad_norm": 3.0449674069849713, "learning_rate": 1.2374433525970576e-06, "loss": 0.9626, "step": 1069 }, { "epoch": 0.09871987083381387, "grad_norm": 3.495290514797651, "learning_rate": 1.2374058003126651e-06, "loss": 0.7489, "step": 1070 }, { "epoch": 0.09871987083381387, "eval_GEN Loss": 0.48816636204719543, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.864516129032258, "eval_PRM F1 AUC": 0.7949188056574124, "eval_PRM F1 Neg": 0.631578947368421, "eval_PRM Loss": 0.4851211607456207, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.9305555555555556, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9559495449066162, "eval_runtime": 55.9455, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1070 }, { "epoch": 0.09881213239534078, "grad_norm": 2.768920860049011, "learning_rate": 1.2373681925310952e-06, "loss": 0.8713, "step": 1071 }, { "epoch": 0.09890439395686772, "grad_norm": 2.326404515885457, "learning_rate": 1.2373305292557558e-06, "loss": 0.5683, "step": 1072 }, { "epoch": 0.09899665551839465, "grad_norm": 1.707817515880418, "learning_rate": 1.23729281049006e-06, "loss": 0.6518, "step": 1073 }, { "epoch": 0.09908891707992158, "grad_norm": 2.1661936872492045, "learning_rate": 1.2372550362374258e-06, "loss": 0.7883, "step": 1074 }, { "epoch": 0.0991811786414485, "grad_norm": 1.5784542421180987, "learning_rate": 1.2372172065012768e-06, "loss": 0.7391, "step": 1075 }, { "epoch": 0.0991811786414485, "eval_GEN Loss": 0.48966479301452637, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.42942070960998535, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9418870210647583, "eval_runtime": 55.9779, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1075 }, { "epoch": 0.09927344020297543, "grad_norm": 2.318419152657595, "learning_rate": 1.2371793212850406e-06, "loss": 1.0127, "step": 1076 }, { "epoch": 0.09936570176450236, "grad_norm": 1.5615375184288336, "learning_rate": 1.237141380592151e-06, "loss": 0.7858, "step": 1077 }, { "epoch": 0.0994579633260293, "grad_norm": 3.6175963867550807, "learning_rate": 1.2371033844260457e-06, "loss": 0.85, "step": 1078 }, { "epoch": 0.09955022488755622, "grad_norm": 2.180342768126879, "learning_rate": 1.2370653327901685e-06, "loss": 0.779, "step": 1079 }, { "epoch": 0.09964248644908315, "grad_norm": 1.7449433978213127, "learning_rate": 1.2370272256879673e-06, "loss": 0.8243, "step": 1080 }, { "epoch": 0.09964248644908315, "eval_GEN Loss": 0.49025124311447144, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4073673486709595, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9507211446762085, "eval_runtime": 56.1036, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1080 }, { "epoch": 0.09973474801061008, "grad_norm": 2.920875514089996, "learning_rate": 1.2369890631228956e-06, "loss": 1.0256, "step": 1081 }, { "epoch": 0.09982700957213701, "grad_norm": 2.224332763254484, "learning_rate": 1.2369508450984115e-06, "loss": 0.6702, "step": 1082 }, { "epoch": 0.09991927113366393, "grad_norm": 1.545276626196894, "learning_rate": 1.2369125716179789e-06, "loss": 0.7714, "step": 1083 }, { "epoch": 0.10001153269519086, "grad_norm": 1.6531163183487245, "learning_rate": 1.2368742426850658e-06, "loss": 0.7989, "step": 1084 }, { "epoch": 0.1001037942567178, "grad_norm": 2.400449458139153, "learning_rate": 1.2368358583031457e-06, "loss": 0.9417, "step": 1085 }, { "epoch": 0.1001037942567178, "eval_GEN Loss": 0.4873465299606323, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.41614651679992676, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9508413672447205, "eval_runtime": 56.9944, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1085 }, { "epoch": 0.10019605581824473, "grad_norm": 2.397450377181036, "learning_rate": 1.236797418475697e-06, "loss": 0.9024, "step": 1086 }, { "epoch": 0.10028831737977165, "grad_norm": 2.774157868181651, "learning_rate": 1.2367589232062033e-06, "loss": 0.9406, "step": 1087 }, { "epoch": 0.10038057894129858, "grad_norm": 2.155396098393847, "learning_rate": 1.236720372498153e-06, "loss": 0.8102, "step": 1088 }, { "epoch": 0.10047284050282551, "grad_norm": 1.566442610547236, "learning_rate": 1.2366817663550399e-06, "loss": 0.669, "step": 1089 }, { "epoch": 0.10056510206435244, "grad_norm": 1.6382905235056355, "learning_rate": 1.2366431047803622e-06, "loss": 0.7896, "step": 1090 }, { "epoch": 0.10056510206435244, "eval_GEN Loss": 0.4887427091598511, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.45235133171081543, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9478966593742371, "eval_runtime": 56.2997, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 1090 }, { "epoch": 0.10065736362587936, "grad_norm": 3.260548589865754, "learning_rate": 1.2366043877776235e-06, "loss": 0.93, "step": 1091 }, { "epoch": 0.1007496251874063, "grad_norm": 2.8646590819893207, "learning_rate": 1.2365656153503327e-06, "loss": 0.6845, "step": 1092 }, { "epoch": 0.10084188674893323, "grad_norm": 2.0288586179259758, "learning_rate": 1.236526787502003e-06, "loss": 0.8515, "step": 1093 }, { "epoch": 0.10093414831046016, "grad_norm": 1.5112978349865815, "learning_rate": 1.2364879042361535e-06, "loss": 0.7404, "step": 1094 }, { "epoch": 0.10102640987198708, "grad_norm": 2.401128397609629, "learning_rate": 1.2364489655563075e-06, "loss": 0.66, "step": 1095 }, { "epoch": 0.10102640987198708, "eval_GEN Loss": 0.4885111153125763, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.46584510803222656, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9509615302085876, "eval_runtime": 57.106, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 1095 }, { "epoch": 0.10111867143351401, "grad_norm": 1.5690924072635593, "learning_rate": 1.2364099714659937e-06, "loss": 0.7624, "step": 1096 }, { "epoch": 0.10121093299504094, "grad_norm": 2.1418884280774155, "learning_rate": 1.236370921968746e-06, "loss": 1.0047, "step": 1097 }, { "epoch": 0.10130319455656787, "grad_norm": 1.8642136781223946, "learning_rate": 1.2363318170681032e-06, "loss": 0.8175, "step": 1098 }, { "epoch": 0.10139545611809479, "grad_norm": 2.6736263314289292, "learning_rate": 1.2362926567676087e-06, "loss": 0.9793, "step": 1099 }, { "epoch": 0.10148771767962173, "grad_norm": 1.752541227854694, "learning_rate": 1.2362534410708114e-06, "loss": 0.7323, "step": 1100 }, { "epoch": 0.10148771767962173, "eval_GEN Loss": 0.4882470965385437, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4444061517715454, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9581129550933838, "eval_runtime": 55.8385, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1100 }, { "epoch": 0.10157997924114866, "grad_norm": 2.503064476777125, "learning_rate": 1.2362141699812652e-06, "loss": 0.778, "step": 1101 }, { "epoch": 0.10167224080267559, "grad_norm": 1.5878985869751334, "learning_rate": 1.236174843502529e-06, "loss": 0.7759, "step": 1102 }, { "epoch": 0.10176450236420251, "grad_norm": 1.9126008356736544, "learning_rate": 1.2361354616381664e-06, "loss": 0.7474, "step": 1103 }, { "epoch": 0.10185676392572944, "grad_norm": 1.5539796327415196, "learning_rate": 1.2360960243917463e-06, "loss": 0.749, "step": 1104 }, { "epoch": 0.10194902548725637, "grad_norm": 1.960197152011404, "learning_rate": 1.2360565317668425e-06, "loss": 0.7112, "step": 1105 }, { "epoch": 0.10194902548725637, "eval_GEN Loss": 0.4906383156776428, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.44833284616470337, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9697115421295166, "eval_runtime": 56.0608, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1105 }, { "epoch": 0.1020412870487833, "grad_norm": 2.0062356883556047, "learning_rate": 1.236016983767034e-06, "loss": 0.9052, "step": 1106 }, { "epoch": 0.10213354861031022, "grad_norm": 2.407371182829471, "learning_rate": 1.2359773803959047e-06, "loss": 0.8707, "step": 1107 }, { "epoch": 0.10222581017183716, "grad_norm": 1.8258105151103796, "learning_rate": 1.2359377216570437e-06, "loss": 0.6605, "step": 1108 }, { "epoch": 0.10231807173336409, "grad_norm": 1.8117603448203083, "learning_rate": 1.2358980075540444e-06, "loss": 0.5328, "step": 1109 }, { "epoch": 0.10241033329489102, "grad_norm": 2.3949952588731342, "learning_rate": 1.2358582380905063e-06, "loss": 0.8625, "step": 1110 }, { "epoch": 0.10241033329489102, "eval_GEN Loss": 0.4929998815059662, "eval_GEN top-5 accuracy": 0.9767645769399387, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.450009286403656, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9662860631942749, "eval_runtime": 55.8382, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1110 }, { "epoch": 0.10250259485641794, "grad_norm": 2.267304274320555, "learning_rate": 1.2358184132700331e-06, "loss": 1.0628, "step": 1111 }, { "epoch": 0.10259485641794487, "grad_norm": 1.9153714077184445, "learning_rate": 1.2357785330962338e-06, "loss": 0.8216, "step": 1112 }, { "epoch": 0.1026871179794718, "grad_norm": 2.1349724599465776, "learning_rate": 1.2357385975727226e-06, "loss": 0.8565, "step": 1113 }, { "epoch": 0.10277937954099874, "grad_norm": 1.5515261839089143, "learning_rate": 1.2356986067031181e-06, "loss": 0.7103, "step": 1114 }, { "epoch": 0.10287164110252565, "grad_norm": 2.18568346598404, "learning_rate": 1.2356585604910448e-06, "loss": 0.9461, "step": 1115 }, { "epoch": 0.10287164110252565, "eval_GEN Loss": 0.4928361177444458, "eval_GEN top-5 accuracy": 0.9776413853572994, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.4473930597305298, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9716346263885498, "eval_runtime": 55.9383, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1115 }, { "epoch": 0.10296390266405259, "grad_norm": 1.9593718521236188, "learning_rate": 1.2356184589401317e-06, "loss": 0.701, "step": 1116 }, { "epoch": 0.10305616422557952, "grad_norm": 1.5112039103193984, "learning_rate": 1.2355783020540125e-06, "loss": 0.4822, "step": 1117 }, { "epoch": 0.10314842578710645, "grad_norm": 3.492610895074985, "learning_rate": 1.2355380898363265e-06, "loss": 1.0495, "step": 1118 }, { "epoch": 0.10324068734863337, "grad_norm": 2.779790989181864, "learning_rate": 1.235497822290718e-06, "loss": 0.8498, "step": 1119 }, { "epoch": 0.1033329489101603, "grad_norm": 2.495259404393216, "learning_rate": 1.2354574994208358e-06, "loss": 0.8314, "step": 1120 }, { "epoch": 0.1033329489101603, "eval_GEN Loss": 0.49186062812805176, "eval_GEN top-5 accuracy": 0.977202981148619, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.4566497206687927, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9811899065971375, "eval_runtime": 56.1218, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 1120 }, { "epoch": 0.10342521047168723, "grad_norm": 2.638511333717374, "learning_rate": 1.235417121230334e-06, "loss": 1.0844, "step": 1121 }, { "epoch": 0.10351747203321417, "grad_norm": 2.157032359175817, "learning_rate": 1.235376687722872e-06, "loss": 0.9147, "step": 1122 }, { "epoch": 0.10360973359474109, "grad_norm": 1.3307503885733896, "learning_rate": 1.2353361989021137e-06, "loss": 0.7644, "step": 1123 }, { "epoch": 0.10370199515626802, "grad_norm": 1.9289836445089643, "learning_rate": 1.2352956547717285e-06, "loss": 0.8233, "step": 1124 }, { "epoch": 0.10379425671779495, "grad_norm": 1.6397876995873373, "learning_rate": 1.2352550553353903e-06, "loss": 0.5665, "step": 1125 }, { "epoch": 0.10379425671779495, "eval_GEN Loss": 0.4904106557369232, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 Neg": 0.52, "eval_PRM Loss": 0.46971702575683594, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9793269038200378, "eval_runtime": 56.005, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1125 }, { "epoch": 0.10388651827932188, "grad_norm": 2.223510724143778, "learning_rate": 1.2352144005967787e-06, "loss": 0.7505, "step": 1126 }, { "epoch": 0.1039787798408488, "grad_norm": 3.043622424099526, "learning_rate": 1.2351736905595774e-06, "loss": 0.9179, "step": 1127 }, { "epoch": 0.10407104140237573, "grad_norm": 2.3547098805165105, "learning_rate": 1.235132925227476e-06, "loss": 0.8413, "step": 1128 }, { "epoch": 0.10416330296390267, "grad_norm": 1.9630806022172627, "learning_rate": 1.2350921046041683e-06, "loss": 0.7343, "step": 1129 }, { "epoch": 0.1042555645254296, "grad_norm": 1.946989665759252, "learning_rate": 1.2350512286933538e-06, "loss": 0.8474, "step": 1130 }, { "epoch": 0.1042555645254296, "eval_GEN Loss": 0.4904525578022003, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 Neg": 0.5, "eval_PRM Loss": 0.486596941947937, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9783653616905212, "eval_runtime": 57.2988, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 1130 }, { "epoch": 0.10434782608695652, "grad_norm": 2.2566667342476494, "learning_rate": 1.2350102974987368e-06, "loss": 0.9051, "step": 1131 }, { "epoch": 0.10444008764848345, "grad_norm": 1.190516769690317, "learning_rate": 1.2349693110240265e-06, "loss": 0.7958, "step": 1132 }, { "epoch": 0.10453234921001038, "grad_norm": 2.5848385443398807, "learning_rate": 1.2349282692729373e-06, "loss": 0.8176, "step": 1133 }, { "epoch": 0.10462461077153731, "grad_norm": 1.6079555069768316, "learning_rate": 1.234887172249188e-06, "loss": 0.8849, "step": 1134 }, { "epoch": 0.10471687233306423, "grad_norm": 1.8259966634702556, "learning_rate": 1.2348460199565035e-06, "loss": 0.7843, "step": 1135 }, { "epoch": 0.10471687233306423, "eval_GEN Loss": 0.49019476771354675, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 Neg": 0.5, "eval_PRM Loss": 0.49282306432724, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9757211804389954, "eval_runtime": 56.0892, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1135 }, { "epoch": 0.10480913389459116, "grad_norm": 2.578494402269661, "learning_rate": 1.2348048123986125e-06, "loss": 0.8173, "step": 1136 }, { "epoch": 0.1049013954561181, "grad_norm": 1.7756464307745905, "learning_rate": 1.2347635495792494e-06, "loss": 1.0041, "step": 1137 }, { "epoch": 0.10499365701764503, "grad_norm": 2.242358836794997, "learning_rate": 1.234722231502154e-06, "loss": 0.8198, "step": 1138 }, { "epoch": 0.10508591857917195, "grad_norm": 1.562835763782735, "learning_rate": 1.2346808581710702e-06, "loss": 0.7372, "step": 1139 }, { "epoch": 0.10517818014069888, "grad_norm": 1.7829047388278465, "learning_rate": 1.2346394295897473e-06, "loss": 0.7671, "step": 1140 }, { "epoch": 0.10517818014069888, "eval_GEN Loss": 0.4887770712375641, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8427672955974843, "eval_PRM F1 AUC": 0.707962283918282, "eval_PRM F1 Neg": 0.5283018867924528, "eval_PRM Loss": 0.5005943179130554, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.881578947368421, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9809495210647583, "eval_runtime": 55.797, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 1140 }, { "epoch": 0.10527044170222581, "grad_norm": 2.4676921484264422, "learning_rate": 1.2345979457619397e-06, "loss": 1.0341, "step": 1141 }, { "epoch": 0.10536270326375274, "grad_norm": 2.3281434201296265, "learning_rate": 1.2345564066914068e-06, "loss": 0.9362, "step": 1142 }, { "epoch": 0.10545496482527966, "grad_norm": 1.8217499538697424, "learning_rate": 1.234514812381913e-06, "loss": 0.8462, "step": 1143 }, { "epoch": 0.1055472263868066, "grad_norm": 1.998244371373172, "learning_rate": 1.2344731628372273e-06, "loss": 0.8503, "step": 1144 }, { "epoch": 0.10563948794833353, "grad_norm": 1.8376465866184033, "learning_rate": 1.2344314580611242e-06, "loss": 0.7209, "step": 1145 }, { "epoch": 0.10563948794833353, "eval_GEN Loss": 0.48478788137435913, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.4554228186607361, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9803485870361328, "eval_runtime": 55.9927, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1145 }, { "epoch": 0.10573174950986046, "grad_norm": 1.5757690964316267, "learning_rate": 1.2343896980573832e-06, "loss": 0.8978, "step": 1146 }, { "epoch": 0.10582401107138738, "grad_norm": 2.4409144721834375, "learning_rate": 1.2343478828297887e-06, "loss": 1.0605, "step": 1147 }, { "epoch": 0.10591627263291431, "grad_norm": 2.052028030357802, "learning_rate": 1.2343060123821296e-06, "loss": 0.8907, "step": 1148 }, { "epoch": 0.10600853419444124, "grad_norm": 1.544575693393687, "learning_rate": 1.234264086718201e-06, "loss": 0.6599, "step": 1149 }, { "epoch": 0.10610079575596817, "grad_norm": 2.1519084900119787, "learning_rate": 1.2342221058418017e-06, "loss": 0.9246, "step": 1150 }, { "epoch": 0.10610079575596817, "eval_GEN Loss": 0.48479387164115906, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.6511262441068623, "eval_PRM F1 Neg": 0.45454545454545453, "eval_PRM Loss": 0.43649429082870483, "eval_PRM NPV": 0.47619047619047616, "eval_PRM Precision": 0.8470588235294118, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 1.0037260055541992, "eval_runtime": 55.917, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1150 }, { "epoch": 0.1061930573174951, "grad_norm": 1.7989726386356726, "learning_rate": 1.234180069756736e-06, "loss": 0.7731, "step": 1151 }, { "epoch": 0.10628531887902203, "grad_norm": 1.8165689721538687, "learning_rate": 1.2341379784668137e-06, "loss": 0.7234, "step": 1152 }, { "epoch": 0.10637758044054896, "grad_norm": 2.6393223009208033, "learning_rate": 1.234095831975849e-06, "loss": 0.9134, "step": 1153 }, { "epoch": 0.10646984200207589, "grad_norm": 2.770264310554098, "learning_rate": 1.2340536302876614e-06, "loss": 0.9177, "step": 1154 }, { "epoch": 0.10656210356360281, "grad_norm": 1.7140804450288918, "learning_rate": 1.234011373406075e-06, "loss": 0.7026, "step": 1155 }, { "epoch": 0.10656210356360281, "eval_GEN Loss": 0.486250638961792, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM Loss": 0.40797463059425354, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.959254801273346, "eval_runtime": 55.9408, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1155 }, { "epoch": 0.10665436512512974, "grad_norm": 1.726417072871133, "learning_rate": 1.2339690613349194e-06, "loss": 0.9421, "step": 1156 }, { "epoch": 0.10674662668665667, "grad_norm": 1.7498272511515074, "learning_rate": 1.233926694078029e-06, "loss": 0.8111, "step": 1157 }, { "epoch": 0.1068388882481836, "grad_norm": 2.1298247243358723, "learning_rate": 1.233884271639243e-06, "loss": 1.0038, "step": 1158 }, { "epoch": 0.10693114980971052, "grad_norm": 2.31391672660952, "learning_rate": 1.2338417940224059e-06, "loss": 0.7578, "step": 1159 }, { "epoch": 0.10702341137123746, "grad_norm": 1.9063754681354979, "learning_rate": 1.2337992612313672e-06, "loss": 0.8946, "step": 1160 }, { "epoch": 0.10702341137123746, "eval_GEN Loss": 0.4875490963459015, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.43092072010040283, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9337740540504456, "eval_runtime": 55.9026, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1160 }, { "epoch": 0.10711567293276439, "grad_norm": 2.2177275668005723, "learning_rate": 1.233756673269981e-06, "loss": 0.8565, "step": 1161 }, { "epoch": 0.10720793449429132, "grad_norm": 2.305173590342485, "learning_rate": 1.2337140301421071e-06, "loss": 0.8235, "step": 1162 }, { "epoch": 0.10730019605581824, "grad_norm": 2.0110986777526, "learning_rate": 1.2336713318516095e-06, "loss": 0.6888, "step": 1163 }, { "epoch": 0.10739245761734517, "grad_norm": 1.7485914014280124, "learning_rate": 1.2336285784023578e-06, "loss": 0.9129, "step": 1164 }, { "epoch": 0.1074847191788721, "grad_norm": 1.929861511939592, "learning_rate": 1.2335857697982266e-06, "loss": 0.8243, "step": 1165 }, { "epoch": 0.1074847191788721, "eval_GEN Loss": 0.4870619773864746, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.44409653544425964, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9309495091438293, "eval_runtime": 56.1366, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 1165 }, { "epoch": 0.10757698074039904, "grad_norm": 1.980310529716834, "learning_rate": 1.2335429060430944e-06, "loss": 0.8317, "step": 1166 }, { "epoch": 0.10766924230192595, "grad_norm": 1.656414726821583, "learning_rate": 1.2334999871408467e-06, "loss": 0.7256, "step": 1167 }, { "epoch": 0.10776150386345289, "grad_norm": 1.4769578060692212, "learning_rate": 1.233457013095372e-06, "loss": 0.8265, "step": 1168 }, { "epoch": 0.10785376542497982, "grad_norm": 1.6487135203109253, "learning_rate": 1.2334139839105654e-06, "loss": 0.8368, "step": 1169 }, { "epoch": 0.10794602698650675, "grad_norm": 1.5763624855331888, "learning_rate": 1.2333708995903258e-06, "loss": 0.6424, "step": 1170 }, { "epoch": 0.10794602698650675, "eval_GEN Loss": 0.48684194684028625, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.42577382922172546, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9293269515037537, "eval_runtime": 56.9057, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1170 }, { "epoch": 0.10803828854803367, "grad_norm": 2.069352072052707, "learning_rate": 1.2333277601385577e-06, "loss": 0.822, "step": 1171 }, { "epoch": 0.1081305501095606, "grad_norm": 1.5312709494364685, "learning_rate": 1.2332845655591704e-06, "loss": 0.6668, "step": 1172 }, { "epoch": 0.10822281167108753, "grad_norm": 2.0578395624832018, "learning_rate": 1.2332413158560784e-06, "loss": 0.6411, "step": 1173 }, { "epoch": 0.10831507323261447, "grad_norm": 2.02697975392182, "learning_rate": 1.2331980110332007e-06, "loss": 0.9499, "step": 1174 }, { "epoch": 0.10840733479414139, "grad_norm": 1.677973701213988, "learning_rate": 1.2331546510944622e-06, "loss": 0.8123, "step": 1175 }, { "epoch": 0.10840733479414139, "eval_GEN Loss": 0.48646190762519836, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.40674087405204773, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9456730484962463, "eval_runtime": 57.0068, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1175 }, { "epoch": 0.10849959635566832, "grad_norm": 1.3564191365190188, "learning_rate": 1.2331112360437918e-06, "loss": 0.7495, "step": 1176 }, { "epoch": 0.10859185791719525, "grad_norm": 2.548023510607541, "learning_rate": 1.2330677658851242e-06, "loss": 1.0494, "step": 1177 }, { "epoch": 0.10868411947872218, "grad_norm": 2.4895815250280777, "learning_rate": 1.2330242406223985e-06, "loss": 0.9173, "step": 1178 }, { "epoch": 0.1087763810402491, "grad_norm": 2.93590344431322, "learning_rate": 1.2329806602595589e-06, "loss": 0.8843, "step": 1179 }, { "epoch": 0.10886864260177603, "grad_norm": 1.9049200362528216, "learning_rate": 1.2329370248005551e-06, "loss": 0.8401, "step": 1180 }, { "epoch": 0.10886864260177603, "eval_GEN Loss": 0.48844602704048157, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4213868975639343, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9299278855323792, "eval_runtime": 55.8828, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1180 }, { "epoch": 0.10896090416330297, "grad_norm": 1.7688347547982666, "learning_rate": 1.2328933342493411e-06, "loss": 0.8114, "step": 1181 }, { "epoch": 0.1090531657248299, "grad_norm": 1.7359552501254916, "learning_rate": 1.2328495886098762e-06, "loss": 0.7648, "step": 1182 }, { "epoch": 0.10914542728635682, "grad_norm": 1.612046766686986, "learning_rate": 1.232805787886125e-06, "loss": 0.7457, "step": 1183 }, { "epoch": 0.10923768884788375, "grad_norm": 1.9636722783651244, "learning_rate": 1.2327619320820566e-06, "loss": 0.917, "step": 1184 }, { "epoch": 0.10932995040941068, "grad_norm": 1.5754703622264092, "learning_rate": 1.2327180212016452e-06, "loss": 0.6563, "step": 1185 }, { "epoch": 0.10932995040941068, "eval_GEN Loss": 0.49035125970840454, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8441558441558441, "eval_PRM F1 AUC": 0.7611314824515453, "eval_PRM F1 Neg": 0.5862068965517241, "eval_PRM Loss": 0.4824090898036957, "eval_PRM NPV": 0.4857142857142857, "eval_PRM Precision": 0.9154929577464789, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9477764368057251, "eval_runtime": 55.8827, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1185 }, { "epoch": 0.10942221197093761, "grad_norm": 2.2896371509113744, "learning_rate": 1.2326740552488702e-06, "loss": 0.8701, "step": 1186 }, { "epoch": 0.10951447353246453, "grad_norm": 2.0582193165405154, "learning_rate": 1.2326300342277159e-06, "loss": 0.8605, "step": 1187 }, { "epoch": 0.10960673509399146, "grad_norm": 2.1309555411326198, "learning_rate": 1.2325859581421713e-06, "loss": 0.8683, "step": 1188 }, { "epoch": 0.1096989966555184, "grad_norm": 2.510452992249232, "learning_rate": 1.2325418269962308e-06, "loss": 0.903, "step": 1189 }, { "epoch": 0.10979125821704533, "grad_norm": 2.2442105538117354, "learning_rate": 1.2324976407938939e-06, "loss": 1.0334, "step": 1190 }, { "epoch": 0.10979125821704533, "eval_GEN Loss": 0.48855337500572205, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8589743589743589, "eval_PRM F1 AUC": 0.7731796752226295, "eval_PRM F1 Neg": 0.6071428571428571, "eval_PRM Loss": 0.4656677544116974, "eval_PRM NPV": 0.5151515151515151, "eval_PRM Precision": 0.9178082191780822, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9493990540504456, "eval_runtime": 56.0119, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1190 }, { "epoch": 0.10988351977857225, "grad_norm": 2.022699428884022, "learning_rate": 1.2324533995391643e-06, "loss": 0.8244, "step": 1191 }, { "epoch": 0.10997578134009918, "grad_norm": 1.9424420201266335, "learning_rate": 1.2324091032360517e-06, "loss": 0.8637, "step": 1192 }, { "epoch": 0.11006804290162611, "grad_norm": 2.3609370608937383, "learning_rate": 1.23236475188857e-06, "loss": 0.7843, "step": 1193 }, { "epoch": 0.11016030446315304, "grad_norm": 1.9832704742742902, "learning_rate": 1.2323203455007384e-06, "loss": 0.6733, "step": 1194 }, { "epoch": 0.11025256602467996, "grad_norm": 1.7324730654333904, "learning_rate": 1.2322758840765813e-06, "loss": 0.6238, "step": 1195 }, { "epoch": 0.11025256602467996, "eval_GEN Loss": 0.48724260926246643, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM Loss": 0.4369560778141022, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9841346144676208, "eval_runtime": 56.161, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 1195 }, { "epoch": 0.1103448275862069, "grad_norm": 3.3504049718983215, "learning_rate": 1.2322313676201274e-06, "loss": 0.8395, "step": 1196 }, { "epoch": 0.11043708914773383, "grad_norm": 1.8281556673261714, "learning_rate": 1.2321867961354116e-06, "loss": 0.7803, "step": 1197 }, { "epoch": 0.11052935070926076, "grad_norm": 2.1794012034206585, "learning_rate": 1.2321421696264723e-06, "loss": 0.9177, "step": 1198 }, { "epoch": 0.11062161227078768, "grad_norm": 2.4232356631219707, "learning_rate": 1.2320974880973542e-06, "loss": 0.7455, "step": 1199 }, { "epoch": 0.11071387383231461, "grad_norm": 2.466812411105342, "learning_rate": 1.2320527515521059e-06, "loss": 0.8103, "step": 1200 }, { "epoch": 0.11071387383231461, "eval_GEN Loss": 0.4868861436843872, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM Loss": 0.45209363102912903, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 1.0098557472229004, "eval_runtime": 56.1683, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 1200 }, { "epoch": 0.11080613539384154, "grad_norm": 2.3272115875739146, "learning_rate": 1.232007959994782e-06, "loss": 0.7054, "step": 1201 }, { "epoch": 0.11089839695536848, "grad_norm": 2.583595119552973, "learning_rate": 1.231963113429441e-06, "loss": 0.9144, "step": 1202 }, { "epoch": 0.1109906585168954, "grad_norm": 3.306092969142411, "learning_rate": 1.2319182118601475e-06, "loss": 0.8067, "step": 1203 }, { "epoch": 0.11108292007842233, "grad_norm": 2.5640626066477172, "learning_rate": 1.2318732552909703e-06, "loss": 0.9441, "step": 1204 }, { "epoch": 0.11117518163994926, "grad_norm": 1.6918386714801197, "learning_rate": 1.2318282437259835e-06, "loss": 0.7275, "step": 1205 }, { "epoch": 0.11117518163994926, "eval_GEN Loss": 0.4903247058391571, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 Neg": 0.52, "eval_PRM Loss": 0.4829825162887573, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9960336685180664, "eval_runtime": 56.0394, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1205 }, { "epoch": 0.11126744320147619, "grad_norm": 1.9142145845356089, "learning_rate": 1.2317831771692658e-06, "loss": 0.9109, "step": 1206 }, { "epoch": 0.11135970476300311, "grad_norm": 2.2061703937594603, "learning_rate": 1.231738055624902e-06, "loss": 0.8353, "step": 1207 }, { "epoch": 0.11145196632453004, "grad_norm": 1.6339986391626806, "learning_rate": 1.2316928790969803e-06, "loss": 0.7552, "step": 1208 }, { "epoch": 0.11154422788605697, "grad_norm": 1.9839433452397386, "learning_rate": 1.231647647589595e-06, "loss": 0.8809, "step": 1209 }, { "epoch": 0.1116364894475839, "grad_norm": 1.6948509211816858, "learning_rate": 1.231602361106845e-06, "loss": 0.7515, "step": 1210 }, { "epoch": 0.1116364894475839, "eval_GEN Loss": 0.49288755655288696, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.84472049689441, "eval_PRM F1 AUC": 0.6922472498690415, "eval_PRM F1 Neg": 0.5098039215686274, "eval_PRM Loss": 0.4933969974517822, "eval_PRM NPV": 0.4642857142857143, "eval_PRM Precision": 0.8717948717948718, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9946514368057251, "eval_runtime": 57.0308, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1210 }, { "epoch": 0.11172875100911082, "grad_norm": 2.333241413499883, "learning_rate": 1.2315570196528342e-06, "loss": 0.7236, "step": 1211 }, { "epoch": 0.11182101257063776, "grad_norm": 1.8259354114271136, "learning_rate": 1.2315116232316715e-06, "loss": 0.7274, "step": 1212 }, { "epoch": 0.11191327413216469, "grad_norm": 1.5460668876861083, "learning_rate": 1.2314661718474708e-06, "loss": 0.7628, "step": 1213 }, { "epoch": 0.11200553569369162, "grad_norm": 3.979263775837841, "learning_rate": 1.2314206655043512e-06, "loss": 1.0967, "step": 1214 }, { "epoch": 0.11209779725521854, "grad_norm": 1.803237941124396, "learning_rate": 1.2313751042064362e-06, "loss": 0.673, "step": 1215 }, { "epoch": 0.11209779725521854, "eval_GEN Loss": 0.4911290109157562, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.48653483390808105, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9960336685180664, "eval_runtime": 56.7757, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1215 }, { "epoch": 0.11219005881674547, "grad_norm": 2.0604165445059595, "learning_rate": 1.2313294879578548e-06, "loss": 0.7396, "step": 1216 }, { "epoch": 0.1122823203782724, "grad_norm": 1.8054316251819142, "learning_rate": 1.2312838167627408e-06, "loss": 0.9521, "step": 1217 }, { "epoch": 0.11237458193979934, "grad_norm": 2.0219527025493234, "learning_rate": 1.2312380906252334e-06, "loss": 0.7238, "step": 1218 }, { "epoch": 0.11246684350132626, "grad_norm": 1.9476637258107512, "learning_rate": 1.2311923095494755e-06, "loss": 0.6648, "step": 1219 }, { "epoch": 0.11255910506285319, "grad_norm": 1.9191471098412223, "learning_rate": 1.2311464735396166e-06, "loss": 0.7794, "step": 1220 }, { "epoch": 0.11255910506285319, "eval_GEN Loss": 0.48921579122543335, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.47596776485443115, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9862980842590332, "eval_runtime": 56.7988, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1220 }, { "epoch": 0.11265136662438012, "grad_norm": 1.910437132627685, "learning_rate": 1.2311005825998102e-06, "loss": 0.9121, "step": 1221 }, { "epoch": 0.11274362818590705, "grad_norm": 1.5798561671650437, "learning_rate": 1.2310546367342149e-06, "loss": 0.8384, "step": 1222 }, { "epoch": 0.11283588974743397, "grad_norm": 2.1210775495187972, "learning_rate": 1.2310086359469945e-06, "loss": 0.7574, "step": 1223 }, { "epoch": 0.1129281513089609, "grad_norm": 2.0998204169465673, "learning_rate": 1.2309625802423176e-06, "loss": 0.9323, "step": 1224 }, { "epoch": 0.11302041287048784, "grad_norm": 3.8016711561536463, "learning_rate": 1.230916469624358e-06, "loss": 0.8167, "step": 1225 }, { "epoch": 0.11302041287048784, "eval_GEN Loss": 0.48783984780311584, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4506700038909912, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9697115421295166, "eval_runtime": 56.7983, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1225 }, { "epoch": 0.11311267443201477, "grad_norm": 2.3009203906219935, "learning_rate": 1.2308703040972942e-06, "loss": 0.9366, "step": 1226 }, { "epoch": 0.11320493599354169, "grad_norm": 2.26488523449271, "learning_rate": 1.2308240836653096e-06, "loss": 0.7221, "step": 1227 }, { "epoch": 0.11329719755506862, "grad_norm": 1.8704250858740405, "learning_rate": 1.230777808332593e-06, "loss": 0.6154, "step": 1228 }, { "epoch": 0.11338945911659555, "grad_norm": 2.0560324644077466, "learning_rate": 1.230731478103338e-06, "loss": 0.8106, "step": 1229 }, { "epoch": 0.11348172067812248, "grad_norm": 1.495671876208774, "learning_rate": 1.230685092981743e-06, "loss": 0.7048, "step": 1230 }, { "epoch": 0.11348172067812248, "eval_GEN Loss": 0.4879695177078247, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.42036473751068115, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9837740659713745, "eval_runtime": 56.9633, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1230 }, { "epoch": 0.1135739822396494, "grad_norm": 1.9992911268614089, "learning_rate": 1.2306386529720115e-06, "loss": 0.6861, "step": 1231 }, { "epoch": 0.11366624380117633, "grad_norm": 2.1625798494717157, "learning_rate": 1.2305921580783519e-06, "loss": 0.8691, "step": 1232 }, { "epoch": 0.11375850536270327, "grad_norm": 1.7572110133120686, "learning_rate": 1.2305456083049778e-06, "loss": 0.6188, "step": 1233 }, { "epoch": 0.1138507669242302, "grad_norm": 3.990292125990343, "learning_rate": 1.2304990036561077e-06, "loss": 1.122, "step": 1234 }, { "epoch": 0.11394302848575712, "grad_norm": 1.362868875893105, "learning_rate": 1.2304523441359645e-06, "loss": 0.6572, "step": 1235 }, { "epoch": 0.11394302848575712, "eval_GEN Loss": 0.4927229881286621, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.41139060258865356, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9867788553237915, "eval_runtime": 55.8913, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1235 }, { "epoch": 0.11403529004728405, "grad_norm": 1.4789390013239685, "learning_rate": 1.230405629748777e-06, "loss": 0.7417, "step": 1236 }, { "epoch": 0.11412755160881098, "grad_norm": 1.8020256171051858, "learning_rate": 1.2303588604987785e-06, "loss": 0.7417, "step": 1237 }, { "epoch": 0.11421981317033791, "grad_norm": 1.9066295153227304, "learning_rate": 1.230312036390207e-06, "loss": 0.7737, "step": 1238 }, { "epoch": 0.11431207473186483, "grad_norm": 2.4963181073538094, "learning_rate": 1.2302651574273063e-06, "loss": 1.054, "step": 1239 }, { "epoch": 0.11440433629339176, "grad_norm": 1.8251129584340515, "learning_rate": 1.230218223614324e-06, "loss": 0.9767, "step": 1240 }, { "epoch": 0.11440433629339176, "eval_GEN Loss": 0.49484437704086304, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.4209262430667877, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9575120210647583, "eval_runtime": 55.8379, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1240 }, { "epoch": 0.1144965978549187, "grad_norm": 1.997936736599995, "learning_rate": 1.2301712349555139e-06, "loss": 0.7246, "step": 1241 }, { "epoch": 0.11458885941644563, "grad_norm": 1.4723677395700392, "learning_rate": 1.230124191455134e-06, "loss": 0.8091, "step": 1242 }, { "epoch": 0.11468112097797255, "grad_norm": 1.8669420475096228, "learning_rate": 1.2300770931174472e-06, "loss": 0.8244, "step": 1243 }, { "epoch": 0.11477338253949948, "grad_norm": 1.976773884958207, "learning_rate": 1.2300299399467217e-06, "loss": 0.7619, "step": 1244 }, { "epoch": 0.11486564410102641, "grad_norm": 1.7786316282322259, "learning_rate": 1.229982731947231e-06, "loss": 0.5921, "step": 1245 }, { "epoch": 0.11486564410102641, "eval_GEN Loss": 0.4953586459159851, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.44311127066612244, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9525240659713745, "eval_runtime": 55.9117, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1245 }, { "epoch": 0.11495790566255334, "grad_norm": 1.7248180124838284, "learning_rate": 1.2299354691232527e-06, "loss": 0.7807, "step": 1246 }, { "epoch": 0.11505016722408026, "grad_norm": 1.9239963241109062, "learning_rate": 1.22988815147907e-06, "loss": 0.7448, "step": 1247 }, { "epoch": 0.1151424287856072, "grad_norm": 2.1630647471198636, "learning_rate": 1.2298407790189709e-06, "loss": 0.9987, "step": 1248 }, { "epoch": 0.11523469034713413, "grad_norm": 1.8775242072610066, "learning_rate": 1.2297933517472484e-06, "loss": 0.8983, "step": 1249 }, { "epoch": 0.11532695190866106, "grad_norm": 1.9481258755149686, "learning_rate": 1.2297458696682005e-06, "loss": 0.9304, "step": 1250 }, { "epoch": 0.11532695190866106, "eval_GEN Loss": 0.49161943793296814, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4523923993110657, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.95703125, "eval_runtime": 56.0817, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1250 }, { "epoch": 0.11541921347018798, "grad_norm": 1.8349139608614415, "learning_rate": 1.22969833278613e-06, "loss": 0.6716, "step": 1251 }, { "epoch": 0.11551147503171491, "grad_norm": 1.5689091622911395, "learning_rate": 1.2296507411053446e-06, "loss": 0.7903, "step": 1252 }, { "epoch": 0.11560373659324184, "grad_norm": 1.864361596538834, "learning_rate": 1.2296030946301574e-06, "loss": 0.8044, "step": 1253 }, { "epoch": 0.11569599815476878, "grad_norm": 1.9153860482212435, "learning_rate": 1.2295553933648863e-06, "loss": 0.9074, "step": 1254 }, { "epoch": 0.1157882597162957, "grad_norm": 1.9224706653837949, "learning_rate": 1.2295076373138536e-06, "loss": 0.922, "step": 1255 }, { "epoch": 0.1157882597162957, "eval_GEN Loss": 0.49123042821884155, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.44373172521591187, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9667067527770996, "eval_runtime": 55.9882, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1255 }, { "epoch": 0.11588052127782263, "grad_norm": 1.5471438731740057, "learning_rate": 1.2294598264813873e-06, "loss": 0.9188, "step": 1256 }, { "epoch": 0.11597278283934956, "grad_norm": 1.7555395101693638, "learning_rate": 1.2294119608718203e-06, "loss": 0.839, "step": 1257 }, { "epoch": 0.11606504440087649, "grad_norm": 1.6358990907131337, "learning_rate": 1.22936404048949e-06, "loss": 0.8239, "step": 1258 }, { "epoch": 0.11615730596240341, "grad_norm": 1.8715056530450735, "learning_rate": 1.2293160653387388e-06, "loss": 0.8721, "step": 1259 }, { "epoch": 0.11624956752393034, "grad_norm": 1.7281595737040045, "learning_rate": 1.2292680354239148e-06, "loss": 0.7831, "step": 1260 }, { "epoch": 0.11624956752393034, "eval_GEN Loss": 0.4905729293823242, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4472057521343231, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9637620449066162, "eval_runtime": 56.0599, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1260 }, { "epoch": 0.11634182908545727, "grad_norm": 1.7609236740955532, "learning_rate": 1.2292199507493702e-06, "loss": 0.7484, "step": 1261 }, { "epoch": 0.1164340906469842, "grad_norm": 2.118717397078278, "learning_rate": 1.2291718113194627e-06, "loss": 0.8318, "step": 1262 }, { "epoch": 0.11652635220851112, "grad_norm": 1.8373932256046257, "learning_rate": 1.2291236171385545e-06, "loss": 0.7109, "step": 1263 }, { "epoch": 0.11661861377003806, "grad_norm": 1.7655496164280557, "learning_rate": 1.2290753682110135e-06, "loss": 0.7079, "step": 1264 }, { "epoch": 0.11671087533156499, "grad_norm": 2.5227832491472744, "learning_rate": 1.2290270645412116e-06, "loss": 0.7442, "step": 1265 }, { "epoch": 0.11671087533156499, "eval_GEN Loss": 0.48896458745002747, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.44111210107803345, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9471153616905212, "eval_runtime": 56.9285, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1265 }, { "epoch": 0.11680313689309192, "grad_norm": 1.7873531252217434, "learning_rate": 1.2289787061335263e-06, "loss": 0.7228, "step": 1266 }, { "epoch": 0.11689539845461884, "grad_norm": 2.8849635823358573, "learning_rate": 1.2289302929923402e-06, "loss": 0.8533, "step": 1267 }, { "epoch": 0.11698766001614577, "grad_norm": 2.4305007851692153, "learning_rate": 1.2288818251220403e-06, "loss": 0.8249, "step": 1268 }, { "epoch": 0.1170799215776727, "grad_norm": 1.6413552127999673, "learning_rate": 1.2288333025270185e-06, "loss": 0.7109, "step": 1269 }, { "epoch": 0.11717218313919964, "grad_norm": 2.397754173705168, "learning_rate": 1.2287847252116726e-06, "loss": 0.8528, "step": 1270 }, { "epoch": 0.11717218313919964, "eval_GEN Loss": 0.48914703726768494, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.40857037901878357, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9649038314819336, "eval_runtime": 55.9966, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1270 }, { "epoch": 0.11726444470072656, "grad_norm": 1.749884991453997, "learning_rate": 1.2287360931804048e-06, "loss": 0.9046, "step": 1271 }, { "epoch": 0.11735670626225349, "grad_norm": 3.3203167016211377, "learning_rate": 1.2286874064376217e-06, "loss": 0.9641, "step": 1272 }, { "epoch": 0.11744896782378042, "grad_norm": 1.78784685017401, "learning_rate": 1.2286386649877358e-06, "loss": 0.6087, "step": 1273 }, { "epoch": 0.11754122938530735, "grad_norm": 2.207589169562766, "learning_rate": 1.2285898688351638e-06, "loss": 0.788, "step": 1274 }, { "epoch": 0.11763349094683427, "grad_norm": 1.9101249677078853, "learning_rate": 1.2285410179843277e-06, "loss": 0.7491, "step": 1275 }, { "epoch": 0.11763349094683427, "eval_GEN Loss": 0.4912085235118866, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.39622050523757935, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.957932710647583, "eval_runtime": 57.1497, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 1275 }, { "epoch": 0.1177257525083612, "grad_norm": 2.6422083951311666, "learning_rate": 1.2284921124396547e-06, "loss": 0.7895, "step": 1276 }, { "epoch": 0.11781801406988814, "grad_norm": 2.46197267519697, "learning_rate": 1.2284431522055766e-06, "loss": 0.7814, "step": 1277 }, { "epoch": 0.11791027563141507, "grad_norm": 1.8120570948314536, "learning_rate": 1.2283941372865303e-06, "loss": 0.7436, "step": 1278 }, { "epoch": 0.11800253719294199, "grad_norm": 2.684960415278719, "learning_rate": 1.2283450676869573e-06, "loss": 0.7525, "step": 1279 }, { "epoch": 0.11809479875446892, "grad_norm": 2.506761052462561, "learning_rate": 1.2282959434113045e-06, "loss": 0.7506, "step": 1280 }, { "epoch": 0.11809479875446892, "eval_GEN Loss": 0.4923955202102661, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.4056079089641571, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9118990302085876, "eval_runtime": 56.9534, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1280 }, { "epoch": 0.11818706031599585, "grad_norm": 1.6064649037889431, "learning_rate": 1.2282467644640239e-06, "loss": 0.6396, "step": 1281 }, { "epoch": 0.11827932187752278, "grad_norm": 1.940776110107445, "learning_rate": 1.228197530849572e-06, "loss": 0.8193, "step": 1282 }, { "epoch": 0.1183715834390497, "grad_norm": 1.7846565497956695, "learning_rate": 1.2281482425724103e-06, "loss": 0.7188, "step": 1283 }, { "epoch": 0.11846384500057663, "grad_norm": 2.2620249600204994, "learning_rate": 1.2280988996370057e-06, "loss": 0.9059, "step": 1284 }, { "epoch": 0.11855610656210357, "grad_norm": 1.7475948681226834, "learning_rate": 1.2280495020478291e-06, "loss": 0.7448, "step": 1285 }, { "epoch": 0.11855610656210357, "eval_GEN Loss": 0.4951961636543274, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4066463112831116, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8948317170143127, "eval_runtime": 56.9624, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1285 }, { "epoch": 0.1186483681236305, "grad_norm": 1.326016769754368, "learning_rate": 1.2280000498093578e-06, "loss": 0.6742, "step": 1286 }, { "epoch": 0.11874062968515742, "grad_norm": 2.292162155898998, "learning_rate": 1.2279505429260729e-06, "loss": 0.803, "step": 1287 }, { "epoch": 0.11883289124668435, "grad_norm": 1.563686091518793, "learning_rate": 1.2279009814024605e-06, "loss": 0.7024, "step": 1288 }, { "epoch": 0.11892515280821128, "grad_norm": 2.5605781601401514, "learning_rate": 1.2278513652430123e-06, "loss": 0.836, "step": 1289 }, { "epoch": 0.11901741436973821, "grad_norm": 1.9957556185976306, "learning_rate": 1.2278016944522245e-06, "loss": 0.8837, "step": 1290 }, { "epoch": 0.11901741436973821, "eval_GEN Loss": 0.49639612436294556, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.38042151927948, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8947115540504456, "eval_runtime": 56.8549, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1290 }, { "epoch": 0.11910967593126513, "grad_norm": 3.0767161496384716, "learning_rate": 1.2277519690345982e-06, "loss": 0.9519, "step": 1291 }, { "epoch": 0.11920193749279206, "grad_norm": 2.022954445214826, "learning_rate": 1.2277021889946397e-06, "loss": 0.6947, "step": 1292 }, { "epoch": 0.119294199054319, "grad_norm": 1.9583881679622657, "learning_rate": 1.2276523543368602e-06, "loss": 0.7825, "step": 1293 }, { "epoch": 0.11938646061584593, "grad_norm": 1.5783633172665636, "learning_rate": 1.2276024650657758e-06, "loss": 0.6771, "step": 1294 }, { "epoch": 0.11947872217737285, "grad_norm": 1.6031041132358899, "learning_rate": 1.2275525211859076e-06, "loss": 0.6923, "step": 1295 }, { "epoch": 0.11947872217737285, "eval_GEN Loss": 0.49745118618011475, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3748480975627899, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9041466116905212, "eval_runtime": 56.9659, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1295 }, { "epoch": 0.11957098373889978, "grad_norm": 1.573106670247981, "learning_rate": 1.2275025227017813e-06, "loss": 0.8175, "step": 1296 }, { "epoch": 0.11966324530042671, "grad_norm": 2.8140865304331673, "learning_rate": 1.2274524696179283e-06, "loss": 1.1144, "step": 1297 }, { "epoch": 0.11975550686195365, "grad_norm": 1.5626355365290727, "learning_rate": 1.227402361938884e-06, "loss": 0.6706, "step": 1298 }, { "epoch": 0.11984776842348056, "grad_norm": 2.2106948655961323, "learning_rate": 1.2273521996691895e-06, "loss": 0.7366, "step": 1299 }, { "epoch": 0.1199400299850075, "grad_norm": 3.611276867720812, "learning_rate": 1.2273019828133908e-06, "loss": 0.8502, "step": 1300 }, { "epoch": 0.1199400299850075, "eval_GEN Loss": 0.49392223358154297, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.37433359026908875, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9100360870361328, "eval_runtime": 56.978, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1300 }, { "epoch": 0.12003229154653443, "grad_norm": 2.1935284161123323, "learning_rate": 1.227251711376038e-06, "loss": 0.9244, "step": 1301 }, { "epoch": 0.12012455310806136, "grad_norm": 2.28938953997289, "learning_rate": 1.2272013853616874e-06, "loss": 0.6428, "step": 1302 }, { "epoch": 0.12021681466958828, "grad_norm": 1.8831071642607708, "learning_rate": 1.2271510047748994e-06, "loss": 0.5655, "step": 1303 }, { "epoch": 0.12030907623111521, "grad_norm": 2.7674605841492, "learning_rate": 1.2271005696202394e-06, "loss": 0.8868, "step": 1304 }, { "epoch": 0.12040133779264214, "grad_norm": 2.1277466206939586, "learning_rate": 1.227050079902278e-06, "loss": 0.8592, "step": 1305 }, { "epoch": 0.12040133779264214, "eval_GEN Loss": 0.49284905195236206, "eval_GEN top-5 accuracy": 0.9780797895659799, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.398231565952301, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8812500238418579, "eval_runtime": 56.8489, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1305 }, { "epoch": 0.12049359935416908, "grad_norm": 3.230113473102956, "learning_rate": 1.226999535625591e-06, "loss": 1.0419, "step": 1306 }, { "epoch": 0.120585860915696, "grad_norm": 1.6201613850118866, "learning_rate": 1.2269489367947582e-06, "loss": 0.8235, "step": 1307 }, { "epoch": 0.12067812247722293, "grad_norm": 2.264023013262882, "learning_rate": 1.2268982834143656e-06, "loss": 0.8541, "step": 1308 }, { "epoch": 0.12077038403874986, "grad_norm": 2.421431406370077, "learning_rate": 1.2268475754890029e-06, "loss": 0.962, "step": 1309 }, { "epoch": 0.12086264560027679, "grad_norm": 1.7229390248536531, "learning_rate": 1.2267968130232657e-06, "loss": 0.712, "step": 1310 }, { "epoch": 0.12086264560027679, "eval_GEN Loss": 0.49430614709854126, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8552631578947368, "eval_PRM F1 AUC": 0.8046097433211105, "eval_PRM F1 Neg": 0.6333333333333333, "eval_PRM Loss": 0.47042927145957947, "eval_PRM NPV": 0.5135135135135135, "eval_PRM Precision": 0.9420289855072463, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 0.9013221263885498, "eval_runtime": 57.0128, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1310 }, { "epoch": 0.12095490716180371, "grad_norm": 2.2250996507214276, "learning_rate": 1.226745996021754e-06, "loss": 0.8493, "step": 1311 }, { "epoch": 0.12104716872333064, "grad_norm": 1.8707936283098114, "learning_rate": 1.226695124489073e-06, "loss": 0.6961, "step": 1312 }, { "epoch": 0.12113943028485757, "grad_norm": 3.3417424110119347, "learning_rate": 1.2266441984298327e-06, "loss": 0.9266, "step": 1313 }, { "epoch": 0.1212316918463845, "grad_norm": 2.5732522872035446, "learning_rate": 1.2265932178486483e-06, "loss": 0.7325, "step": 1314 }, { "epoch": 0.12132395340791143, "grad_norm": 1.9018229284694772, "learning_rate": 1.2265421827501395e-06, "loss": 0.7876, "step": 1315 }, { "epoch": 0.12132395340791143, "eval_GEN Loss": 0.49222859740257263, "eval_GEN top-5 accuracy": 0.9789565979833407, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8774193548387097, "eval_PRM F1 AUC": 0.8226820324777371, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4281691312789917, "eval_PRM NPV": 0.5588235294117647, "eval_PRM Precision": 0.9444444444444444, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 0.8835336565971375, "eval_runtime": 56.8326, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1315 }, { "epoch": 0.12141621496943836, "grad_norm": 1.8488596501663879, "learning_rate": 1.2264910931389312e-06, "loss": 0.7547, "step": 1316 }, { "epoch": 0.12150847653096529, "grad_norm": 1.8484299160489088, "learning_rate": 1.2264399490196533e-06, "loss": 0.8028, "step": 1317 }, { "epoch": 0.12160073809249222, "grad_norm": 1.5443884201729963, "learning_rate": 1.2263887503969405e-06, "loss": 0.6124, "step": 1318 }, { "epoch": 0.12169299965401914, "grad_norm": 1.5278949700900137, "learning_rate": 1.2263374972754324e-06, "loss": 0.7439, "step": 1319 }, { "epoch": 0.12178526121554607, "grad_norm": 1.8514423421923552, "learning_rate": 1.226286189659774e-06, "loss": 0.8699, "step": 1320 }, { "epoch": 0.12178526121554607, "eval_GEN Loss": 0.49053096771240234, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.38080504536628723, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9111778736114502, "eval_runtime": 56.9873, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1320 }, { "epoch": 0.121877522777073, "grad_norm": 2.565714757651536, "learning_rate": 1.2262348275546145e-06, "loss": 0.8825, "step": 1321 }, { "epoch": 0.12196978433859994, "grad_norm": 1.7304304013800949, "learning_rate": 1.226183410964609e-06, "loss": 0.7343, "step": 1322 }, { "epoch": 0.12206204590012686, "grad_norm": 2.51550071315553, "learning_rate": 1.226131939894416e-06, "loss": 1.048, "step": 1323 }, { "epoch": 0.12215430746165379, "grad_norm": 2.3891342523973447, "learning_rate": 1.2260804143487007e-06, "loss": 0.8047, "step": 1324 }, { "epoch": 0.12224656902318072, "grad_norm": 1.8475248227200738, "learning_rate": 1.226028834332132e-06, "loss": 0.6824, "step": 1325 }, { "epoch": 0.12224656902318072, "eval_GEN Loss": 0.49069076776504517, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3912678062915802, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9151442050933838, "eval_runtime": 56.8241, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1325 }, { "epoch": 0.12233883058470765, "grad_norm": 1.779257449054373, "learning_rate": 1.2259771998493845e-06, "loss": 0.5389, "step": 1326 }, { "epoch": 0.12243109214623457, "grad_norm": 3.5142895414815505, "learning_rate": 1.2259255109051369e-06, "loss": 1.0975, "step": 1327 }, { "epoch": 0.1225233537077615, "grad_norm": 2.0668360555397824, "learning_rate": 1.2258737675040738e-06, "loss": 0.818, "step": 1328 }, { "epoch": 0.12261561526928844, "grad_norm": 1.6280634119087998, "learning_rate": 1.225821969650884e-06, "loss": 0.9491, "step": 1329 }, { "epoch": 0.12270787683081537, "grad_norm": 1.9001001064855316, "learning_rate": 1.2257701173502618e-06, "loss": 0.8077, "step": 1330 }, { "epoch": 0.12270787683081537, "eval_GEN Loss": 0.48902031779289246, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3988769054412842, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9060696959495544, "eval_runtime": 56.8036, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1330 }, { "epoch": 0.12280013839234229, "grad_norm": 1.6537615151434861, "learning_rate": 1.2257182106069056e-06, "loss": 0.6946, "step": 1331 }, { "epoch": 0.12289239995386922, "grad_norm": 1.8871678927422304, "learning_rate": 1.22566624942552e-06, "loss": 0.7479, "step": 1332 }, { "epoch": 0.12298466151539615, "grad_norm": 1.979539107160251, "learning_rate": 1.2256142338108132e-06, "loss": 0.7868, "step": 1333 }, { "epoch": 0.12307692307692308, "grad_norm": 2.4620381895051557, "learning_rate": 1.2255621637674991e-06, "loss": 0.9231, "step": 1334 }, { "epoch": 0.12316918463845, "grad_norm": 2.5053203833222666, "learning_rate": 1.2255100393002967e-06, "loss": 0.8815, "step": 1335 }, { "epoch": 0.12316918463845, "eval_GEN Loss": 0.4872274696826935, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4308062493801117, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.907151460647583, "eval_runtime": 57.2071, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 1335 }, { "epoch": 0.12326144619997693, "grad_norm": 2.4154779428773003, "learning_rate": 1.225457860413929e-06, "loss": 0.8436, "step": 1336 }, { "epoch": 0.12335370776150387, "grad_norm": 1.8829189925644858, "learning_rate": 1.225405627113125e-06, "loss": 0.8892, "step": 1337 }, { "epoch": 0.1234459693230308, "grad_norm": 1.7127274025772998, "learning_rate": 1.2253533394026178e-06, "loss": 0.4481, "step": 1338 }, { "epoch": 0.12353823088455772, "grad_norm": 2.03664475177838, "learning_rate": 1.2253009972871463e-06, "loss": 0.7433, "step": 1339 }, { "epoch": 0.12363049244608465, "grad_norm": 1.7966903993830157, "learning_rate": 1.2252486007714535e-06, "loss": 0.8347, "step": 1340 }, { "epoch": 0.12363049244608465, "eval_GEN Loss": 0.48570749163627625, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.4023730754852295, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9155048131942749, "eval_runtime": 56.9631, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1340 }, { "epoch": 0.12372275400761158, "grad_norm": 1.5100872404160781, "learning_rate": 1.2251961498602876e-06, "loss": 0.7208, "step": 1341 }, { "epoch": 0.12381501556913851, "grad_norm": 1.1805249230992214, "learning_rate": 1.2251436445584019e-06, "loss": 0.5913, "step": 1342 }, { "epoch": 0.12390727713066543, "grad_norm": 2.000992335213143, "learning_rate": 1.2250910848705546e-06, "loss": 0.8445, "step": 1343 }, { "epoch": 0.12399953869219237, "grad_norm": 1.5996161674342857, "learning_rate": 1.2250384708015087e-06, "loss": 0.7581, "step": 1344 }, { "epoch": 0.1240918002537193, "grad_norm": 3.241294099197593, "learning_rate": 1.2249858023560317e-06, "loss": 1.0236, "step": 1345 }, { "epoch": 0.1240918002537193, "eval_GEN Loss": 0.4876135289669037, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM Loss": 0.39364543557167053, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9313101172447205, "eval_runtime": 56.8033, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1345 }, { "epoch": 0.12418406181524622, "grad_norm": 1.9905229496189492, "learning_rate": 1.2249330795388971e-06, "loss": 0.8514, "step": 1346 }, { "epoch": 0.12427632337677315, "grad_norm": 1.571750154821204, "learning_rate": 1.2248803023548827e-06, "loss": 0.7193, "step": 1347 }, { "epoch": 0.12436858493830008, "grad_norm": 1.685205589806922, "learning_rate": 1.224827470808771e-06, "loss": 0.5701, "step": 1348 }, { "epoch": 0.12446084649982701, "grad_norm": 2.394225354378885, "learning_rate": 1.2247745849053497e-06, "loss": 0.9537, "step": 1349 }, { "epoch": 0.12455310806135393, "grad_norm": 2.3157824689347515, "learning_rate": 1.2247216446494115e-06, "loss": 0.6846, "step": 1350 }, { "epoch": 0.12455310806135393, "eval_GEN Loss": 0.490536630153656, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.40498775243759155, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.920192301273346, "eval_runtime": 56.8933, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1350 }, { "epoch": 0.12464536962288086, "grad_norm": 1.3484877227150613, "learning_rate": 1.2246686500457539e-06, "loss": 0.7361, "step": 1351 }, { "epoch": 0.1247376311844078, "grad_norm": 1.462469573473979, "learning_rate": 1.2246156010991791e-06, "loss": 0.7746, "step": 1352 }, { "epoch": 0.12482989274593473, "grad_norm": 2.441359574282289, "learning_rate": 1.224562497814495e-06, "loss": 0.68, "step": 1353 }, { "epoch": 0.12492215430746165, "grad_norm": 1.4352457642433032, "learning_rate": 1.2245093401965136e-06, "loss": 0.6796, "step": 1354 }, { "epoch": 0.1250144158689886, "grad_norm": 2.0719272539069866, "learning_rate": 1.224456128250052e-06, "loss": 0.822, "step": 1355 }, { "epoch": 0.1250144158689886, "eval_GEN Loss": 0.493169367313385, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.40531107783317566, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9220553040504456, "eval_runtime": 55.9278, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1355 }, { "epoch": 0.1251066774305155, "grad_norm": 1.6547964849612078, "learning_rate": 1.2244028619799326e-06, "loss": 0.7411, "step": 1356 }, { "epoch": 0.12519893899204243, "grad_norm": 1.9780433262016586, "learning_rate": 1.2243495413909823e-06, "loss": 0.6415, "step": 1357 }, { "epoch": 0.12529120055356938, "grad_norm": 1.6968738629275064, "learning_rate": 1.2242961664880332e-06, "loss": 0.6864, "step": 1358 }, { "epoch": 0.1253834621150963, "grad_norm": 3.751259488620392, "learning_rate": 1.2242427372759222e-06, "loss": 0.9207, "step": 1359 }, { "epoch": 0.1254757236766232, "grad_norm": 1.2764892118359368, "learning_rate": 1.2241892537594912e-06, "loss": 0.6415, "step": 1360 }, { "epoch": 0.1254757236766232, "eval_GEN Loss": 0.492832213640213, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.4038274884223938, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9268028736114502, "eval_runtime": 56.1999, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 1360 }, { "epoch": 0.12556798523815016, "grad_norm": 2.1026123520145767, "learning_rate": 1.2241357159435868e-06, "loss": 0.8027, "step": 1361 }, { "epoch": 0.12566024679967708, "grad_norm": 2.5842829641384437, "learning_rate": 1.2240821238330608e-06, "loss": 0.7074, "step": 1362 }, { "epoch": 0.12575250836120402, "grad_norm": 1.9007473539853121, "learning_rate": 1.2240284774327698e-06, "loss": 0.873, "step": 1363 }, { "epoch": 0.12584476992273094, "grad_norm": 2.5262611850282233, "learning_rate": 1.2239747767475752e-06, "loss": 0.6985, "step": 1364 }, { "epoch": 0.12593703148425786, "grad_norm": 2.2135095209477913, "learning_rate": 1.2239210217823435e-06, "loss": 0.9369, "step": 1365 }, { "epoch": 0.12593703148425786, "eval_GEN Loss": 0.49305102229118347, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.4163629710674286, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9364783763885498, "eval_runtime": 55.9229, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1365 }, { "epoch": 0.1260292930457848, "grad_norm": 1.8745471552444068, "learning_rate": 1.2238672125419462e-06, "loss": 0.6284, "step": 1366 }, { "epoch": 0.12612155460731173, "grad_norm": 2.8458876213877007, "learning_rate": 1.2238133490312594e-06, "loss": 0.8194, "step": 1367 }, { "epoch": 0.12621381616883864, "grad_norm": 1.9038505262417882, "learning_rate": 1.2237594312551644e-06, "loss": 0.8271, "step": 1368 }, { "epoch": 0.1263060777303656, "grad_norm": 1.6360322936279517, "learning_rate": 1.2237054592185475e-06, "loss": 0.8412, "step": 1369 }, { "epoch": 0.1263983392918925, "grad_norm": 2.344156408789055, "learning_rate": 1.2236514329262992e-06, "loss": 0.8236, "step": 1370 }, { "epoch": 0.1263983392918925, "eval_GEN Loss": 0.4930301010608673, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4327784776687622, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9435697197914124, "eval_runtime": 55.9203, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1370 }, { "epoch": 0.12649060085341945, "grad_norm": 1.6354513496716774, "learning_rate": 1.2235973523833156e-06, "loss": 0.6719, "step": 1371 }, { "epoch": 0.12658286241494637, "grad_norm": 2.511174037923046, "learning_rate": 1.223543217594498e-06, "loss": 0.7847, "step": 1372 }, { "epoch": 0.1266751239764733, "grad_norm": 2.3701663942762456, "learning_rate": 1.2234890285647518e-06, "loss": 1.0791, "step": 1373 }, { "epoch": 0.12676738553800024, "grad_norm": 1.7896499207358794, "learning_rate": 1.2234347852989881e-06, "loss": 0.9398, "step": 1374 }, { "epoch": 0.12685964709952716, "grad_norm": 2.4965286537941127, "learning_rate": 1.2233804878021218e-06, "loss": 0.9747, "step": 1375 }, { "epoch": 0.12685964709952716, "eval_GEN Loss": 0.4926159977912903, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4483198821544647, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9524038434028625, "eval_runtime": 56.9883, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1375 }, { "epoch": 0.12695190866105407, "grad_norm": 1.4924837656210077, "learning_rate": 1.223326136079074e-06, "loss": 0.6207, "step": 1376 }, { "epoch": 0.12704417022258102, "grad_norm": 3.2142046158407096, "learning_rate": 1.22327173013477e-06, "loss": 0.8013, "step": 1377 }, { "epoch": 0.12713643178410794, "grad_norm": 1.8665806346977394, "learning_rate": 1.22321726997414e-06, "loss": 0.7902, "step": 1378 }, { "epoch": 0.12722869334563489, "grad_norm": 1.6012907009929764, "learning_rate": 1.2231627556021196e-06, "loss": 0.8071, "step": 1379 }, { "epoch": 0.1273209549071618, "grad_norm": 1.6471852536792064, "learning_rate": 1.2231081870236487e-06, "loss": 0.6864, "step": 1380 }, { "epoch": 0.1273209549071618, "eval_GEN Loss": 0.4910682141780853, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.42695653438568115, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9421274065971375, "eval_runtime": 56.876, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1380 }, { "epoch": 0.12741321646868872, "grad_norm": 3.352318014291917, "learning_rate": 1.2230535642436722e-06, "loss": 0.8315, "step": 1381 }, { "epoch": 0.12750547803021567, "grad_norm": 1.856451818849259, "learning_rate": 1.2229988872671405e-06, "loss": 0.806, "step": 1382 }, { "epoch": 0.1275977395917426, "grad_norm": 2.5806734605644337, "learning_rate": 1.2229441560990085e-06, "loss": 0.9162, "step": 1383 }, { "epoch": 0.1276900011532695, "grad_norm": 1.4628711909970085, "learning_rate": 1.222889370744236e-06, "loss": 0.8331, "step": 1384 }, { "epoch": 0.12778226271479645, "grad_norm": 1.6707117807192426, "learning_rate": 1.2228345312077875e-06, "loss": 0.7961, "step": 1385 }, { "epoch": 0.12778226271479645, "eval_GEN Loss": 0.4901101589202881, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4238015413284302, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9219951629638672, "eval_runtime": 57.0429, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 1385 }, { "epoch": 0.12787452427632337, "grad_norm": 1.7394289318327385, "learning_rate": 1.2227796374946326e-06, "loss": 0.6722, "step": 1386 }, { "epoch": 0.12796678583785032, "grad_norm": 1.6752054740440538, "learning_rate": 1.222724689609746e-06, "loss": 0.9017, "step": 1387 }, { "epoch": 0.12805904739937723, "grad_norm": 2.077628593692242, "learning_rate": 1.2226696875581075e-06, "loss": 0.814, "step": 1388 }, { "epoch": 0.12815130896090415, "grad_norm": 2.8099615886878313, "learning_rate": 1.2226146313447009e-06, "loss": 0.9671, "step": 1389 }, { "epoch": 0.1282435705224311, "grad_norm": 2.0630872164343446, "learning_rate": 1.222559520974516e-06, "loss": 0.8071, "step": 1390 }, { "epoch": 0.1282435705224311, "eval_GEN Loss": 0.48906949162483215, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.40765708684921265, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9087740182876587, "eval_runtime": 57.318, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 1390 }, { "epoch": 0.12833583208395802, "grad_norm": 1.457275792782061, "learning_rate": 1.2225043564525465e-06, "loss": 0.6686, "step": 1391 }, { "epoch": 0.12842809364548494, "grad_norm": 2.1525328381332693, "learning_rate": 1.222449137783792e-06, "loss": 0.8122, "step": 1392 }, { "epoch": 0.12852035520701188, "grad_norm": 2.2700897179949786, "learning_rate": 1.222393864973256e-06, "loss": 1.0304, "step": 1393 }, { "epoch": 0.1286126167685388, "grad_norm": 2.6915181959518706, "learning_rate": 1.2223385380259478e-06, "loss": 0.8429, "step": 1394 }, { "epoch": 0.12870487833006575, "grad_norm": 2.2887944308865253, "learning_rate": 1.2222831569468808e-06, "loss": 0.7829, "step": 1395 }, { "epoch": 0.12870487833006575, "eval_GEN Loss": 0.48873692750930786, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM Loss": 0.4033927321434021, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9007812738418579, "eval_runtime": 55.9162, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1395 }, { "epoch": 0.12879713989159267, "grad_norm": 1.3869280208113692, "learning_rate": 1.2222277217410742e-06, "loss": 0.5959, "step": 1396 }, { "epoch": 0.12888940145311958, "grad_norm": 2.0303859235387063, "learning_rate": 1.2221722324135513e-06, "loss": 0.7309, "step": 1397 }, { "epoch": 0.12898166301464653, "grad_norm": 2.2558662821989826, "learning_rate": 1.2221166889693408e-06, "loss": 0.9391, "step": 1398 }, { "epoch": 0.12907392457617345, "grad_norm": 2.499820992030088, "learning_rate": 1.222061091413476e-06, "loss": 1.0213, "step": 1399 }, { "epoch": 0.12916618613770037, "grad_norm": 2.1620822515755163, "learning_rate": 1.2220054397509956e-06, "loss": 0.5987, "step": 1400 }, { "epoch": 0.12916618613770037, "eval_GEN Loss": 0.48808538913726807, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.394230455160141, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9165865182876587, "eval_runtime": 55.8693, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1400 }, { "epoch": 0.1292584476992273, "grad_norm": 1.8023173226208795, "learning_rate": 1.2219497339869422e-06, "loss": 0.8016, "step": 1401 }, { "epoch": 0.12935070926075423, "grad_norm": 1.4360042587144939, "learning_rate": 1.2218939741263645e-06, "loss": 0.7909, "step": 1402 }, { "epoch": 0.12944297082228118, "grad_norm": 2.2181041510646957, "learning_rate": 1.2218381601743152e-06, "loss": 0.82, "step": 1403 }, { "epoch": 0.1295352323838081, "grad_norm": 2.3711314095201597, "learning_rate": 1.2217822921358525e-06, "loss": 0.7794, "step": 1404 }, { "epoch": 0.12962749394533502, "grad_norm": 3.077543869031744, "learning_rate": 1.221726370016039e-06, "loss": 1.0432, "step": 1405 }, { "epoch": 0.12962749394533502, "eval_GEN Loss": 0.4886215031147003, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM Loss": 0.39263656735420227, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9164062738418579, "eval_runtime": 56.9822, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1405 }, { "epoch": 0.12971975550686196, "grad_norm": 1.493004898420434, "learning_rate": 1.2216703938199427e-06, "loss": 0.7421, "step": 1406 }, { "epoch": 0.12981201706838888, "grad_norm": 3.166827384383026, "learning_rate": 1.2216143635526363e-06, "loss": 0.9538, "step": 1407 }, { "epoch": 0.1299042786299158, "grad_norm": 2.080544775842973, "learning_rate": 1.221558279219197e-06, "loss": 0.8079, "step": 1408 }, { "epoch": 0.12999654019144274, "grad_norm": 2.0712815496356627, "learning_rate": 1.2215021408247073e-06, "loss": 0.8785, "step": 1409 }, { "epoch": 0.13008880175296966, "grad_norm": 2.2258005591246155, "learning_rate": 1.2214459483742548e-06, "loss": 0.9552, "step": 1410 }, { "epoch": 0.13008880175296966, "eval_GEN Loss": 0.4911350607872009, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 Neg": 0.5, "eval_PRM Loss": 0.39618173241615295, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.8948917984962463, "eval_runtime": 56.9222, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1410 }, { "epoch": 0.1301810633144966, "grad_norm": 1.725193134210622, "learning_rate": 1.2213897018729317e-06, "loss": 0.7585, "step": 1411 }, { "epoch": 0.13027332487602353, "grad_norm": 2.4539206060217524, "learning_rate": 1.221333401325835e-06, "loss": 0.8237, "step": 1412 }, { "epoch": 0.13036558643755045, "grad_norm": 2.4648471038553588, "learning_rate": 1.2212770467380668e-06, "loss": 1.0025, "step": 1413 }, { "epoch": 0.1304578479990774, "grad_norm": 1.943709308158613, "learning_rate": 1.2212206381147344e-06, "loss": 0.8606, "step": 1414 }, { "epoch": 0.1305501095606043, "grad_norm": 1.6151719683712205, "learning_rate": 1.221164175460949e-06, "loss": 0.8879, "step": 1415 }, { "epoch": 0.1305501095606043, "eval_GEN Loss": 0.49076810479164124, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.4118606150150299, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8805288672447205, "eval_runtime": 55.9309, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1415 }, { "epoch": 0.13064237112213123, "grad_norm": 1.8935609703014025, "learning_rate": 1.2211076587818276e-06, "loss": 1.0113, "step": 1416 }, { "epoch": 0.13073463268365818, "grad_norm": 1.7868360237988912, "learning_rate": 1.221051088082492e-06, "loss": 0.7498, "step": 1417 }, { "epoch": 0.1308268942451851, "grad_norm": 2.6406930623671157, "learning_rate": 1.2209944633680686e-06, "loss": 0.7203, "step": 1418 }, { "epoch": 0.13091915580671204, "grad_norm": 1.6732757519263721, "learning_rate": 1.2209377846436888e-06, "loss": 0.6282, "step": 1419 }, { "epoch": 0.13101141736823896, "grad_norm": 1.4389012831970156, "learning_rate": 1.220881051914489e-06, "loss": 0.6431, "step": 1420 }, { "epoch": 0.13101141736823896, "eval_GEN Loss": 0.4901523292064667, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4123425781726837, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8772836327552795, "eval_runtime": 55.8691, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1420 }, { "epoch": 0.13110367892976588, "grad_norm": 1.9077427061357575, "learning_rate": 1.2208242651856102e-06, "loss": 0.7044, "step": 1421 }, { "epoch": 0.13119594049129282, "grad_norm": 1.6201455051099196, "learning_rate": 1.2207674244621986e-06, "loss": 0.8841, "step": 1422 }, { "epoch": 0.13128820205281974, "grad_norm": 2.61301669288379, "learning_rate": 1.2207105297494054e-06, "loss": 0.907, "step": 1423 }, { "epoch": 0.13138046361434666, "grad_norm": 1.5551235813856161, "learning_rate": 1.2206535810523865e-06, "loss": 0.7483, "step": 1424 }, { "epoch": 0.1314727251758736, "grad_norm": 1.9306786971149377, "learning_rate": 1.220596578376302e-06, "loss": 0.7005, "step": 1425 }, { "epoch": 0.1314727251758736, "eval_GEN Loss": 0.48764145374298096, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3840732276439667, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8736779093742371, "eval_runtime": 56.0107, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1425 }, { "epoch": 0.13156498673740052, "grad_norm": 1.4270304714741135, "learning_rate": 1.2205395217263186e-06, "loss": 0.6763, "step": 1426 }, { "epoch": 0.13165724829892747, "grad_norm": 2.30788141561209, "learning_rate": 1.220482411107606e-06, "loss": 0.9192, "step": 1427 }, { "epoch": 0.1317495098604544, "grad_norm": 2.7212851138373955, "learning_rate": 1.2204252465253403e-06, "loss": 0.9717, "step": 1428 }, { "epoch": 0.1318417714219813, "grad_norm": 2.230544584496275, "learning_rate": 1.2203680279847014e-06, "loss": 0.8579, "step": 1429 }, { "epoch": 0.13193403298350825, "grad_norm": 1.640629308733161, "learning_rate": 1.2203107554908746e-06, "loss": 0.8892, "step": 1430 }, { "epoch": 0.13193403298350825, "eval_GEN Loss": 0.48576074838638306, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3708195686340332, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8837740421295166, "eval_runtime": 55.9978, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1430 }, { "epoch": 0.13202629454503517, "grad_norm": 2.8181086708700076, "learning_rate": 1.2202534290490503e-06, "loss": 0.7244, "step": 1431 }, { "epoch": 0.1321185561065621, "grad_norm": 2.2999219725297078, "learning_rate": 1.2201960486644233e-06, "loss": 0.6805, "step": 1432 }, { "epoch": 0.13221081766808904, "grad_norm": 3.036926360636184, "learning_rate": 1.2201386143421933e-06, "loss": 0.7745, "step": 1433 }, { "epoch": 0.13230307922961596, "grad_norm": 1.626070332283681, "learning_rate": 1.2200811260875653e-06, "loss": 0.7557, "step": 1434 }, { "epoch": 0.1323953407911429, "grad_norm": 2.9045959136378876, "learning_rate": 1.2200235839057491e-06, "loss": 0.9921, "step": 1435 }, { "epoch": 0.1323953407911429, "eval_GEN Loss": 0.48395654559135437, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3801724314689636, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8667067289352417, "eval_runtime": 55.9602, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1435 }, { "epoch": 0.13248760235266982, "grad_norm": 3.534488933557012, "learning_rate": 1.2199659878019593e-06, "loss": 1.0597, "step": 1436 }, { "epoch": 0.13257986391419674, "grad_norm": 1.9046011313670044, "learning_rate": 1.219908337781415e-06, "loss": 0.8453, "step": 1437 }, { "epoch": 0.13267212547572368, "grad_norm": 2.0757607966541696, "learning_rate": 1.2198506338493406e-06, "loss": 0.8751, "step": 1438 }, { "epoch": 0.1327643870372506, "grad_norm": 2.128683664799301, "learning_rate": 1.2197928760109658e-06, "loss": 0.7596, "step": 1439 }, { "epoch": 0.13285664859877752, "grad_norm": 2.487992956455477, "learning_rate": 1.2197350642715241e-06, "loss": 0.8282, "step": 1440 }, { "epoch": 0.13285664859877752, "eval_GEN Loss": 0.4832429587841034, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4173552095890045, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8638221025466919, "eval_runtime": 56.0343, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1440 }, { "epoch": 0.13294891016030447, "grad_norm": 2.2825361847454717, "learning_rate": 1.219677198636255e-06, "loss": 0.8686, "step": 1441 }, { "epoch": 0.13304117172183139, "grad_norm": 2.6788643263216123, "learning_rate": 1.2196192791104017e-06, "loss": 0.6179, "step": 1442 }, { "epoch": 0.13313343328335833, "grad_norm": 2.1012184128946236, "learning_rate": 1.2195613056992137e-06, "loss": 0.6893, "step": 1443 }, { "epoch": 0.13322569484488525, "grad_norm": 1.5552346137341364, "learning_rate": 1.2195032784079444e-06, "loss": 0.7452, "step": 1444 }, { "epoch": 0.13331795640641217, "grad_norm": 1.606597977368422, "learning_rate": 1.219445197241852e-06, "loss": 0.621, "step": 1445 }, { "epoch": 0.13331795640641217, "eval_GEN Loss": 0.4831272065639496, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.441954642534256, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8729567527770996, "eval_runtime": 57.0335, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1445 }, { "epoch": 0.13341021796793912, "grad_norm": 1.89406867652153, "learning_rate": 1.2193870622062004e-06, "loss": 0.7446, "step": 1446 }, { "epoch": 0.13350247952946603, "grad_norm": 3.2388273648052297, "learning_rate": 1.2193288733062574e-06, "loss": 0.921, "step": 1447 }, { "epoch": 0.13359474109099295, "grad_norm": 3.0643457878600135, "learning_rate": 1.2192706305472965e-06, "loss": 0.9296, "step": 1448 }, { "epoch": 0.1336870026525199, "grad_norm": 1.6532173075171206, "learning_rate": 1.2192123339345957e-06, "loss": 0.786, "step": 1449 }, { "epoch": 0.13377926421404682, "grad_norm": 1.717418204393591, "learning_rate": 1.2191539834734378e-06, "loss": 0.7298, "step": 1450 }, { "epoch": 0.13377926421404682, "eval_GEN Loss": 0.48509472608566284, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4426087737083435, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8865384459495544, "eval_runtime": 55.9, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1450 }, { "epoch": 0.13387152577557376, "grad_norm": 1.7870663859688258, "learning_rate": 1.2190955791691108e-06, "loss": 0.6784, "step": 1451 }, { "epoch": 0.13396378733710068, "grad_norm": 1.7480168937710523, "learning_rate": 1.2190371210269075e-06, "loss": 0.7037, "step": 1452 }, { "epoch": 0.1340560488986276, "grad_norm": 1.8071013731005843, "learning_rate": 1.218978609052125e-06, "loss": 0.8095, "step": 1453 }, { "epoch": 0.13414831046015455, "grad_norm": 3.023351955770835, "learning_rate": 1.218920043250066e-06, "loss": 0.991, "step": 1454 }, { "epoch": 0.13424057202168146, "grad_norm": 2.034217737011871, "learning_rate": 1.2188614236260378e-06, "loss": 0.7052, "step": 1455 }, { "epoch": 0.13424057202168146, "eval_GEN Loss": 0.48578301072120667, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.43944641947746277, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8933894038200378, "eval_runtime": 57.0451, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 1455 }, { "epoch": 0.13433283358320838, "grad_norm": 1.7513297937120134, "learning_rate": 1.2188027501853527e-06, "loss": 0.9649, "step": 1456 }, { "epoch": 0.13442509514473533, "grad_norm": 2.1796927369703702, "learning_rate": 1.218744022933328e-06, "loss": 0.6808, "step": 1457 }, { "epoch": 0.13451735670626225, "grad_norm": 1.5648907930871407, "learning_rate": 1.2186852418752851e-06, "loss": 0.8168, "step": 1458 }, { "epoch": 0.1346096182677892, "grad_norm": 2.659296652822949, "learning_rate": 1.218626407016551e-06, "loss": 0.8799, "step": 1459 }, { "epoch": 0.1347018798293161, "grad_norm": 1.6903040043421167, "learning_rate": 1.2185675183624577e-06, "loss": 0.9248, "step": 1460 }, { "epoch": 0.1347018798293161, "eval_GEN Loss": 0.4877380132675171, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.42827802896499634, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.907151460647583, "eval_runtime": 57.0855, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 1460 }, { "epoch": 0.13479414139084303, "grad_norm": 2.2399104560871024, "learning_rate": 1.2185085759183416e-06, "loss": 0.9153, "step": 1461 }, { "epoch": 0.13488640295236998, "grad_norm": 1.5843009173873546, "learning_rate": 1.2184495796895441e-06, "loss": 0.585, "step": 1462 }, { "epoch": 0.1349786645138969, "grad_norm": 1.540416191368777, "learning_rate": 1.2183905296814116e-06, "loss": 0.7705, "step": 1463 }, { "epoch": 0.13507092607542381, "grad_norm": 1.5800918821585193, "learning_rate": 1.2183314258992953e-06, "loss": 0.8058, "step": 1464 }, { "epoch": 0.13516318763695076, "grad_norm": 2.6540944037546295, "learning_rate": 1.2182722683485511e-06, "loss": 0.8014, "step": 1465 }, { "epoch": 0.13516318763695076, "eval_GEN Loss": 0.4897516071796417, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.43161651492118835, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.909254789352417, "eval_runtime": 57.121, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 1465 }, { "epoch": 0.13525544919847768, "grad_norm": 2.555886509779221, "learning_rate": 1.2182130570345404e-06, "loss": 0.8484, "step": 1466 }, { "epoch": 0.13534771076000462, "grad_norm": 1.6730850578977305, "learning_rate": 1.2181537919626284e-06, "loss": 0.8389, "step": 1467 }, { "epoch": 0.13543997232153154, "grad_norm": 2.340466897164336, "learning_rate": 1.2180944731381864e-06, "loss": 0.6125, "step": 1468 }, { "epoch": 0.13553223388305846, "grad_norm": 2.3124459269800606, "learning_rate": 1.2180351005665897e-06, "loss": 0.8138, "step": 1469 }, { "epoch": 0.1356244954445854, "grad_norm": 1.8353511605355965, "learning_rate": 1.2179756742532187e-06, "loss": 0.7342, "step": 1470 }, { "epoch": 0.1356244954445854, "eval_GEN Loss": 0.49066561460494995, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.41019701957702637, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9172475934028625, "eval_runtime": 57.0038, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1470 }, { "epoch": 0.13571675700611233, "grad_norm": 2.8703132324935763, "learning_rate": 1.2179161942034587e-06, "loss": 0.7313, "step": 1471 }, { "epoch": 0.13580901856763924, "grad_norm": 1.4823664860463994, "learning_rate": 1.2178566604226999e-06, "loss": 0.7206, "step": 1472 }, { "epoch": 0.1359012801291662, "grad_norm": 2.5045616762517238, "learning_rate": 1.2177970729163374e-06, "loss": 0.6631, "step": 1473 }, { "epoch": 0.1359935416906931, "grad_norm": 1.797659550845175, "learning_rate": 1.217737431689771e-06, "loss": 0.845, "step": 1474 }, { "epoch": 0.13608580325222006, "grad_norm": 1.7472275102991048, "learning_rate": 1.2176777367484058e-06, "loss": 0.7978, "step": 1475 }, { "epoch": 0.13608580325222006, "eval_GEN Loss": 0.48971661925315857, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3996686339378357, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9207331538200378, "eval_runtime": 56.8658, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1475 }, { "epoch": 0.13617806481374697, "grad_norm": 2.3145155051067117, "learning_rate": 1.217617988097651e-06, "loss": 1.0098, "step": 1476 }, { "epoch": 0.1362703263752739, "grad_norm": 1.7676781476663201, "learning_rate": 1.2175581857429212e-06, "loss": 0.7219, "step": 1477 }, { "epoch": 0.13636258793680084, "grad_norm": 2.1027275664909144, "learning_rate": 1.2174983296896362e-06, "loss": 0.6974, "step": 1478 }, { "epoch": 0.13645484949832776, "grad_norm": 1.677411819562967, "learning_rate": 1.2174384199432198e-06, "loss": 0.6773, "step": 1479 }, { "epoch": 0.13654711105985468, "grad_norm": 1.401378609734081, "learning_rate": 1.2173784565091013e-06, "loss": 0.6816, "step": 1480 }, { "epoch": 0.13654711105985468, "eval_GEN Loss": 0.4899117350578308, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41072383522987366, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9126802682876587, "eval_runtime": 56.8851, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1480 }, { "epoch": 0.13663937262138162, "grad_norm": 3.1739626128379514, "learning_rate": 1.2173184393927146e-06, "loss": 1.0342, "step": 1481 }, { "epoch": 0.13673163418290854, "grad_norm": 2.1981313502484006, "learning_rate": 1.2172583685994987e-06, "loss": 0.9485, "step": 1482 }, { "epoch": 0.1368238957444355, "grad_norm": 1.2383898111735496, "learning_rate": 1.217198244134897e-06, "loss": 0.7046, "step": 1483 }, { "epoch": 0.1369161573059624, "grad_norm": 2.5278187196321085, "learning_rate": 1.2171380660043586e-06, "loss": 0.6783, "step": 1484 }, { "epoch": 0.13700841886748932, "grad_norm": 1.9326352047414406, "learning_rate": 1.2170778342133365e-06, "loss": 0.8354, "step": 1485 }, { "epoch": 0.13700841886748932, "eval_GEN Loss": 0.4875543415546417, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.4324727952480316, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9129206538200378, "eval_runtime": 56.9608, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1485 }, { "epoch": 0.13710068042901627, "grad_norm": 2.016188506648634, "learning_rate": 1.217017548767289e-06, "loss": 0.8474, "step": 1486 }, { "epoch": 0.1371929419905432, "grad_norm": 1.8314060510452763, "learning_rate": 1.2169572096716794e-06, "loss": 0.9059, "step": 1487 }, { "epoch": 0.1372852035520701, "grad_norm": 1.6984189460823083, "learning_rate": 1.2168968169319758e-06, "loss": 0.6674, "step": 1488 }, { "epoch": 0.13737746511359705, "grad_norm": 2.6395713682345163, "learning_rate": 1.216836370553651e-06, "loss": 0.8628, "step": 1489 }, { "epoch": 0.13746972667512397, "grad_norm": 1.9000009573257397, "learning_rate": 1.2167758705421827e-06, "loss": 0.911, "step": 1490 }, { "epoch": 0.13746972667512397, "eval_GEN Loss": 0.4862188994884491, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.42939531803131104, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9112980961799622, "eval_runtime": 56.904, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1490 }, { "epoch": 0.13756198823665092, "grad_norm": 1.940560206516826, "learning_rate": 1.2167153169030536e-06, "loss": 1.0167, "step": 1491 }, { "epoch": 0.13765424979817784, "grad_norm": 1.7804113668872108, "learning_rate": 1.216654709641751e-06, "loss": 0.8197, "step": 1492 }, { "epoch": 0.13774651135970475, "grad_norm": 1.870396973825811, "learning_rate": 1.2165940487637672e-06, "loss": 0.8109, "step": 1493 }, { "epoch": 0.1378387729212317, "grad_norm": 1.783129166529002, "learning_rate": 1.2165333342745997e-06, "loss": 0.8711, "step": 1494 }, { "epoch": 0.13793103448275862, "grad_norm": 1.6537272729529997, "learning_rate": 1.2164725661797505e-06, "loss": 0.6381, "step": 1495 }, { "epoch": 0.13793103448275862, "eval_GEN Loss": 0.48459392786026, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.4264398217201233, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9077523946762085, "eval_runtime": 55.9849, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1495 }, { "epoch": 0.13802329604428554, "grad_norm": 1.7188956810123366, "learning_rate": 1.2164117444847262e-06, "loss": 0.8818, "step": 1496 }, { "epoch": 0.13811555760581248, "grad_norm": 1.968972988950428, "learning_rate": 1.2163508691950387e-06, "loss": 0.813, "step": 1497 }, { "epoch": 0.1382078191673394, "grad_norm": 2.160000707263368, "learning_rate": 1.2162899403162046e-06, "loss": 0.5748, "step": 1498 }, { "epoch": 0.13830008072886635, "grad_norm": 2.382010283993841, "learning_rate": 1.2162289578537457e-06, "loss": 0.7955, "step": 1499 }, { "epoch": 0.13839234229039327, "grad_norm": 1.495369182403971, "learning_rate": 1.2161679218131877e-06, "loss": 0.7968, "step": 1500 }, { "epoch": 0.13839234229039327, "eval_GEN Loss": 0.48590993881225586, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41839560866355896, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9126201868057251, "eval_runtime": 55.8859, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1500 }, { "epoch": 0.13848460385192018, "grad_norm": 1.7812087696351404, "learning_rate": 1.216106832200062e-06, "loss": 0.732, "step": 1501 }, { "epoch": 0.13857686541344713, "grad_norm": 2.1991333275716305, "learning_rate": 1.2160456890199052e-06, "loss": 0.9506, "step": 1502 }, { "epoch": 0.13866912697497405, "grad_norm": 2.8191440678976973, "learning_rate": 1.2159844922782575e-06, "loss": 0.8977, "step": 1503 }, { "epoch": 0.13876138853650097, "grad_norm": 2.3006810473425205, "learning_rate": 1.2159232419806649e-06, "loss": 0.8017, "step": 1504 }, { "epoch": 0.13885365009802791, "grad_norm": 2.5897149997967532, "learning_rate": 1.2158619381326778e-06, "loss": 0.902, "step": 1505 }, { "epoch": 0.13885365009802791, "eval_GEN Loss": 0.48909762501716614, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.42517611384391785, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9254207015037537, "eval_runtime": 55.9005, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1505 }, { "epoch": 0.13894591165955483, "grad_norm": 1.6344563329401594, "learning_rate": 1.215800580739852e-06, "loss": 0.8441, "step": 1506 }, { "epoch": 0.13903817322108178, "grad_norm": 2.1475173191522052, "learning_rate": 1.2157391698077477e-06, "loss": 0.9089, "step": 1507 }, { "epoch": 0.1391304347826087, "grad_norm": 2.188858630147719, "learning_rate": 1.21567770534193e-06, "loss": 0.9531, "step": 1508 }, { "epoch": 0.13922269634413562, "grad_norm": 1.2498198125794533, "learning_rate": 1.2156161873479688e-06, "loss": 0.6935, "step": 1509 }, { "epoch": 0.13931495790566256, "grad_norm": 3.1222719593071524, "learning_rate": 1.2155546158314391e-06, "loss": 1.0682, "step": 1510 }, { "epoch": 0.13931495790566256, "eval_GEN Loss": 0.4886327385902405, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.43589362502098083, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9278846383094788, "eval_runtime": 56.8024, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1510 }, { "epoch": 0.13940721946718948, "grad_norm": 1.6876532513309759, "learning_rate": 1.2154929907979207e-06, "loss": 0.9661, "step": 1511 }, { "epoch": 0.1394994810287164, "grad_norm": 2.3098677426370844, "learning_rate": 1.2154313122529979e-06, "loss": 0.9075, "step": 1512 }, { "epoch": 0.13959174259024335, "grad_norm": 1.5925941919284827, "learning_rate": 1.2153695802022603e-06, "loss": 0.7232, "step": 1513 }, { "epoch": 0.13968400415177026, "grad_norm": 2.07332708079127, "learning_rate": 1.215307794651302e-06, "loss": 0.6794, "step": 1514 }, { "epoch": 0.1397762657132972, "grad_norm": 1.5762825942969272, "learning_rate": 1.2152459556057221e-06, "loss": 0.6641, "step": 1515 }, { "epoch": 0.1397762657132972, "eval_GEN Loss": 0.4870279133319855, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4536207914352417, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9316706657409668, "eval_runtime": 56.648, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 1515 }, { "epoch": 0.13986852727482413, "grad_norm": 1.480708156546866, "learning_rate": 1.2151840630711249e-06, "loss": 0.7197, "step": 1516 }, { "epoch": 0.13996078883635105, "grad_norm": 2.5720173893902976, "learning_rate": 1.2151221170531186e-06, "loss": 0.9796, "step": 1517 }, { "epoch": 0.140053050397878, "grad_norm": 1.5842240024501602, "learning_rate": 1.2150601175573173e-06, "loss": 0.6834, "step": 1518 }, { "epoch": 0.1401453119594049, "grad_norm": 1.9219813009605233, "learning_rate": 1.2149980645893397e-06, "loss": 0.8441, "step": 1519 }, { "epoch": 0.14023757352093183, "grad_norm": 1.9267743882787396, "learning_rate": 1.2149359581548084e-06, "loss": 0.8574, "step": 1520 }, { "epoch": 0.14023757352093183, "eval_GEN Loss": 0.4875936806201935, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.46150749921798706, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9364783763885498, "eval_runtime": 56.8273, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1520 }, { "epoch": 0.14032983508245878, "grad_norm": 2.5934660350263643, "learning_rate": 1.2148737982593522e-06, "loss": 0.8217, "step": 1521 }, { "epoch": 0.1404220966439857, "grad_norm": 1.7778069422397285, "learning_rate": 1.2148115849086039e-06, "loss": 0.8128, "step": 1522 }, { "epoch": 0.14051435820551264, "grad_norm": 1.9120964058598204, "learning_rate": 1.2147493181082014e-06, "loss": 0.6522, "step": 1523 }, { "epoch": 0.14060661976703956, "grad_norm": 1.7316037392769772, "learning_rate": 1.2146869978637874e-06, "loss": 0.8323, "step": 1524 }, { "epoch": 0.14069888132856648, "grad_norm": 2.2877225371734435, "learning_rate": 1.2146246241810094e-06, "loss": 0.7117, "step": 1525 }, { "epoch": 0.14069888132856648, "eval_GEN Loss": 0.48820412158966064, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 Neg": 0.52, "eval_PRM Loss": 0.45991775393486023, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9534855484962463, "eval_runtime": 56.8446, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1525 }, { "epoch": 0.14079114289009342, "grad_norm": 1.3918306824776139, "learning_rate": 1.21456219706552e-06, "loss": 0.715, "step": 1526 }, { "epoch": 0.14088340445162034, "grad_norm": 1.4411090798512138, "learning_rate": 1.2144997165229764e-06, "loss": 0.7589, "step": 1527 }, { "epoch": 0.14097566601314726, "grad_norm": 1.7806133121953431, "learning_rate": 1.2144371825590404e-06, "loss": 0.7439, "step": 1528 }, { "epoch": 0.1410679275746742, "grad_norm": 3.8133716362518717, "learning_rate": 1.2143745951793792e-06, "loss": 0.9046, "step": 1529 }, { "epoch": 0.14116018913620113, "grad_norm": 1.8334556072347568, "learning_rate": 1.2143119543896645e-06, "loss": 0.8661, "step": 1530 }, { "epoch": 0.14116018913620113, "eval_GEN Loss": 0.48858997225761414, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 Neg": 0.52, "eval_PRM Loss": 0.4668982923030853, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9585336446762085, "eval_runtime": 56.8617, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1530 }, { "epoch": 0.14125245069772807, "grad_norm": 2.1977085918394224, "learning_rate": 1.214249260195573e-06, "loss": 0.8644, "step": 1531 }, { "epoch": 0.141344712259255, "grad_norm": 4.325783037130388, "learning_rate": 1.2141865126027859e-06, "loss": 1.0033, "step": 1532 }, { "epoch": 0.1414369738207819, "grad_norm": 1.920480883036466, "learning_rate": 1.2141237116169897e-06, "loss": 0.9399, "step": 1533 }, { "epoch": 0.14152923538230885, "grad_norm": 2.1268793254030114, "learning_rate": 1.2140608572438753e-06, "loss": 0.9536, "step": 1534 }, { "epoch": 0.14162149694383577, "grad_norm": 1.6851987626291, "learning_rate": 1.213997949489139e-06, "loss": 0.8608, "step": 1535 }, { "epoch": 0.14162149694383577, "eval_GEN Loss": 0.4883213937282562, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.4781765937805176, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.957932710647583, "eval_runtime": 56.8715, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1535 }, { "epoch": 0.1417137585053627, "grad_norm": 1.8035419546136695, "learning_rate": 1.2139349883584813e-06, "loss": 0.6354, "step": 1536 }, { "epoch": 0.14180602006688964, "grad_norm": 2.2774576257316537, "learning_rate": 1.2138719738576082e-06, "loss": 0.8053, "step": 1537 }, { "epoch": 0.14189828162841656, "grad_norm": 1.7243372664491499, "learning_rate": 1.2138089059922298e-06, "loss": 0.819, "step": 1538 }, { "epoch": 0.1419905431899435, "grad_norm": 1.7654585989184457, "learning_rate": 1.2137457847680615e-06, "loss": 1.1385, "step": 1539 }, { "epoch": 0.14208280475147042, "grad_norm": 1.791716423273646, "learning_rate": 1.2136826101908235e-06, "loss": 0.6427, "step": 1540 }, { "epoch": 0.14208280475147042, "eval_GEN Loss": 0.48769626021385193, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 Neg": 0.52, "eval_PRM Loss": 0.4586150050163269, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9599158763885498, "eval_runtime": 56.7674, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1540 }, { "epoch": 0.14217506631299734, "grad_norm": 2.6113178827100123, "learning_rate": 1.2136193822662408e-06, "loss": 0.8815, "step": 1541 }, { "epoch": 0.14226732787452429, "grad_norm": 2.27231942686477, "learning_rate": 1.213556101000043e-06, "loss": 0.8198, "step": 1542 }, { "epoch": 0.1423595894360512, "grad_norm": 1.7440396558376248, "learning_rate": 1.213492766397965e-06, "loss": 0.681, "step": 1543 }, { "epoch": 0.14245185099757812, "grad_norm": 1.9289662225514435, "learning_rate": 1.2134293784657463e-06, "loss": 0.9392, "step": 1544 }, { "epoch": 0.14254411255910507, "grad_norm": 2.015619872344053, "learning_rate": 1.2133659372091313e-06, "loss": 0.9288, "step": 1545 }, { "epoch": 0.14254411255910507, "eval_GEN Loss": 0.4858710467815399, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM Loss": 0.4427182078361511, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9689303040504456, "eval_runtime": 56.714, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 1545 }, { "epoch": 0.142636374120632, "grad_norm": 1.7083452678678301, "learning_rate": 1.213302442633869e-06, "loss": 0.7585, "step": 1546 }, { "epoch": 0.14272863568215893, "grad_norm": 1.7437547134384943, "learning_rate": 1.213238894745713e-06, "loss": 0.5721, "step": 1547 }, { "epoch": 0.14282089724368585, "grad_norm": 1.6264445760393105, "learning_rate": 1.2131752935504223e-06, "loss": 0.804, "step": 1548 }, { "epoch": 0.14291315880521277, "grad_norm": 3.0483329518966347, "learning_rate": 1.2131116390537612e-06, "loss": 0.9359, "step": 1549 }, { "epoch": 0.14300542036673972, "grad_norm": 1.4994529197445892, "learning_rate": 1.2130479312614973e-06, "loss": 0.7795, "step": 1550 }, { "epoch": 0.14300542036673972, "eval_GEN Loss": 0.4825584888458252, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM Loss": 0.4122474491596222, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9410457015037537, "eval_runtime": 56.6267, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 1550 }, { "epoch": 0.14309768192826663, "grad_norm": 2.03221205648812, "learning_rate": 1.2129841701794044e-06, "loss": 0.5885, "step": 1551 }, { "epoch": 0.14318994348979355, "grad_norm": 1.796864093783121, "learning_rate": 1.2129203558132604e-06, "loss": 0.6886, "step": 1552 }, { "epoch": 0.1432822050513205, "grad_norm": 1.5117740616104873, "learning_rate": 1.2128564881688486e-06, "loss": 0.8127, "step": 1553 }, { "epoch": 0.14337446661284742, "grad_norm": 1.9128950440003294, "learning_rate": 1.2127925672519564e-06, "loss": 0.6823, "step": 1554 }, { "epoch": 0.14346672817437436, "grad_norm": 2.221095276125673, "learning_rate": 1.2127285930683766e-06, "loss": 0.9162, "step": 1555 }, { "epoch": 0.14346672817437436, "eval_GEN Loss": 0.48015135526657104, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4164435565471649, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9243990182876587, "eval_runtime": 56.8141, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1555 }, { "epoch": 0.14355898973590128, "grad_norm": 1.6199425103379719, "learning_rate": 1.2126645656239064e-06, "loss": 0.929, "step": 1556 }, { "epoch": 0.1436512512974282, "grad_norm": 1.617495758978593, "learning_rate": 1.2126004849243485e-06, "loss": 0.7732, "step": 1557 }, { "epoch": 0.14374351285895515, "grad_norm": 2.5232182449527536, "learning_rate": 1.2125363509755098e-06, "loss": 0.8469, "step": 1558 }, { "epoch": 0.14383577442048207, "grad_norm": 1.8377351016379688, "learning_rate": 1.212472163783202e-06, "loss": 0.6864, "step": 1559 }, { "epoch": 0.14392803598200898, "grad_norm": 1.561310611356702, "learning_rate": 1.212407923353242e-06, "loss": 0.5072, "step": 1560 }, { "epoch": 0.14392803598200898, "eval_GEN Loss": 0.47932034730911255, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.41043820977211, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.926682710647583, "eval_runtime": 56.9817, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1560 }, { "epoch": 0.14402029754353593, "grad_norm": 2.1865153012788716, "learning_rate": 1.2123436296914514e-06, "loss": 0.8404, "step": 1561 }, { "epoch": 0.14411255910506285, "grad_norm": 1.4396843867341758, "learning_rate": 1.2122792828036566e-06, "loss": 0.7448, "step": 1562 }, { "epoch": 0.1442048206665898, "grad_norm": 2.4406187017441305, "learning_rate": 1.212214882695689e-06, "loss": 0.7268, "step": 1563 }, { "epoch": 0.1442970822281167, "grad_norm": 2.331673626795673, "learning_rate": 1.2121504293733843e-06, "loss": 0.7616, "step": 1564 }, { "epoch": 0.14438934378964363, "grad_norm": 1.4222004672390411, "learning_rate": 1.2120859228425835e-06, "loss": 0.6549, "step": 1565 }, { "epoch": 0.14438934378964363, "eval_GEN Loss": 0.4810382127761841, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM Loss": 0.39960551261901855, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9530048370361328, "eval_runtime": 56.7626, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1565 }, { "epoch": 0.14448160535117058, "grad_norm": 1.5144381910161673, "learning_rate": 1.2120213631091322e-06, "loss": 0.6392, "step": 1566 }, { "epoch": 0.1445738669126975, "grad_norm": 1.5191413241489855, "learning_rate": 1.211956750178881e-06, "loss": 0.724, "step": 1567 }, { "epoch": 0.14466612847422441, "grad_norm": 1.5331338319160501, "learning_rate": 1.2118920840576853e-06, "loss": 0.7858, "step": 1568 }, { "epoch": 0.14475839003575136, "grad_norm": 1.6681354517322655, "learning_rate": 1.2118273647514054e-06, "loss": 0.7343, "step": 1569 }, { "epoch": 0.14485065159727828, "grad_norm": 2.6359620666061736, "learning_rate": 1.2117625922659057e-06, "loss": 0.7797, "step": 1570 }, { "epoch": 0.14485065159727828, "eval_GEN Loss": 0.48034995794296265, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9058823529411765, "eval_PRM F1 AUC": 0.746464117338921, "eval_PRM F1 Neg": 0.6190476190476191, "eval_PRM Loss": 0.39335888624191284, "eval_PRM NPV": 0.6842105263157895, "eval_PRM Precision": 0.8850574712643678, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9628605842590332, "eval_runtime": 56.8155, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1570 }, { "epoch": 0.14494291315880523, "grad_norm": 1.815111611079528, "learning_rate": 1.2116977666070564e-06, "loss": 0.8399, "step": 1571 }, { "epoch": 0.14503517472033214, "grad_norm": 2.564024454609857, "learning_rate": 1.211632887780732e-06, "loss": 0.816, "step": 1572 }, { "epoch": 0.14512743628185906, "grad_norm": 2.1408366599577984, "learning_rate": 1.211567955792812e-06, "loss": 0.6796, "step": 1573 }, { "epoch": 0.145219697843386, "grad_norm": 1.6763765475188022, "learning_rate": 1.2115029706491804e-06, "loss": 0.6421, "step": 1574 }, { "epoch": 0.14531195940491293, "grad_norm": 2.6073873782420476, "learning_rate": 1.2114379323557266e-06, "loss": 0.7641, "step": 1575 }, { "epoch": 0.14531195940491293, "eval_GEN Loss": 0.477909654378891, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM Loss": 0.3995104730129242, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9445913434028625, "eval_runtime": 56.7706, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1575 }, { "epoch": 0.14540422096643985, "grad_norm": 1.7960350045434368, "learning_rate": 1.2113728409183441e-06, "loss": 1.0443, "step": 1576 }, { "epoch": 0.1454964825279668, "grad_norm": 2.2135505447891433, "learning_rate": 1.211307696342932e-06, "loss": 0.6969, "step": 1577 }, { "epoch": 0.1455887440894937, "grad_norm": 1.8917194674305324, "learning_rate": 1.2112424986353934e-06, "loss": 0.8017, "step": 1578 }, { "epoch": 0.14568100565102066, "grad_norm": 1.7442166552375302, "learning_rate": 1.211177247801637e-06, "loss": 0.9089, "step": 1579 }, { "epoch": 0.14577326721254757, "grad_norm": 1.9222757837622877, "learning_rate": 1.2111119438475758e-06, "loss": 0.7088, "step": 1580 }, { "epoch": 0.14577326721254757, "eval_GEN Loss": 0.4757411479949951, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM Loss": 0.39801672101020813, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9429086446762085, "eval_runtime": 56.9673, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1580 }, { "epoch": 0.1458655287740745, "grad_norm": 1.8373254696524093, "learning_rate": 1.2110465867791275e-06, "loss": 0.9386, "step": 1581 }, { "epoch": 0.14595779033560144, "grad_norm": 2.084647192251181, "learning_rate": 1.2109811766022153e-06, "loss": 0.8144, "step": 1582 }, { "epoch": 0.14605005189712836, "grad_norm": 2.3870932416535933, "learning_rate": 1.2109157133227662e-06, "loss": 0.9397, "step": 1583 }, { "epoch": 0.14614231345865528, "grad_norm": 1.777806736041665, "learning_rate": 1.2108501969467132e-06, "loss": 0.7087, "step": 1584 }, { "epoch": 0.14623457502018222, "grad_norm": 2.276862066058128, "learning_rate": 1.2107846274799932e-06, "loss": 0.71, "step": 1585 }, { "epoch": 0.14623457502018222, "eval_GEN Loss": 0.47742316126823425, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM Loss": 0.39713582396507263, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.95703125, "eval_runtime": 56.7561, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1585 }, { "epoch": 0.14632683658170914, "grad_norm": 2.3895934805555155, "learning_rate": 1.2107190049285478e-06, "loss": 0.7321, "step": 1586 }, { "epoch": 0.1464190981432361, "grad_norm": 1.4390572125615302, "learning_rate": 1.2106533292983247e-06, "loss": 0.7152, "step": 1587 }, { "epoch": 0.146511359704763, "grad_norm": 2.096151784511048, "learning_rate": 1.2105876005952749e-06, "loss": 0.898, "step": 1588 }, { "epoch": 0.14660362126628992, "grad_norm": 1.6431998302958275, "learning_rate": 1.210521818825355e-06, "loss": 0.7141, "step": 1589 }, { "epoch": 0.14669588282781687, "grad_norm": 1.7248784796130232, "learning_rate": 1.2104559839945261e-06, "loss": 1.0005, "step": 1590 }, { "epoch": 0.14669588282781687, "eval_GEN Loss": 0.47937461733818054, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM Loss": 0.40157634019851685, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9463942050933838, "eval_runtime": 56.8058, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1590 }, { "epoch": 0.1467881443893438, "grad_norm": 1.4031303818781538, "learning_rate": 1.2103900961087547e-06, "loss": 0.6271, "step": 1591 }, { "epoch": 0.1468804059508707, "grad_norm": 1.744541248195711, "learning_rate": 1.2103241551740114e-06, "loss": 0.6399, "step": 1592 }, { "epoch": 0.14697266751239765, "grad_norm": 1.4339104648237544, "learning_rate": 1.2102581611962715e-06, "loss": 0.7929, "step": 1593 }, { "epoch": 0.14706492907392457, "grad_norm": 1.4630138411701694, "learning_rate": 1.2101921141815163e-06, "loss": 0.7397, "step": 1594 }, { "epoch": 0.14715719063545152, "grad_norm": 1.4826477252971642, "learning_rate": 1.2101260141357302e-06, "loss": 0.8408, "step": 1595 }, { "epoch": 0.14715719063545152, "eval_GEN Loss": 0.48221975564956665, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM Loss": 0.4121546149253845, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.948437511920929, "eval_runtime": 56.0388, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1595 }, { "epoch": 0.14724945219697844, "grad_norm": 1.8944713991231408, "learning_rate": 1.210059861064904e-06, "loss": 0.8403, "step": 1596 }, { "epoch": 0.14734171375850535, "grad_norm": 1.4630907452130664, "learning_rate": 1.2099936549750318e-06, "loss": 0.7839, "step": 1597 }, { "epoch": 0.1474339753200323, "grad_norm": 1.3507923187890327, "learning_rate": 1.2099273958721142e-06, "loss": 0.6461, "step": 1598 }, { "epoch": 0.14752623688155922, "grad_norm": 1.7681718189083817, "learning_rate": 1.2098610837621552e-06, "loss": 0.9491, "step": 1599 }, { "epoch": 0.14761849844308614, "grad_norm": 1.7883526947799715, "learning_rate": 1.2097947186511641e-06, "loss": 0.9205, "step": 1600 }, { "epoch": 0.14761849844308614, "eval_GEN Loss": 0.48528167605400085, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.42186102271080017, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9498798251152039, "eval_runtime": 55.7531, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 1600 }, { "epoch": 0.14771076000461308, "grad_norm": 1.7554929817074767, "learning_rate": 1.2097283005451555e-06, "loss": 0.913, "step": 1601 }, { "epoch": 0.14780302156614, "grad_norm": 1.539366146174878, "learning_rate": 1.2096618294501476e-06, "loss": 0.7369, "step": 1602 }, { "epoch": 0.14789528312766695, "grad_norm": 1.5570817115421292, "learning_rate": 1.2095953053721645e-06, "loss": 0.673, "step": 1603 }, { "epoch": 0.14798754468919387, "grad_norm": 1.4719215916664423, "learning_rate": 1.2095287283172346e-06, "loss": 0.6456, "step": 1604 }, { "epoch": 0.14807980625072079, "grad_norm": 1.6580542575424595, "learning_rate": 1.2094620982913914e-06, "loss": 0.7629, "step": 1605 }, { "epoch": 0.14807980625072079, "eval_GEN Loss": 0.4843921363353729, "eval_GEN top-5 accuracy": 0.9785181937746602, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.429315984249115, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9508413672447205, "eval_runtime": 55.8532, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1605 }, { "epoch": 0.14817206781224773, "grad_norm": 1.4995954682971415, "learning_rate": 1.209395415300673e-06, "loss": 0.729, "step": 1606 }, { "epoch": 0.14826432937377465, "grad_norm": 1.8353140264749694, "learning_rate": 1.209328679351122e-06, "loss": 0.6965, "step": 1607 }, { "epoch": 0.14835659093530157, "grad_norm": 2.320723749388007, "learning_rate": 1.2092618904487863e-06, "loss": 1.1059, "step": 1608 }, { "epoch": 0.14844885249682852, "grad_norm": 1.591344939349978, "learning_rate": 1.2091950485997184e-06, "loss": 0.7887, "step": 1609 }, { "epoch": 0.14854111405835543, "grad_norm": 2.3945639293802827, "learning_rate": 1.2091281538099758e-06, "loss": 0.8983, "step": 1610 }, { "epoch": 0.14854111405835543, "eval_GEN Loss": 0.48569273948669434, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.4210745394229889, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9552884697914124, "eval_runtime": 56.7096, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 1610 }, { "epoch": 0.14863337561988238, "grad_norm": 2.5894034595953426, "learning_rate": 1.2090612060856205e-06, "loss": 0.918, "step": 1611 }, { "epoch": 0.1487256371814093, "grad_norm": 1.8055335993350563, "learning_rate": 1.2089942054327193e-06, "loss": 0.9302, "step": 1612 }, { "epoch": 0.14881789874293622, "grad_norm": 1.431276838781587, "learning_rate": 1.208927151857344e-06, "loss": 0.6177, "step": 1613 }, { "epoch": 0.14891016030446316, "grad_norm": 1.8548376484175946, "learning_rate": 1.2088600453655712e-06, "loss": 0.7329, "step": 1614 }, { "epoch": 0.14900242186599008, "grad_norm": 1.2618433104244229, "learning_rate": 1.2087928859634819e-06, "loss": 0.8308, "step": 1615 }, { "epoch": 0.14900242186599008, "eval_GEN Loss": 0.48376229405403137, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM Loss": 0.412661612033844, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9467548131942749, "eval_runtime": 56.9104, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1615 }, { "epoch": 0.149094683427517, "grad_norm": 1.4320796997565808, "learning_rate": 1.2087256736571625e-06, "loss": 0.6618, "step": 1616 }, { "epoch": 0.14918694498904395, "grad_norm": 2.8879524205470233, "learning_rate": 1.2086584084527036e-06, "loss": 0.9691, "step": 1617 }, { "epoch": 0.14927920655057086, "grad_norm": 2.0813575595306837, "learning_rate": 1.208591090356201e-06, "loss": 0.7889, "step": 1618 }, { "epoch": 0.1493714681120978, "grad_norm": 1.7154256082863044, "learning_rate": 1.2085237193737555e-06, "loss": 0.821, "step": 1619 }, { "epoch": 0.14946372967362473, "grad_norm": 1.8068920307391616, "learning_rate": 1.208456295511472e-06, "loss": 0.9439, "step": 1620 }, { "epoch": 0.14946372967362473, "eval_GEN Loss": 0.48404887318611145, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4239797294139862, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9418269395828247, "eval_runtime": 56.9264, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1620 }, { "epoch": 0.14955599123515165, "grad_norm": 2.1943708935820743, "learning_rate": 1.2083888187754606e-06, "loss": 0.6457, "step": 1621 }, { "epoch": 0.1496482527966786, "grad_norm": 2.466683965417046, "learning_rate": 1.208321289171836e-06, "loss": 0.9365, "step": 1622 }, { "epoch": 0.1497405143582055, "grad_norm": 1.9127624121626094, "learning_rate": 1.2082537067067183e-06, "loss": 0.8982, "step": 1623 }, { "epoch": 0.14983277591973243, "grad_norm": 2.025036769928188, "learning_rate": 1.2081860713862315e-06, "loss": 0.9021, "step": 1624 }, { "epoch": 0.14992503748125938, "grad_norm": 1.7945257966905834, "learning_rate": 1.2081183832165048e-06, "loss": 0.705, "step": 1625 }, { "epoch": 0.14992503748125938, "eval_GEN Loss": 0.4825240969657898, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.4197624921798706, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9364182949066162, "eval_runtime": 56.7028, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 1625 }, { "epoch": 0.1500172990427863, "grad_norm": 1.631956597393466, "learning_rate": 1.2080506422036725e-06, "loss": 0.8216, "step": 1626 }, { "epoch": 0.15010956060431324, "grad_norm": 1.4820572458087988, "learning_rate": 1.2079828483538734e-06, "loss": 0.7541, "step": 1627 }, { "epoch": 0.15020182216584016, "grad_norm": 1.7679517466246568, "learning_rate": 1.2079150016732508e-06, "loss": 0.7515, "step": 1628 }, { "epoch": 0.15029408372736708, "grad_norm": 1.7491647994721775, "learning_rate": 1.2078471021679532e-06, "loss": 0.9263, "step": 1629 }, { "epoch": 0.15038634528889402, "grad_norm": 1.6872250249087157, "learning_rate": 1.2077791498441337e-06, "loss": 0.7216, "step": 1630 }, { "epoch": 0.15038634528889402, "eval_GEN Loss": 0.4820396602153778, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.41102948784828186, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9518629908561707, "eval_runtime": 56.7591, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1630 }, { "epoch": 0.15047860685042094, "grad_norm": 1.513845787668661, "learning_rate": 1.2077111447079506e-06, "loss": 0.7099, "step": 1631 }, { "epoch": 0.15057086841194786, "grad_norm": 1.4587680435549852, "learning_rate": 1.207643086765566e-06, "loss": 0.8275, "step": 1632 }, { "epoch": 0.1506631299734748, "grad_norm": 1.7551382662965955, "learning_rate": 1.2075749760231483e-06, "loss": 0.7261, "step": 1633 }, { "epoch": 0.15075539153500173, "grad_norm": 2.864420119803085, "learning_rate": 1.207506812486869e-06, "loss": 0.9541, "step": 1634 }, { "epoch": 0.15084765309652867, "grad_norm": 1.5404400297296554, "learning_rate": 1.2074385961629053e-06, "loss": 0.7804, "step": 1635 }, { "epoch": 0.15084765309652867, "eval_GEN Loss": 0.48046940565109253, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM Loss": 0.40919992327690125, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9668869972229004, "eval_runtime": 56.8026, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1635 }, { "epoch": 0.1509399146580556, "grad_norm": 1.2536688091569381, "learning_rate": 1.2073703270574398e-06, "loss": 0.7099, "step": 1636 }, { "epoch": 0.1510321762195825, "grad_norm": 1.421850236026778, "learning_rate": 1.2073020051766579e-06, "loss": 0.7492, "step": 1637 }, { "epoch": 0.15112443778110946, "grad_norm": 3.2116489289162726, "learning_rate": 1.207233630526752e-06, "loss": 0.9474, "step": 1638 }, { "epoch": 0.15121669934263637, "grad_norm": 1.8012319667097618, "learning_rate": 1.2071652031139182e-06, "loss": 0.6945, "step": 1639 }, { "epoch": 0.1513089609041633, "grad_norm": 1.6378723565772295, "learning_rate": 1.2070967229443573e-06, "loss": 0.8106, "step": 1640 }, { "epoch": 0.1513089609041633, "eval_GEN Loss": 0.479536235332489, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.392453134059906, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9292067289352417, "eval_runtime": 56.8961, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1640 }, { "epoch": 0.15140122246569024, "grad_norm": 1.56630901885544, "learning_rate": 1.2070281900242751e-06, "loss": 0.7959, "step": 1641 }, { "epoch": 0.15149348402721716, "grad_norm": 1.430543264390956, "learning_rate": 1.2069596043598821e-06, "loss": 0.6623, "step": 1642 }, { "epoch": 0.1515857455887441, "grad_norm": 1.9462579376769658, "learning_rate": 1.206890965957394e-06, "loss": 0.8359, "step": 1643 }, { "epoch": 0.15167800715027102, "grad_norm": 1.9999967322955061, "learning_rate": 1.2068222748230305e-06, "loss": 0.7238, "step": 1644 }, { "epoch": 0.15177026871179794, "grad_norm": 1.3361769691062042, "learning_rate": 1.2067535309630166e-06, "loss": 0.6875, "step": 1645 }, { "epoch": 0.15177026871179794, "eval_GEN Loss": 0.47986242175102234, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36502107977867126, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9144230484962463, "eval_runtime": 56.7669, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1645 }, { "epoch": 0.15186253027332489, "grad_norm": 2.5340417095182044, "learning_rate": 1.206684734383582e-06, "loss": 0.9313, "step": 1646 }, { "epoch": 0.1519547918348518, "grad_norm": 2.947386800871364, "learning_rate": 1.2066158850909613e-06, "loss": 1.0766, "step": 1647 }, { "epoch": 0.15204705339637872, "grad_norm": 1.5150065894360136, "learning_rate": 1.2065469830913935e-06, "loss": 0.867, "step": 1648 }, { "epoch": 0.15213931495790567, "grad_norm": 1.5827785765301632, "learning_rate": 1.206478028391123e-06, "loss": 0.5487, "step": 1649 }, { "epoch": 0.1522315765194326, "grad_norm": 1.9882035168587877, "learning_rate": 1.206409020996398e-06, "loss": 0.784, "step": 1650 }, { "epoch": 0.1522315765194326, "eval_GEN Loss": 0.4792032539844513, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9058823529411765, "eval_PRM F1 AUC": 0.746464117338921, "eval_PRM F1 Neg": 0.6190476190476191, "eval_PRM Loss": 0.3730213940143585, "eval_PRM NPV": 0.6842105263157895, "eval_PRM Precision": 0.8850574712643678, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9349759817123413, "eval_runtime": 57.0221, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1650 }, { "epoch": 0.15232383808095953, "grad_norm": 2.136656197409622, "learning_rate": 1.2063399609134724e-06, "loss": 0.9674, "step": 1651 }, { "epoch": 0.15241609964248645, "grad_norm": 1.5599202081446026, "learning_rate": 1.2062708481486046e-06, "loss": 0.7025, "step": 1652 }, { "epoch": 0.15250836120401337, "grad_norm": 2.03873936217497, "learning_rate": 1.2062016827080574e-06, "loss": 1.0646, "step": 1653 }, { "epoch": 0.15260062276554032, "grad_norm": 2.245857856496522, "learning_rate": 1.2061324645980993e-06, "loss": 0.7655, "step": 1654 }, { "epoch": 0.15269288432706724, "grad_norm": 2.3068424191925017, "learning_rate": 1.2060631938250022e-06, "loss": 0.8513, "step": 1655 }, { "epoch": 0.15269288432706724, "eval_GEN Loss": 0.480029433965683, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM Loss": 0.38942280411720276, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9539663195610046, "eval_runtime": 56.8457, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1655 }, { "epoch": 0.15278514588859415, "grad_norm": 1.5602624685968338, "learning_rate": 1.205993870395044e-06, "loss": 0.6726, "step": 1656 }, { "epoch": 0.1528774074501211, "grad_norm": 1.963139289755594, "learning_rate": 1.2059244943145066e-06, "loss": 0.8696, "step": 1657 }, { "epoch": 0.15296966901164802, "grad_norm": 1.6254674761629366, "learning_rate": 1.2058550655896774e-06, "loss": 0.7386, "step": 1658 }, { "epoch": 0.15306193057317496, "grad_norm": 1.87372899223456, "learning_rate": 1.2057855842268477e-06, "loss": 0.8901, "step": 1659 }, { "epoch": 0.15315419213470188, "grad_norm": 1.6275426038225607, "learning_rate": 1.2057160502323142e-06, "loss": 0.8991, "step": 1660 }, { "epoch": 0.15315419213470188, "eval_GEN Loss": 0.48058921098709106, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM Loss": 0.39074864983558655, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9556490182876587, "eval_runtime": 56.6544, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 1660 }, { "epoch": 0.1532464536962288, "grad_norm": 2.462114718297041, "learning_rate": 1.2056464636123782e-06, "loss": 0.9514, "step": 1661 }, { "epoch": 0.15333871525775575, "grad_norm": 2.388658099297588, "learning_rate": 1.2055768243733458e-06, "loss": 0.933, "step": 1662 }, { "epoch": 0.15343097681928267, "grad_norm": 2.6046711615357627, "learning_rate": 1.2055071325215275e-06, "loss": 0.8297, "step": 1663 }, { "epoch": 0.15352323838080958, "grad_norm": 1.5160597348850142, "learning_rate": 1.2054373880632395e-06, "loss": 0.8085, "step": 1664 }, { "epoch": 0.15361549994233653, "grad_norm": 1.511132567278672, "learning_rate": 1.2053675910048014e-06, "loss": 0.5161, "step": 1665 }, { "epoch": 0.15361549994233653, "eval_GEN Loss": 0.4798246920108795, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM Loss": 0.4006507694721222, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9478966593742371, "eval_runtime": 56.9298, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1665 }, { "epoch": 0.15370776150386345, "grad_norm": 1.7971993479517718, "learning_rate": 1.2052977413525388e-06, "loss": 0.7776, "step": 1666 }, { "epoch": 0.1538000230653904, "grad_norm": 1.3934391838398303, "learning_rate": 1.2052278391127816e-06, "loss": 0.6859, "step": 1667 }, { "epoch": 0.15389228462691731, "grad_norm": 2.6120998571193597, "learning_rate": 1.2051578842918643e-06, "loss": 0.617, "step": 1668 }, { "epoch": 0.15398454618844423, "grad_norm": 2.384936624570837, "learning_rate": 1.205087876896126e-06, "loss": 0.7993, "step": 1669 }, { "epoch": 0.15407680774997118, "grad_norm": 1.794813745419985, "learning_rate": 1.2050178169319117e-06, "loss": 0.7012, "step": 1670 }, { "epoch": 0.15407680774997118, "eval_GEN Loss": 0.47999176383018494, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.41702377796173096, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9520432949066162, "eval_runtime": 56.8304, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1670 }, { "epoch": 0.1541690693114981, "grad_norm": 1.8947530793166678, "learning_rate": 1.2049477044055697e-06, "loss": 0.728, "step": 1671 }, { "epoch": 0.15426133087302502, "grad_norm": 1.6667324756944912, "learning_rate": 1.2048775393234538e-06, "loss": 0.6683, "step": 1672 }, { "epoch": 0.15435359243455196, "grad_norm": 1.8403445494935375, "learning_rate": 1.2048073216919227e-06, "loss": 0.6996, "step": 1673 }, { "epoch": 0.15444585399607888, "grad_norm": 1.996166589754953, "learning_rate": 1.2047370515173393e-06, "loss": 0.7859, "step": 1674 }, { "epoch": 0.15453811555760583, "grad_norm": 2.0348565896472466, "learning_rate": 1.2046667288060718e-06, "loss": 0.796, "step": 1675 }, { "epoch": 0.15453811555760583, "eval_GEN Loss": 0.48171553015708923, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM Loss": 0.4134211540222168, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9649639129638672, "eval_runtime": 56.8471, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1675 }, { "epoch": 0.15463037711913274, "grad_norm": 1.9811196370473396, "learning_rate": 1.2045963535644931e-06, "loss": 0.7303, "step": 1676 }, { "epoch": 0.15472263868065966, "grad_norm": 2.0680009877363728, "learning_rate": 1.2045259257989803e-06, "loss": 0.9992, "step": 1677 }, { "epoch": 0.1548149002421866, "grad_norm": 2.3231930006003707, "learning_rate": 1.204455445515916e-06, "loss": 0.8537, "step": 1678 }, { "epoch": 0.15490716180371353, "grad_norm": 1.50076283457596, "learning_rate": 1.2043849127216873e-06, "loss": 0.7387, "step": 1679 }, { "epoch": 0.15499942336524045, "grad_norm": 3.237347355630976, "learning_rate": 1.2043143274226856e-06, "loss": 0.9481, "step": 1680 }, { "epoch": 0.15499942336524045, "eval_GEN Loss": 0.4792095720767975, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM Loss": 0.400808721780777, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9655048251152039, "eval_runtime": 56.653, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 1680 }, { "epoch": 0.1550916849267674, "grad_norm": 1.7110570452735685, "learning_rate": 1.204243689625308e-06, "loss": 0.7252, "step": 1681 }, { "epoch": 0.1551839464882943, "grad_norm": 1.5904298016958394, "learning_rate": 1.2041729993359551e-06, "loss": 0.8541, "step": 1682 }, { "epoch": 0.15527620804982123, "grad_norm": 1.6387993124820592, "learning_rate": 1.2041022565610337e-06, "loss": 0.7684, "step": 1683 }, { "epoch": 0.15536846961134818, "grad_norm": 1.8078395242211844, "learning_rate": 1.2040314613069543e-06, "loss": 0.6376, "step": 1684 }, { "epoch": 0.1554607311728751, "grad_norm": 1.9072669000614397, "learning_rate": 1.2039606135801322e-06, "loss": 0.8818, "step": 1685 }, { "epoch": 0.1554607311728751, "eval_GEN Loss": 0.476083368062973, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM Loss": 0.39639008045196533, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9598557949066162, "eval_runtime": 56.9089, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1685 }, { "epoch": 0.15555299273440204, "grad_norm": 3.375773958150725, "learning_rate": 1.203889713386988e-06, "loss": 0.7987, "step": 1686 }, { "epoch": 0.15564525429592896, "grad_norm": 2.099490335827624, "learning_rate": 1.2038187607339472e-06, "loss": 0.888, "step": 1687 }, { "epoch": 0.15573751585745588, "grad_norm": 1.5885592506757007, "learning_rate": 1.203747755627439e-06, "loss": 0.8049, "step": 1688 }, { "epoch": 0.15582977741898282, "grad_norm": 3.767814518316457, "learning_rate": 1.203676698073898e-06, "loss": 0.7145, "step": 1689 }, { "epoch": 0.15592203898050974, "grad_norm": 1.3371675311778843, "learning_rate": 1.203605588079764e-06, "loss": 0.7191, "step": 1690 }, { "epoch": 0.15592203898050974, "eval_GEN Loss": 0.4749113619327545, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM Loss": 0.3965228796005249, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9549278616905212, "eval_runtime": 56.8121, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1690 }, { "epoch": 0.15601430054203666, "grad_norm": 2.000046315884686, "learning_rate": 1.2035344256514808e-06, "loss": 0.7516, "step": 1691 }, { "epoch": 0.1561065621035636, "grad_norm": 1.6137698284927622, "learning_rate": 1.2034632107954975e-06, "loss": 0.6281, "step": 1692 }, { "epoch": 0.15619882366509052, "grad_norm": 2.3084275818615816, "learning_rate": 1.2033919435182674e-06, "loss": 0.9654, "step": 1693 }, { "epoch": 0.15629108522661747, "grad_norm": 2.2810687982767837, "learning_rate": 1.2033206238262488e-06, "loss": 0.8687, "step": 1694 }, { "epoch": 0.1563833467881444, "grad_norm": 1.8474844628890328, "learning_rate": 1.2032492517259051e-06, "loss": 0.7925, "step": 1695 }, { "epoch": 0.1563833467881444, "eval_GEN Loss": 0.47422850131988525, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM Loss": 0.40184977650642395, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9668269157409668, "eval_runtime": 56.8617, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1695 }, { "epoch": 0.1564756083496713, "grad_norm": 3.3225835899501224, "learning_rate": 1.203177827223704e-06, "loss": 0.9558, "step": 1696 }, { "epoch": 0.15656786991119825, "grad_norm": 3.003528462283362, "learning_rate": 1.2031063503261182e-06, "loss": 1.0253, "step": 1697 }, { "epoch": 0.15666013147272517, "grad_norm": 1.869436446365027, "learning_rate": 1.203034821039625e-06, "loss": 0.8881, "step": 1698 }, { "epoch": 0.1567523930342521, "grad_norm": 2.4244399451612337, "learning_rate": 1.2029632393707064e-06, "loss": 0.9702, "step": 1699 }, { "epoch": 0.15684465459577904, "grad_norm": 1.4551539004376537, "learning_rate": 1.2028916053258494e-06, "loss": 0.6471, "step": 1700 }, { "epoch": 0.15684465459577904, "eval_GEN Loss": 0.4727160930633545, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.4090442657470703, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9594951868057251, "eval_runtime": 57.034, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1700 }, { "epoch": 0.15693691615730596, "grad_norm": 1.633623089933077, "learning_rate": 1.2028199189115455e-06, "loss": 0.8667, "step": 1701 }, { "epoch": 0.1570291777188329, "grad_norm": 2.680415118185708, "learning_rate": 1.2027481801342912e-06, "loss": 0.8986, "step": 1702 }, { "epoch": 0.15712143928035982, "grad_norm": 1.6584278448257652, "learning_rate": 1.2026763890005871e-06, "loss": 0.8192, "step": 1703 }, { "epoch": 0.15721370084188674, "grad_norm": 1.8433897939640338, "learning_rate": 1.2026045455169396e-06, "loss": 0.9292, "step": 1704 }, { "epoch": 0.15730596240341368, "grad_norm": 1.712124135850333, "learning_rate": 1.2025326496898587e-06, "loss": 0.814, "step": 1705 }, { "epoch": 0.15730596240341368, "eval_GEN Loss": 0.47189226746559143, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.413433700799942, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9611778855323792, "eval_runtime": 56.8385, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1705 }, { "epoch": 0.1573982239649406, "grad_norm": 1.5400809782769067, "learning_rate": 1.2024607015258605e-06, "loss": 0.7189, "step": 1706 }, { "epoch": 0.15749048552646752, "grad_norm": 2.0792363943929373, "learning_rate": 1.2023887010314642e-06, "loss": 0.7638, "step": 1707 }, { "epoch": 0.15758274708799447, "grad_norm": 1.8314031543374316, "learning_rate": 1.2023166482131952e-06, "loss": 0.7807, "step": 1708 }, { "epoch": 0.1576750086495214, "grad_norm": 1.1599471168352014, "learning_rate": 1.2022445430775827e-06, "loss": 0.5619, "step": 1709 }, { "epoch": 0.15776727021104833, "grad_norm": 1.919625624387616, "learning_rate": 1.2021723856311613e-06, "loss": 0.7799, "step": 1710 }, { "epoch": 0.15776727021104833, "eval_GEN Loss": 0.4721803367137909, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM Loss": 0.4043463468551636, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9524038434028625, "eval_runtime": 56.8285, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1710 }, { "epoch": 0.15785953177257525, "grad_norm": 1.7158155907304815, "learning_rate": 1.2021001758804696e-06, "loss": 0.7479, "step": 1711 }, { "epoch": 0.15795179333410217, "grad_norm": 1.7809784027850344, "learning_rate": 1.2020279138320517e-06, "loss": 0.7212, "step": 1712 }, { "epoch": 0.15804405489562912, "grad_norm": 1.2951346321259123, "learning_rate": 1.201955599492456e-06, "loss": 0.5891, "step": 1713 }, { "epoch": 0.15813631645715603, "grad_norm": 1.094419927256266, "learning_rate": 1.2018832328682357e-06, "loss": 0.5057, "step": 1714 }, { "epoch": 0.15822857801868295, "grad_norm": 1.18666422405567, "learning_rate": 1.2018108139659488e-06, "loss": 0.6807, "step": 1715 }, { "epoch": 0.15822857801868295, "eval_GEN Loss": 0.4728214144706726, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.3869480490684509, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9214543104171753, "eval_runtime": 56.0349, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1715 }, { "epoch": 0.1583208395802099, "grad_norm": 1.3590830697605831, "learning_rate": 1.2017383427921582e-06, "loss": 0.6337, "step": 1716 }, { "epoch": 0.15841310114173682, "grad_norm": 1.8654387537840311, "learning_rate": 1.201665819353431e-06, "loss": 0.7712, "step": 1717 }, { "epoch": 0.15850536270326376, "grad_norm": 1.3261619385314058, "learning_rate": 1.2015932436563396e-06, "loss": 0.6758, "step": 1718 }, { "epoch": 0.15859762426479068, "grad_norm": 1.360766445942538, "learning_rate": 1.2015206157074607e-06, "loss": 0.6135, "step": 1719 }, { "epoch": 0.1586898858263176, "grad_norm": 3.092527225707507, "learning_rate": 1.2014479355133765e-06, "loss": 0.8822, "step": 1720 }, { "epoch": 0.1586898858263176, "eval_GEN Loss": 0.4744291305541992, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3729347288608551, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8841947317123413, "eval_runtime": 56.9052, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1720 }, { "epoch": 0.15878214738784455, "grad_norm": 1.7859672639020925, "learning_rate": 1.2013752030806729e-06, "loss": 0.6137, "step": 1721 }, { "epoch": 0.15887440894937147, "grad_norm": 1.8132191474772663, "learning_rate": 1.2013024184159412e-06, "loss": 0.8266, "step": 1722 }, { "epoch": 0.15896667051089838, "grad_norm": 1.6281369509399972, "learning_rate": 1.2012295815257772e-06, "loss": 0.7941, "step": 1723 }, { "epoch": 0.15905893207242533, "grad_norm": 2.240640289607103, "learning_rate": 1.2011566924167814e-06, "loss": 0.8291, "step": 1724 }, { "epoch": 0.15915119363395225, "grad_norm": 2.2741129229217854, "learning_rate": 1.2010837510955594e-06, "loss": 0.7531, "step": 1725 }, { "epoch": 0.15915119363395225, "eval_GEN Loss": 0.4747401177883148, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3753626346588135, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8645432591438293, "eval_runtime": 56.7347, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 1725 }, { "epoch": 0.1592434551954792, "grad_norm": 1.8661920082388164, "learning_rate": 1.201010757568721e-06, "loss": 0.6207, "step": 1726 }, { "epoch": 0.1593357167570061, "grad_norm": 1.9780752738830902, "learning_rate": 1.2009377118428811e-06, "loss": 0.8295, "step": 1727 }, { "epoch": 0.15942797831853303, "grad_norm": 2.706376669079482, "learning_rate": 1.2008646139246594e-06, "loss": 0.7115, "step": 1728 }, { "epoch": 0.15952023988005998, "grad_norm": 1.9100448997257597, "learning_rate": 1.2007914638206797e-06, "loss": 0.7295, "step": 1729 }, { "epoch": 0.1596125014415869, "grad_norm": 2.0075331662337668, "learning_rate": 1.2007182615375714e-06, "loss": 0.8302, "step": 1730 }, { "epoch": 0.1596125014415869, "eval_GEN Loss": 0.4771677553653717, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM Loss": 0.36156365275382996, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.8718149065971375, "eval_runtime": 57.0068, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 1730 }, { "epoch": 0.15970476300311381, "grad_norm": 2.2282521166062117, "learning_rate": 1.2006450070819681e-06, "loss": 0.7787, "step": 1731 }, { "epoch": 0.15979702456464076, "grad_norm": 2.727345528912454, "learning_rate": 1.2005717004605081e-06, "loss": 0.8815, "step": 1732 }, { "epoch": 0.15988928612616768, "grad_norm": 5.409008356411552, "learning_rate": 1.2004983416798346e-06, "loss": 1.3479, "step": 1733 }, { "epoch": 0.15998154768769463, "grad_norm": 1.6377853480910112, "learning_rate": 1.2004249307465956e-06, "loss": 0.7857, "step": 1734 }, { "epoch": 0.16007380924922154, "grad_norm": 1.961215619307502, "learning_rate": 1.2003514676674435e-06, "loss": 0.9155, "step": 1735 }, { "epoch": 0.16007380924922154, "eval_GEN Loss": 0.4761819541454315, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM Loss": 0.3655785322189331, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.871874988079071, "eval_runtime": 56.9603, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1735 }, { "epoch": 0.16016607081074846, "grad_norm": 2.0968914042084403, "learning_rate": 1.200277952449036e-06, "loss": 0.8153, "step": 1736 }, { "epoch": 0.1602583323722754, "grad_norm": 2.408793464839001, "learning_rate": 1.2002043850980346e-06, "loss": 0.7876, "step": 1737 }, { "epoch": 0.16035059393380233, "grad_norm": 2.041860953980221, "learning_rate": 1.2001307656211069e-06, "loss": 0.6351, "step": 1738 }, { "epoch": 0.16044285549532925, "grad_norm": 1.9127806526581694, "learning_rate": 1.2000570940249237e-06, "loss": 0.7659, "step": 1739 }, { "epoch": 0.1605351170568562, "grad_norm": 3.3468723163460665, "learning_rate": 1.1999833703161614e-06, "loss": 0.9352, "step": 1740 }, { "epoch": 0.1605351170568562, "eval_GEN Loss": 0.4743192195892334, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM Loss": 0.3662451207637787, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.8649038672447205, "eval_runtime": 57.2074, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 1740 }, { "epoch": 0.1606273786183831, "grad_norm": 3.228071781396564, "learning_rate": 1.1999095945015013e-06, "loss": 0.9619, "step": 1741 }, { "epoch": 0.16071964017991006, "grad_norm": 1.9599230495336764, "learning_rate": 1.1998357665876288e-06, "loss": 0.7585, "step": 1742 }, { "epoch": 0.16081190174143697, "grad_norm": 1.9625157070892876, "learning_rate": 1.199761886581234e-06, "loss": 0.9341, "step": 1743 }, { "epoch": 0.1609041633029639, "grad_norm": 2.6344561913816547, "learning_rate": 1.1996879544890125e-06, "loss": 0.7793, "step": 1744 }, { "epoch": 0.16099642486449084, "grad_norm": 2.375414692367507, "learning_rate": 1.199613970317664e-06, "loss": 0.7729, "step": 1745 }, { "epoch": 0.16099642486449084, "eval_GEN Loss": 0.47493529319763184, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9056603773584906, "eval_PRM F1 AUC": 0.8467784180199058, "eval_PRM F1 Neg": 0.7169811320754716, "eval_PRM Loss": 0.38084328174591064, "eval_PRM NPV": 0.6333333333333333, "eval_PRM Precision": 0.9473684210526315, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 0.846875011920929, "eval_runtime": 56.7965, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 1745 }, { "epoch": 0.16108868642601776, "grad_norm": 2.346254146722747, "learning_rate": 1.1995399340738932e-06, "loss": 0.8282, "step": 1746 }, { "epoch": 0.16118094798754468, "grad_norm": 1.682342164816387, "learning_rate": 1.1994658457644091e-06, "loss": 0.8964, "step": 1747 }, { "epoch": 0.16127320954907162, "grad_norm": 1.9917021102123866, "learning_rate": 1.1993917053959258e-06, "loss": 0.7675, "step": 1748 }, { "epoch": 0.16136547111059854, "grad_norm": 1.5307292646365027, "learning_rate": 1.1993175129751622e-06, "loss": 0.6664, "step": 1749 }, { "epoch": 0.1614577326721255, "grad_norm": 2.145969974023176, "learning_rate": 1.1992432685088414e-06, "loss": 0.8581, "step": 1750 }, { "epoch": 0.1614577326721255, "eval_GEN Loss": 0.4752160906791687, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.8987341772151899, "eval_PRM F1 AUC": 0.8407543216343635, "eval_PRM F1 Neg": 0.7037037037037037, "eval_PRM Loss": 0.3944178521633148, "eval_PRM NPV": 0.6129032258064516, "eval_PRM Precision": 0.9466666666666667, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 0.8573317527770996, "eval_runtime": 56.9403, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1750 }, { "epoch": 0.1615499942336524, "grad_norm": 1.857511557807682, "learning_rate": 1.199168972003692e-06, "loss": 0.7344, "step": 1751 }, { "epoch": 0.16164225579517932, "grad_norm": 3.3110136809654356, "learning_rate": 1.1990946234664464e-06, "loss": 0.8864, "step": 1752 }, { "epoch": 0.16173451735670627, "grad_norm": 1.851308184913895, "learning_rate": 1.1990202229038426e-06, "loss": 0.821, "step": 1753 }, { "epoch": 0.1618267789182332, "grad_norm": 1.7270899120519583, "learning_rate": 1.1989457703226222e-06, "loss": 0.8285, "step": 1754 }, { "epoch": 0.1619190404797601, "grad_norm": 1.8888581494402377, "learning_rate": 1.198871265729533e-06, "loss": 0.8772, "step": 1755 }, { "epoch": 0.1619190404797601, "eval_GEN Loss": 0.47463130950927734, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3658333420753479, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8574519157409668, "eval_runtime": 56.0056, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1755 }, { "epoch": 0.16201130204128705, "grad_norm": 1.6795665178601533, "learning_rate": 1.1987967091313266e-06, "loss": 0.85, "step": 1756 }, { "epoch": 0.16210356360281397, "grad_norm": 1.901449510428993, "learning_rate": 1.198722100534759e-06, "loss": 0.8562, "step": 1757 }, { "epoch": 0.16219582516434092, "grad_norm": 3.4299953114132395, "learning_rate": 1.1986474399465916e-06, "loss": 1.1412, "step": 1758 }, { "epoch": 0.16228808672586784, "grad_norm": 2.148886315304666, "learning_rate": 1.1985727273735904e-06, "loss": 0.9179, "step": 1759 }, { "epoch": 0.16238034828739475, "grad_norm": 1.6700772269498403, "learning_rate": 1.1984979628225258e-06, "loss": 0.8421, "step": 1760 }, { "epoch": 0.16238034828739475, "eval_GEN Loss": 0.4730831980705261, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3528091013431549, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8771033883094788, "eval_runtime": 56.0585, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1760 }, { "epoch": 0.1624726098489217, "grad_norm": 1.5933767095295974, "learning_rate": 1.198423146300173e-06, "loss": 0.7713, "step": 1761 }, { "epoch": 0.16256487141044862, "grad_norm": 2.0012070258657455, "learning_rate": 1.198348277813312e-06, "loss": 0.9833, "step": 1762 }, { "epoch": 0.16265713297197554, "grad_norm": 1.7347135422048094, "learning_rate": 1.1982733573687279e-06, "loss": 0.7167, "step": 1763 }, { "epoch": 0.16274939453350248, "grad_norm": 1.9715518457252303, "learning_rate": 1.1981983849732096e-06, "loss": 0.7582, "step": 1764 }, { "epoch": 0.1628416560950294, "grad_norm": 2.396025379859153, "learning_rate": 1.1981233606335515e-06, "loss": 0.9252, "step": 1765 }, { "epoch": 0.1628416560950294, "eval_GEN Loss": 0.47371742129325867, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3666206896305084, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8832331895828247, "eval_runtime": 55.9256, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1765 }, { "epoch": 0.16293391765655635, "grad_norm": 1.67230443249086, "learning_rate": 1.1980482843565524e-06, "loss": 0.4898, "step": 1766 }, { "epoch": 0.16302617921808327, "grad_norm": 2.6798053789935015, "learning_rate": 1.1979731561490158e-06, "loss": 0.7325, "step": 1767 }, { "epoch": 0.16311844077961019, "grad_norm": 1.2788674533092632, "learning_rate": 1.1978979760177499e-06, "loss": 0.6708, "step": 1768 }, { "epoch": 0.16321070234113713, "grad_norm": 3.2214528116004915, "learning_rate": 1.1978227439695675e-06, "loss": 0.7314, "step": 1769 }, { "epoch": 0.16330296390266405, "grad_norm": 1.4528340184239323, "learning_rate": 1.1977474600112865e-06, "loss": 0.6578, "step": 1770 }, { "epoch": 0.16330296390266405, "eval_GEN Loss": 0.4762537181377411, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3963039815425873, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8923677802085876, "eval_runtime": 55.9566, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1770 }, { "epoch": 0.16339522546419097, "grad_norm": 2.2097031063476797, "learning_rate": 1.197672124149729e-06, "loss": 0.8733, "step": 1771 }, { "epoch": 0.16348748702571791, "grad_norm": 1.8180984617525522, "learning_rate": 1.1975967363917225e-06, "loss": 0.8292, "step": 1772 }, { "epoch": 0.16357974858724483, "grad_norm": 1.3777427473261157, "learning_rate": 1.1975212967440983e-06, "loss": 0.8133, "step": 1773 }, { "epoch": 0.16367201014877178, "grad_norm": 2.904575933076612, "learning_rate": 1.197445805213693e-06, "loss": 0.8565, "step": 1774 }, { "epoch": 0.1637642717102987, "grad_norm": 2.2467603792144306, "learning_rate": 1.197370261807348e-06, "loss": 0.7633, "step": 1775 }, { "epoch": 0.1637642717102987, "eval_GEN Loss": 0.47734469175338745, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.44640040397644043, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9230168461799622, "eval_runtime": 55.9677, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1775 }, { "epoch": 0.16385653327182562, "grad_norm": 2.054697081292661, "learning_rate": 1.1972946665319088e-06, "loss": 0.867, "step": 1776 }, { "epoch": 0.16394879483335256, "grad_norm": 2.8727010273222864, "learning_rate": 1.1972190193942259e-06, "loss": 0.8253, "step": 1777 }, { "epoch": 0.16404105639487948, "grad_norm": 2.716670343247038, "learning_rate": 1.1971433204011552e-06, "loss": 1.0008, "step": 1778 }, { "epoch": 0.1641333179564064, "grad_norm": 3.8480085615947606, "learning_rate": 1.197067569559556e-06, "loss": 1.0191, "step": 1779 }, { "epoch": 0.16422557951793335, "grad_norm": 1.5197868351541262, "learning_rate": 1.1969917668762932e-06, "loss": 0.816, "step": 1780 }, { "epoch": 0.16422557951793335, "eval_GEN Loss": 0.47710874676704407, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.4292348325252533, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.922776460647583, "eval_runtime": 55.9198, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1780 }, { "epoch": 0.16431784107946026, "grad_norm": 2.996241200808312, "learning_rate": 1.1969159123582361e-06, "loss": 0.7155, "step": 1781 }, { "epoch": 0.1644101026409872, "grad_norm": 1.4503014184697487, "learning_rate": 1.1968400060122589e-06, "loss": 0.6684, "step": 1782 }, { "epoch": 0.16450236420251413, "grad_norm": 2.321984586660832, "learning_rate": 1.1967640478452402e-06, "loss": 0.777, "step": 1783 }, { "epoch": 0.16459462576404105, "grad_norm": 1.6149520618062305, "learning_rate": 1.1966880378640636e-06, "loss": 0.7009, "step": 1784 }, { "epoch": 0.164686887325568, "grad_norm": 1.4362764575132554, "learning_rate": 1.1966119760756173e-06, "loss": 0.7981, "step": 1785 }, { "epoch": 0.164686887325568, "eval_GEN Loss": 0.47585561871528625, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.40282073616981506, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9460336565971375, "eval_runtime": 55.8059, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 1785 }, { "epoch": 0.1647791488870949, "grad_norm": 1.68124564818914, "learning_rate": 1.1965358624867936e-06, "loss": 0.8926, "step": 1786 }, { "epoch": 0.16487141044862183, "grad_norm": 1.8189750538289764, "learning_rate": 1.196459697104491e-06, "loss": 0.7107, "step": 1787 }, { "epoch": 0.16496367201014878, "grad_norm": 3.8822325320822824, "learning_rate": 1.1963834799356106e-06, "loss": 0.9042, "step": 1788 }, { "epoch": 0.1650559335716757, "grad_norm": 2.377530408699936, "learning_rate": 1.19630721098706e-06, "loss": 0.7527, "step": 1789 }, { "epoch": 0.16514819513320264, "grad_norm": 1.4515146490342556, "learning_rate": 1.1962308902657508e-06, "loss": 0.7672, "step": 1790 }, { "epoch": 0.16514819513320264, "eval_GEN Loss": 0.47496604919433594, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM Loss": 0.40148061513900757, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9661658406257629, "eval_runtime": 55.8316, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1790 }, { "epoch": 0.16524045669472956, "grad_norm": 1.8367418287024868, "learning_rate": 1.1961545177785994e-06, "loss": 0.9241, "step": 1791 }, { "epoch": 0.16533271825625648, "grad_norm": 1.7373451874372527, "learning_rate": 1.1960780935325263e-06, "loss": 0.7596, "step": 1792 }, { "epoch": 0.16542497981778342, "grad_norm": 2.199842245342328, "learning_rate": 1.1960016175344574e-06, "loss": 1.0013, "step": 1793 }, { "epoch": 0.16551724137931034, "grad_norm": 1.3624274925812592, "learning_rate": 1.1959250897913235e-06, "loss": 0.6842, "step": 1794 }, { "epoch": 0.16560950294083726, "grad_norm": 2.105499786133481, "learning_rate": 1.195848510310059e-06, "loss": 0.887, "step": 1795 }, { "epoch": 0.16560950294083726, "eval_GEN Loss": 0.4728744924068451, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.4052446782588959, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9497596025466919, "eval_runtime": 56.9528, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1795 }, { "epoch": 0.1657017645023642, "grad_norm": 2.4826299160827947, "learning_rate": 1.195771879097604e-06, "loss": 0.8808, "step": 1796 }, { "epoch": 0.16579402606389113, "grad_norm": 1.4297200589498609, "learning_rate": 1.1956951961609032e-06, "loss": 0.7984, "step": 1797 }, { "epoch": 0.16588628762541807, "grad_norm": 1.4074620516650813, "learning_rate": 1.195618461506905e-06, "loss": 0.606, "step": 1798 }, { "epoch": 0.165978549186945, "grad_norm": 1.8470885961957082, "learning_rate": 1.1955416751425638e-06, "loss": 0.922, "step": 1799 }, { "epoch": 0.1660708107484719, "grad_norm": 1.6546661085060437, "learning_rate": 1.1954648370748382e-06, "loss": 0.7227, "step": 1800 }, { "epoch": 0.1660708107484719, "eval_GEN Loss": 0.47097355127334595, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4237675070762634, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9322115182876587, "eval_runtime": 56.9229, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 1800 }, { "epoch": 0.16616307230999885, "grad_norm": 1.6426354604079443, "learning_rate": 1.1953879473106909e-06, "loss": 0.746, "step": 1801 }, { "epoch": 0.16625533387152577, "grad_norm": 2.074416629403325, "learning_rate": 1.19531100585709e-06, "loss": 0.8324, "step": 1802 }, { "epoch": 0.1663475954330527, "grad_norm": 1.7389515438506715, "learning_rate": 1.1952340127210084e-06, "loss": 0.7606, "step": 1803 }, { "epoch": 0.16643985699457964, "grad_norm": 1.2344952399735567, "learning_rate": 1.1951569679094225e-06, "loss": 0.64, "step": 1804 }, { "epoch": 0.16653211855610656, "grad_norm": 1.265859398615304, "learning_rate": 1.195079871429315e-06, "loss": 0.6751, "step": 1805 }, { "epoch": 0.16653211855610656, "eval_GEN Loss": 0.4726194739341736, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4417702555656433, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9378004670143127, "eval_runtime": 56.0617, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1805 }, { "epoch": 0.1666243801176335, "grad_norm": 2.996394260517124, "learning_rate": 1.1950027232876723e-06, "loss": 0.649, "step": 1806 }, { "epoch": 0.16671664167916042, "grad_norm": 2.070350182240329, "learning_rate": 1.1949255234914855e-06, "loss": 0.6666, "step": 1807 }, { "epoch": 0.16680890324068734, "grad_norm": 2.5651078496165804, "learning_rate": 1.1948482720477506e-06, "loss": 0.8245, "step": 1808 }, { "epoch": 0.16690116480221429, "grad_norm": 2.818405435354929, "learning_rate": 1.1947709689634685e-06, "loss": 0.8456, "step": 1809 }, { "epoch": 0.1669934263637412, "grad_norm": 1.3221976867543705, "learning_rate": 1.1946936142456443e-06, "loss": 0.6072, "step": 1810 }, { "epoch": 0.1669934263637412, "eval_GEN Loss": 0.47267863154411316, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.4132683575153351, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9447716474533081, "eval_runtime": 55.9272, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1810 }, { "epoch": 0.16708568792526812, "grad_norm": 1.57219569330212, "learning_rate": 1.194616207901288e-06, "loss": 0.7223, "step": 1811 }, { "epoch": 0.16717794948679507, "grad_norm": 1.4754263132976029, "learning_rate": 1.1945387499374146e-06, "loss": 0.6975, "step": 1812 }, { "epoch": 0.167270211048322, "grad_norm": 2.8838211570500176, "learning_rate": 1.1944612403610429e-06, "loss": 0.9909, "step": 1813 }, { "epoch": 0.16736247260984893, "grad_norm": 2.0838869934665407, "learning_rate": 1.1943836791791974e-06, "loss": 0.8582, "step": 1814 }, { "epoch": 0.16745473417137585, "grad_norm": 2.0720505816262813, "learning_rate": 1.1943060663989065e-06, "loss": 0.7503, "step": 1815 }, { "epoch": 0.16745473417137585, "eval_GEN Loss": 0.4740515649318695, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 Neg": 0.5, "eval_PRM Loss": 0.40221935510635376, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.965624988079071, "eval_runtime": 55.9164, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1815 }, { "epoch": 0.16754699573290277, "grad_norm": 1.9489886302628043, "learning_rate": 1.194228402027204e-06, "loss": 0.6032, "step": 1816 }, { "epoch": 0.16763925729442972, "grad_norm": 3.146227514371221, "learning_rate": 1.1941506860711277e-06, "loss": 0.8231, "step": 1817 }, { "epoch": 0.16773151885595664, "grad_norm": 1.8486025174842518, "learning_rate": 1.1940729185377204e-06, "loss": 0.7736, "step": 1818 }, { "epoch": 0.16782378041748355, "grad_norm": 2.3156176425509485, "learning_rate": 1.1939950994340295e-06, "loss": 0.8739, "step": 1819 }, { "epoch": 0.1679160419790105, "grad_norm": 1.8496325085265781, "learning_rate": 1.1939172287671069e-06, "loss": 0.7784, "step": 1820 }, { "epoch": 0.1679160419790105, "eval_GEN Loss": 0.47243618965148926, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM Loss": 0.40494734048843384, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9459735751152039, "eval_runtime": 55.886, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1820 }, { "epoch": 0.16800830354053742, "grad_norm": 1.369839127474054, "learning_rate": 1.1938393065440094e-06, "loss": 0.8119, "step": 1821 }, { "epoch": 0.16810056510206436, "grad_norm": 1.5572494870346232, "learning_rate": 1.1937613327717989e-06, "loss": 0.6656, "step": 1822 }, { "epoch": 0.16819282666359128, "grad_norm": 1.2733382757256089, "learning_rate": 1.193683307457541e-06, "loss": 0.6123, "step": 1823 }, { "epoch": 0.1682850882251182, "grad_norm": 2.302630167731284, "learning_rate": 1.1936052306083069e-06, "loss": 0.6936, "step": 1824 }, { "epoch": 0.16837734978664515, "grad_norm": 2.0470012487601275, "learning_rate": 1.1935271022311715e-06, "loss": 0.9461, "step": 1825 }, { "epoch": 0.16837734978664515, "eval_GEN Loss": 0.47079581022262573, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4052063822746277, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9320312738418579, "eval_runtime": 55.9966, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1825 }, { "epoch": 0.16846961134817207, "grad_norm": 2.6111676028904975, "learning_rate": 1.1934489223332154e-06, "loss": 0.924, "step": 1826 }, { "epoch": 0.16856187290969898, "grad_norm": 2.276340324668247, "learning_rate": 1.1933706909215232e-06, "loss": 0.8264, "step": 1827 }, { "epoch": 0.16865413447122593, "grad_norm": 1.3305571111012198, "learning_rate": 1.1932924080031843e-06, "loss": 0.7021, "step": 1828 }, { "epoch": 0.16874639603275285, "grad_norm": 1.7884137397764654, "learning_rate": 1.193214073585293e-06, "loss": 0.617, "step": 1829 }, { "epoch": 0.1688386575942798, "grad_norm": 1.9236606276039037, "learning_rate": 1.1931356876749479e-06, "loss": 0.7649, "step": 1830 }, { "epoch": 0.1688386575942798, "eval_GEN Loss": 0.4701881408691406, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3850785493850708, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9339542984962463, "eval_runtime": 55.9442, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1830 }, { "epoch": 0.1689309191558067, "grad_norm": 2.432346492635802, "learning_rate": 1.1930572502792524e-06, "loss": 1.0868, "step": 1831 }, { "epoch": 0.16902318071733363, "grad_norm": 1.7381174837752686, "learning_rate": 1.1929787614053148e-06, "loss": 0.6999, "step": 1832 }, { "epoch": 0.16911544227886058, "grad_norm": 3.1065036645173594, "learning_rate": 1.1929002210602479e-06, "loss": 0.8944, "step": 1833 }, { "epoch": 0.1692077038403875, "grad_norm": 1.3985172252832394, "learning_rate": 1.192821629251169e-06, "loss": 0.7605, "step": 1834 }, { "epoch": 0.16929996540191442, "grad_norm": 2.0996990775788413, "learning_rate": 1.1927429859852003e-06, "loss": 0.7781, "step": 1835 }, { "epoch": 0.16929996540191442, "eval_GEN Loss": 0.46855273842811584, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3788681626319885, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.9432091116905212, "eval_runtime": 55.8578, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1835 }, { "epoch": 0.16939222696344136, "grad_norm": 1.373389670403736, "learning_rate": 1.1926642912694685e-06, "loss": 0.7181, "step": 1836 }, { "epoch": 0.16948448852496828, "grad_norm": 1.3460589965050005, "learning_rate": 1.1925855451111053e-06, "loss": 0.7506, "step": 1837 }, { "epoch": 0.16957675008649523, "grad_norm": 2.1119266670809163, "learning_rate": 1.1925067475172466e-06, "loss": 0.9014, "step": 1838 }, { "epoch": 0.16966901164802214, "grad_norm": 1.7106487417678713, "learning_rate": 1.1924278984950331e-06, "loss": 0.6861, "step": 1839 }, { "epoch": 0.16976127320954906, "grad_norm": 2.2103833265963777, "learning_rate": 1.1923489980516104e-06, "loss": 0.7988, "step": 1840 }, { "epoch": 0.16976127320954906, "eval_GEN Loss": 0.46745893359184265, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36948809027671814, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9295673370361328, "eval_runtime": 55.898, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1840 }, { "epoch": 0.169853534771076, "grad_norm": 2.5020171248511134, "learning_rate": 1.1922700461941283e-06, "loss": 0.6389, "step": 1841 }, { "epoch": 0.16994579633260293, "grad_norm": 2.3921345275085897, "learning_rate": 1.1921910429297418e-06, "loss": 0.8788, "step": 1842 }, { "epoch": 0.17003805789412985, "grad_norm": 1.0725633407914312, "learning_rate": 1.1921119882656101e-06, "loss": 0.597, "step": 1843 }, { "epoch": 0.1701303194556568, "grad_norm": 1.9758289520461825, "learning_rate": 1.1920328822088974e-06, "loss": 0.65, "step": 1844 }, { "epoch": 0.1702225810171837, "grad_norm": 1.3922603490803653, "learning_rate": 1.1919537247667726e-06, "loss": 0.668, "step": 1845 }, { "epoch": 0.1702225810171837, "eval_GEN Loss": 0.46774396300315857, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3799689710140228, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9161057472229004, "eval_runtime": 56.1623, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 1845 }, { "epoch": 0.17031484257871066, "grad_norm": 1.6231177902314144, "learning_rate": 1.1918745159464087e-06, "loss": 0.6615, "step": 1846 }, { "epoch": 0.17040710414023758, "grad_norm": 1.3090450478129656, "learning_rate": 1.191795255754984e-06, "loss": 0.7573, "step": 1847 }, { "epoch": 0.1704993657017645, "grad_norm": 2.794326829308904, "learning_rate": 1.191715944199681e-06, "loss": 0.7382, "step": 1848 }, { "epoch": 0.17059162726329144, "grad_norm": 3.159342566083108, "learning_rate": 1.191636581287687e-06, "loss": 1.1812, "step": 1849 }, { "epoch": 0.17068388882481836, "grad_norm": 1.5542403126104076, "learning_rate": 1.1915571670261944e-06, "loss": 0.4285, "step": 1850 }, { "epoch": 0.17068388882481836, "eval_GEN Loss": 0.4687207341194153, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.38126498460769653, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9199519157409668, "eval_runtime": 55.8179, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 1850 }, { "epoch": 0.17077615038634528, "grad_norm": 1.6366686188141122, "learning_rate": 1.1914777014223993e-06, "loss": 0.6588, "step": 1851 }, { "epoch": 0.17086841194787222, "grad_norm": 1.763222407711819, "learning_rate": 1.1913981844835033e-06, "loss": 0.7652, "step": 1852 }, { "epoch": 0.17096067350939914, "grad_norm": 2.261970091002136, "learning_rate": 1.1913186162167122e-06, "loss": 0.8263, "step": 1853 }, { "epoch": 0.1710529350709261, "grad_norm": 2.233581755609803, "learning_rate": 1.191238996629237e-06, "loss": 0.7478, "step": 1854 }, { "epoch": 0.171145196632453, "grad_norm": 2.5150143585753444, "learning_rate": 1.1911593257282926e-06, "loss": 0.9442, "step": 1855 }, { "epoch": 0.171145196632453, "eval_GEN Loss": 0.4689250588417053, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.37381306290626526, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9309495091438293, "eval_runtime": 55.769, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 1855 }, { "epoch": 0.17123745819397992, "grad_norm": 1.9653967057939061, "learning_rate": 1.1910796035210986e-06, "loss": 0.7906, "step": 1856 }, { "epoch": 0.17132971975550687, "grad_norm": 2.4563107770390133, "learning_rate": 1.1909998300148802e-06, "loss": 0.7522, "step": 1857 }, { "epoch": 0.1714219813170338, "grad_norm": 2.425855312863495, "learning_rate": 1.1909200052168662e-06, "loss": 1.12, "step": 1858 }, { "epoch": 0.1715142428785607, "grad_norm": 1.9460311578544538, "learning_rate": 1.1908401291342906e-06, "loss": 0.8324, "step": 1859 }, { "epoch": 0.17160650444008765, "grad_norm": 1.5972274760046872, "learning_rate": 1.1907602017743919e-06, "loss": 0.8474, "step": 1860 }, { "epoch": 0.17160650444008765, "eval_GEN Loss": 0.46865659952163696, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.38174164295196533, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9336538314819336, "eval_runtime": 55.9742, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1860 }, { "epoch": 0.17169876600161457, "grad_norm": 1.7692435542544476, "learning_rate": 1.1906802231444132e-06, "loss": 0.5984, "step": 1861 }, { "epoch": 0.17179102756314152, "grad_norm": 1.2937208992413296, "learning_rate": 1.190600193251602e-06, "loss": 0.6311, "step": 1862 }, { "epoch": 0.17188328912466844, "grad_norm": 2.1915470807528123, "learning_rate": 1.1905201121032114e-06, "loss": 1.0597, "step": 1863 }, { "epoch": 0.17197555068619536, "grad_norm": 2.094873538641951, "learning_rate": 1.1904399797064978e-06, "loss": 0.6461, "step": 1864 }, { "epoch": 0.1720678122477223, "grad_norm": 1.9349259284452442, "learning_rate": 1.1903597960687235e-06, "loss": 0.7687, "step": 1865 }, { "epoch": 0.1720678122477223, "eval_GEN Loss": 0.4682375192642212, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3880854845046997, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9427884817123413, "eval_runtime": 56.1305, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 1865 }, { "epoch": 0.17216007380924922, "grad_norm": 1.6799371021089247, "learning_rate": 1.1902795611971545e-06, "loss": 0.8063, "step": 1866 }, { "epoch": 0.17225233537077614, "grad_norm": 2.0228644674773713, "learning_rate": 1.1901992750990618e-06, "loss": 0.8166, "step": 1867 }, { "epoch": 0.17234459693230308, "grad_norm": 2.5252102679387276, "learning_rate": 1.1901189377817212e-06, "loss": 0.6701, "step": 1868 }, { "epoch": 0.17243685849383, "grad_norm": 1.9980916127907438, "learning_rate": 1.190038549252413e-06, "loss": 0.809, "step": 1869 }, { "epoch": 0.17252912005535695, "grad_norm": 2.0079522762005446, "learning_rate": 1.189958109518422e-06, "loss": 1.0007, "step": 1870 }, { "epoch": 0.17252912005535695, "eval_GEN Loss": 0.4692970812320709, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.41786956787109375, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9440504908561707, "eval_runtime": 55.8881, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1870 }, { "epoch": 0.17262138161688387, "grad_norm": 1.8787687357136489, "learning_rate": 1.1898776185870378e-06, "loss": 0.8742, "step": 1871 }, { "epoch": 0.1727136431784108, "grad_norm": 2.2622161929407705, "learning_rate": 1.189797076465555e-06, "loss": 0.8112, "step": 1872 }, { "epoch": 0.17280590473993773, "grad_norm": 1.4773040619683082, "learning_rate": 1.1897164831612717e-06, "loss": 0.6426, "step": 1873 }, { "epoch": 0.17289816630146465, "grad_norm": 2.7782129345098676, "learning_rate": 1.1896358386814922e-06, "loss": 0.862, "step": 1874 }, { "epoch": 0.17299042786299157, "grad_norm": 3.2884494924228718, "learning_rate": 1.189555143033524e-06, "loss": 0.6958, "step": 1875 }, { "epoch": 0.17299042786299157, "eval_GEN Loss": 0.4688989818096161, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4337483048439026, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9493389129638672, "eval_runtime": 56.0161, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1875 }, { "epoch": 0.17308268942451852, "grad_norm": 1.9003758440236473, "learning_rate": 1.1894743962246802e-06, "loss": 0.8281, "step": 1876 }, { "epoch": 0.17317495098604543, "grad_norm": 2.4667028650650504, "learning_rate": 1.189393598262278e-06, "loss": 0.8671, "step": 1877 }, { "epoch": 0.17326721254757238, "grad_norm": 1.9819340573548156, "learning_rate": 1.1893127491536397e-06, "loss": 0.5571, "step": 1878 }, { "epoch": 0.1733594741090993, "grad_norm": 1.9869611101078306, "learning_rate": 1.1892318489060918e-06, "loss": 0.8948, "step": 1879 }, { "epoch": 0.17345173567062622, "grad_norm": 2.054294013985498, "learning_rate": 1.1891508975269655e-06, "loss": 0.7908, "step": 1880 }, { "epoch": 0.17345173567062622, "eval_GEN Loss": 0.4685158133506775, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM Loss": 0.3908511698246002, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.951442301273346, "eval_runtime": 56.7739, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 1880 }, { "epoch": 0.17354399723215316, "grad_norm": 1.6717171649021387, "learning_rate": 1.189069895023597e-06, "loss": 0.7849, "step": 1881 }, { "epoch": 0.17363625879368008, "grad_norm": 1.7825294071368827, "learning_rate": 1.1889888414033268e-06, "loss": 0.791, "step": 1882 }, { "epoch": 0.173728520355207, "grad_norm": 2.3399100576380185, "learning_rate": 1.1889077366735e-06, "loss": 0.8288, "step": 1883 }, { "epoch": 0.17382078191673395, "grad_norm": 1.4659728050258447, "learning_rate": 1.1888265808414667e-06, "loss": 0.7501, "step": 1884 }, { "epoch": 0.17391304347826086, "grad_norm": 1.55020720573834, "learning_rate": 1.188745373914581e-06, "loss": 0.7398, "step": 1885 }, { "epoch": 0.17391304347826086, "eval_GEN Loss": 0.4690574109554291, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM Loss": 0.3869512975215912, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9814903736114502, "eval_runtime": 55.822, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1885 }, { "epoch": 0.1740053050397878, "grad_norm": 2.3344400330851114, "learning_rate": 1.1886641159002022e-06, "loss": 0.7529, "step": 1886 }, { "epoch": 0.17409756660131473, "grad_norm": 1.982474628280561, "learning_rate": 1.1885828068056937e-06, "loss": 0.7663, "step": 1887 }, { "epoch": 0.17418982816284165, "grad_norm": 2.180397432523735, "learning_rate": 1.1885014466384245e-06, "loss": 0.655, "step": 1888 }, { "epoch": 0.1742820897243686, "grad_norm": 3.8786558250419008, "learning_rate": 1.1884200354057672e-06, "loss": 0.9249, "step": 1889 }, { "epoch": 0.1743743512858955, "grad_norm": 1.4128292216687506, "learning_rate": 1.1883385731150995e-06, "loss": 0.794, "step": 1890 }, { "epoch": 0.1743743512858955, "eval_GEN Loss": 0.46872907876968384, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM Loss": 0.3835473656654358, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.9583533406257629, "eval_runtime": 56.173, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 1890 }, { "epoch": 0.17446661284742243, "grad_norm": 1.7512735734999927, "learning_rate": 1.1882570597738032e-06, "loss": 0.8348, "step": 1891 }, { "epoch": 0.17455887440894938, "grad_norm": 2.5214015504072105, "learning_rate": 1.1881754953892661e-06, "loss": 0.7224, "step": 1892 }, { "epoch": 0.1746511359704763, "grad_norm": 1.6795900667309693, "learning_rate": 1.1880938799688787e-06, "loss": 0.8449, "step": 1893 }, { "epoch": 0.17474339753200324, "grad_norm": 1.7118345168670674, "learning_rate": 1.188012213520038e-06, "loss": 0.7201, "step": 1894 }, { "epoch": 0.17483565909353016, "grad_norm": 1.584372664384906, "learning_rate": 1.1879304960501441e-06, "loss": 0.7297, "step": 1895 }, { "epoch": 0.17483565909353016, "eval_GEN Loss": 0.4695640206336975, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3987809717655182, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.918870210647583, "eval_runtime": 55.7564, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 1895 }, { "epoch": 0.17492792065505708, "grad_norm": 2.6131805911009676, "learning_rate": 1.1878487275666025e-06, "loss": 0.7928, "step": 1896 }, { "epoch": 0.17502018221658402, "grad_norm": 1.5966418591815272, "learning_rate": 1.1877669080768235e-06, "loss": 0.7113, "step": 1897 }, { "epoch": 0.17511244377811094, "grad_norm": 1.6367611060894423, "learning_rate": 1.1876850375882213e-06, "loss": 0.6772, "step": 1898 }, { "epoch": 0.17520470533963786, "grad_norm": 2.0825135677424855, "learning_rate": 1.1876031161082154e-06, "loss": 0.8016, "step": 1899 }, { "epoch": 0.1752969669011648, "grad_norm": 1.9678959563769876, "learning_rate": 1.1875211436442293e-06, "loss": 0.8319, "step": 1900 }, { "epoch": 0.1752969669011648, "eval_GEN Loss": 0.4692772924900055, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4279230535030365, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9149038195610046, "eval_runtime": 55.7671, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 1900 }, { "epoch": 0.17538922846269173, "grad_norm": 2.3252179355430083, "learning_rate": 1.187439120203692e-06, "loss": 0.5821, "step": 1901 }, { "epoch": 0.17548149002421867, "grad_norm": 2.9514616238302844, "learning_rate": 1.1873570457940364e-06, "loss": 0.8697, "step": 1902 }, { "epoch": 0.1755737515857456, "grad_norm": 1.8577708695461148, "learning_rate": 1.1872749204227e-06, "loss": 0.6237, "step": 1903 }, { "epoch": 0.1756660131472725, "grad_norm": 1.6169552802513891, "learning_rate": 1.1871927440971254e-06, "loss": 0.696, "step": 1904 }, { "epoch": 0.17575827470879946, "grad_norm": 2.739107800746727, "learning_rate": 1.1871105168247592e-06, "loss": 0.6307, "step": 1905 }, { "epoch": 0.17575827470879946, "eval_GEN Loss": 0.46751323342323303, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.38527750968933105, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8990384340286255, "eval_runtime": 56.2352, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 1905 }, { "epoch": 0.17585053627032637, "grad_norm": 1.683112032608916, "learning_rate": 1.1870282386130536e-06, "loss": 0.6837, "step": 1906 }, { "epoch": 0.1759427978318533, "grad_norm": 1.5973651948445948, "learning_rate": 1.186945909469464e-06, "loss": 0.6812, "step": 1907 }, { "epoch": 0.17603505939338024, "grad_norm": 2.3245973463415366, "learning_rate": 1.1868635294014517e-06, "loss": 0.9884, "step": 1908 }, { "epoch": 0.17612732095490716, "grad_norm": 1.817496038080407, "learning_rate": 1.186781098416482e-06, "loss": 0.7388, "step": 1909 }, { "epoch": 0.1762195825164341, "grad_norm": 1.3311852279017433, "learning_rate": 1.1866986165220248e-06, "loss": 0.6314, "step": 1910 }, { "epoch": 0.1762195825164341, "eval_GEN Loss": 0.4685840606689453, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.35463541746139526, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9057692289352417, "eval_runtime": 55.8633, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1910 }, { "epoch": 0.17631184407796102, "grad_norm": 1.7186034726360713, "learning_rate": 1.186616083725555e-06, "loss": 0.7453, "step": 1911 }, { "epoch": 0.17640410563948794, "grad_norm": 2.224287522579521, "learning_rate": 1.1865335000345515e-06, "loss": 0.608, "step": 1912 }, { "epoch": 0.1764963672010149, "grad_norm": 1.7476775322804345, "learning_rate": 1.1864508654564986e-06, "loss": 0.5619, "step": 1913 }, { "epoch": 0.1765886287625418, "grad_norm": 2.0527580222396797, "learning_rate": 1.1863681799988844e-06, "loss": 0.7012, "step": 1914 }, { "epoch": 0.17668089032406872, "grad_norm": 2.3313585606950946, "learning_rate": 1.186285443669202e-06, "loss": 0.8966, "step": 1915 }, { "epoch": 0.17668089032406872, "eval_GEN Loss": 0.46925368905067444, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.34594297409057617, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9025240540504456, "eval_runtime": 57.0764, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 1915 }, { "epoch": 0.17677315188559567, "grad_norm": 2.535215320237209, "learning_rate": 1.1862026564749492e-06, "loss": 0.9057, "step": 1916 }, { "epoch": 0.1768654134471226, "grad_norm": 3.5084157619272656, "learning_rate": 1.1861198184236286e-06, "loss": 0.9853, "step": 1917 }, { "epoch": 0.17695767500864953, "grad_norm": 2.060703280233832, "learning_rate": 1.1860369295227468e-06, "loss": 0.8597, "step": 1918 }, { "epoch": 0.17704993657017645, "grad_norm": 1.5742432988107469, "learning_rate": 1.1859539897798152e-06, "loss": 0.8047, "step": 1919 }, { "epoch": 0.17714219813170337, "grad_norm": 1.7976768419993143, "learning_rate": 1.1858709992023501e-06, "loss": 0.7721, "step": 1920 }, { "epoch": 0.17714219813170337, "eval_GEN Loss": 0.4682477116584778, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3484565317630768, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8586538434028625, "eval_runtime": 55.9293, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1920 }, { "epoch": 0.17723445969323032, "grad_norm": 2.343535713364003, "learning_rate": 1.1857879577978724e-06, "loss": 0.5613, "step": 1921 }, { "epoch": 0.17732672125475724, "grad_norm": 1.757333883870705, "learning_rate": 1.185704865573907e-06, "loss": 0.7187, "step": 1922 }, { "epoch": 0.17741898281628415, "grad_norm": 2.0400670424123133, "learning_rate": 1.1856217225379842e-06, "loss": 0.8537, "step": 1923 }, { "epoch": 0.1775112443778111, "grad_norm": 1.7479042814278654, "learning_rate": 1.1855385286976387e-06, "loss": 0.7641, "step": 1924 }, { "epoch": 0.17760350593933802, "grad_norm": 2.417533290690098, "learning_rate": 1.1854552840604092e-06, "loss": 0.7124, "step": 1925 }, { "epoch": 0.17760350593933802, "eval_GEN Loss": 0.4683780074119568, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.3596678078174591, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.854687511920929, "eval_runtime": 56.0748, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1925 }, { "epoch": 0.17769576750086497, "grad_norm": 1.641541075462338, "learning_rate": 1.18537198863384e-06, "loss": 0.8352, "step": 1926 }, { "epoch": 0.17778802906239188, "grad_norm": 1.3910642781393008, "learning_rate": 1.1852886424254788e-06, "loss": 0.6602, "step": 1927 }, { "epoch": 0.1778802906239188, "grad_norm": 2.232958456514103, "learning_rate": 1.185205245442879e-06, "loss": 0.8616, "step": 1928 }, { "epoch": 0.17797255218544575, "grad_norm": 2.3839649191841006, "learning_rate": 1.185121797693598e-06, "loss": 0.631, "step": 1929 }, { "epoch": 0.17806481374697267, "grad_norm": 1.8444372479741982, "learning_rate": 1.1850382991851982e-06, "loss": 0.7821, "step": 1930 }, { "epoch": 0.17806481374697267, "eval_GEN Loss": 0.4683499038219452, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.3657971918582916, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8576322197914124, "eval_runtime": 55.8482, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1930 }, { "epoch": 0.17815707530849959, "grad_norm": 2.25169689693887, "learning_rate": 1.1849547499252462e-06, "loss": 0.9682, "step": 1931 }, { "epoch": 0.17824933687002653, "grad_norm": 1.947708892171765, "learning_rate": 1.1848711499213134e-06, "loss": 0.6699, "step": 1932 }, { "epoch": 0.17834159843155345, "grad_norm": 2.7578340026793176, "learning_rate": 1.1847874991809757e-06, "loss": 0.7486, "step": 1933 }, { "epoch": 0.1784338599930804, "grad_norm": 1.8144475086471232, "learning_rate": 1.1847037977118136e-06, "loss": 0.7841, "step": 1934 }, { "epoch": 0.17852612155460731, "grad_norm": 2.1749335875167395, "learning_rate": 1.1846200455214128e-06, "loss": 0.8312, "step": 1935 }, { "epoch": 0.17852612155460731, "eval_GEN Loss": 0.4700009822845459, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.3598850667476654, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8522836565971375, "eval_runtime": 56.0167, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1935 }, { "epoch": 0.17861838311613423, "grad_norm": 1.8202686727472561, "learning_rate": 1.184536242617362e-06, "loss": 0.7958, "step": 1936 }, { "epoch": 0.17871064467766118, "grad_norm": 2.3130305737826484, "learning_rate": 1.1844523890072566e-06, "loss": 0.7722, "step": 1937 }, { "epoch": 0.1788029062391881, "grad_norm": 1.9812235010674377, "learning_rate": 1.1843684846986949e-06, "loss": 0.7294, "step": 1938 }, { "epoch": 0.17889516780071502, "grad_norm": 3.1377665851712013, "learning_rate": 1.1842845296992809e-06, "loss": 0.902, "step": 1939 }, { "epoch": 0.17898742936224196, "grad_norm": 2.0456290093446277, "learning_rate": 1.1842005240166222e-06, "loss": 0.8287, "step": 1940 }, { "epoch": 0.17898742936224196, "eval_GEN Loss": 0.46932679414749146, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9202453987730062, "eval_PRM F1 AUC": 0.8431115767417497, "eval_PRM F1 Neg": 0.7346938775510204, "eval_PRM Loss": 0.34539997577667236, "eval_PRM NPV": 0.6923076923076923, "eval_PRM Precision": 0.9375, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.844531238079071, "eval_runtime": 55.9681, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1940 }, { "epoch": 0.17907969092376888, "grad_norm": 1.7501401490304878, "learning_rate": 1.184116467658332e-06, "loss": 0.598, "step": 1941 }, { "epoch": 0.17917195248529583, "grad_norm": 2.751844920732577, "learning_rate": 1.1840323606320273e-06, "loss": 0.8756, "step": 1942 }, { "epoch": 0.17926421404682275, "grad_norm": 1.7486262039835792, "learning_rate": 1.1839482029453302e-06, "loss": 0.6555, "step": 1943 }, { "epoch": 0.17935647560834966, "grad_norm": 3.3452249547582564, "learning_rate": 1.1838639946058673e-06, "loss": 0.8685, "step": 1944 }, { "epoch": 0.1794487371698766, "grad_norm": 1.8288374287804032, "learning_rate": 1.1837797356212693e-06, "loss": 0.8282, "step": 1945 }, { "epoch": 0.1794487371698766, "eval_GEN Loss": 0.4705554246902466, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.328626811504364, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8490384817123413, "eval_runtime": 56.3921, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 1945 }, { "epoch": 0.17954099873140353, "grad_norm": 1.943313902167551, "learning_rate": 1.1836954259991724e-06, "loss": 0.917, "step": 1946 }, { "epoch": 0.17963326029293045, "grad_norm": 1.5216936319454786, "learning_rate": 1.1836110657472162e-06, "loss": 0.6325, "step": 1947 }, { "epoch": 0.1797255218544574, "grad_norm": 2.5124030329025335, "learning_rate": 1.1835266548730465e-06, "loss": 0.7952, "step": 1948 }, { "epoch": 0.1798177834159843, "grad_norm": 1.6176394503610152, "learning_rate": 1.1834421933843118e-06, "loss": 0.7563, "step": 1949 }, { "epoch": 0.17991004497751126, "grad_norm": 2.4086105514681106, "learning_rate": 1.1833576812886666e-06, "loss": 0.847, "step": 1950 }, { "epoch": 0.17991004497751126, "eval_GEN Loss": 0.46942463517189026, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3282986879348755, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8774038553237915, "eval_runtime": 56.8631, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1950 }, { "epoch": 0.18000230653903818, "grad_norm": 4.602223665033289, "learning_rate": 1.1832731185937695e-06, "loss": 0.8888, "step": 1951 }, { "epoch": 0.1800945681005651, "grad_norm": 1.8659980358360455, "learning_rate": 1.1831885053072837e-06, "loss": 0.7075, "step": 1952 }, { "epoch": 0.18018682966209204, "grad_norm": 1.8337120619647553, "learning_rate": 1.183103841436877e-06, "loss": 0.7455, "step": 1953 }, { "epoch": 0.18027909122361896, "grad_norm": 1.8044581737282863, "learning_rate": 1.1830191269902216e-06, "loss": 0.8378, "step": 1954 }, { "epoch": 0.18037135278514588, "grad_norm": 1.843116592608778, "learning_rate": 1.1829343619749944e-06, "loss": 0.7311, "step": 1955 }, { "epoch": 0.18037135278514588, "eval_GEN Loss": 0.4702025353908539, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33778148889541626, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8728365302085876, "eval_runtime": 56.9483, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 1955 }, { "epoch": 0.18046361434667282, "grad_norm": 1.5054335447800735, "learning_rate": 1.1828495463988774e-06, "loss": 0.6745, "step": 1956 }, { "epoch": 0.18055587590819974, "grad_norm": 1.920825500204467, "learning_rate": 1.1827646802695563e-06, "loss": 0.8852, "step": 1957 }, { "epoch": 0.1806481374697267, "grad_norm": 2.0527177750313452, "learning_rate": 1.182679763594722e-06, "loss": 0.9191, "step": 1958 }, { "epoch": 0.1807403990312536, "grad_norm": 1.6131473811718557, "learning_rate": 1.1825947963820698e-06, "loss": 0.7022, "step": 1959 }, { "epoch": 0.18083266059278053, "grad_norm": 1.5671800926925206, "learning_rate": 1.1825097786392994e-06, "loss": 0.6837, "step": 1960 }, { "epoch": 0.18083266059278053, "eval_GEN Loss": 0.4705111086368561, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9156626506024096, "eval_PRM F1 AUC": 0.8056574122577265, "eval_PRM F1 Neg": 0.6956521739130435, "eval_PRM Loss": 0.34896120429039, "eval_PRM NPV": 0.6956521739130435, "eval_PRM Precision": 0.9156626506024096, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8716346025466919, "eval_runtime": 56.8601, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 1960 }, { "epoch": 0.18092492215430747, "grad_norm": 2.79084900873371, "learning_rate": 1.1824247103741154e-06, "loss": 0.7971, "step": 1961 }, { "epoch": 0.1810171837158344, "grad_norm": 1.9170428272343674, "learning_rate": 1.1823395915942265e-06, "loss": 0.7246, "step": 1962 }, { "epoch": 0.1811094452773613, "grad_norm": 1.9462537574889882, "learning_rate": 1.1822544223073467e-06, "loss": 0.8289, "step": 1963 }, { "epoch": 0.18120170683888825, "grad_norm": 1.9375282632531803, "learning_rate": 1.1821692025211942e-06, "loss": 0.76, "step": 1964 }, { "epoch": 0.18129396840041517, "grad_norm": 1.3435109446325704, "learning_rate": 1.1820839322434913e-06, "loss": 0.6949, "step": 1965 }, { "epoch": 0.18129396840041517, "eval_GEN Loss": 0.4705446660518646, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.37570104002952576, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8603365421295166, "eval_runtime": 56.0616, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 1965 }, { "epoch": 0.18138622996194212, "grad_norm": 2.409717875745877, "learning_rate": 1.1819986114819656e-06, "loss": 0.8287, "step": 1966 }, { "epoch": 0.18147849152346904, "grad_norm": 2.018430092064614, "learning_rate": 1.1819132402443491e-06, "loss": 0.8305, "step": 1967 }, { "epoch": 0.18157075308499596, "grad_norm": 1.6910998307111729, "learning_rate": 1.1818278185383783e-06, "loss": 0.774, "step": 1968 }, { "epoch": 0.1816630146465229, "grad_norm": 2.1156338275691637, "learning_rate": 1.181742346371794e-06, "loss": 0.632, "step": 1969 }, { "epoch": 0.18175527620804982, "grad_norm": 1.8875932222931249, "learning_rate": 1.1816568237523419e-06, "loss": 0.668, "step": 1970 }, { "epoch": 0.18175527620804982, "eval_GEN Loss": 0.4716153144836426, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.39824846386909485, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8655648827552795, "eval_runtime": 55.9045, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1970 }, { "epoch": 0.18184753776957674, "grad_norm": 1.8218580804105595, "learning_rate": 1.1815712506877725e-06, "loss": 0.6293, "step": 1971 }, { "epoch": 0.18193979933110369, "grad_norm": 2.323150747517259, "learning_rate": 1.18148562718584e-06, "loss": 0.7472, "step": 1972 }, { "epoch": 0.1820320608926306, "grad_norm": 2.2830565197763906, "learning_rate": 1.181399953254304e-06, "loss": 0.6765, "step": 1973 }, { "epoch": 0.18212432245415755, "grad_norm": 2.81192357035052, "learning_rate": 1.1813142289009286e-06, "loss": 0.809, "step": 1974 }, { "epoch": 0.18221658401568447, "grad_norm": 1.9730415783176882, "learning_rate": 1.1812284541334821e-06, "loss": 0.8976, "step": 1975 }, { "epoch": 0.18221658401568447, "eval_GEN Loss": 0.4716103971004486, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3583613634109497, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8695913553237915, "eval_runtime": 55.9433, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 1975 }, { "epoch": 0.1823088455772114, "grad_norm": 2.8985150365969434, "learning_rate": 1.1811426289597377e-06, "loss": 0.8941, "step": 1976 }, { "epoch": 0.18240110713873833, "grad_norm": 2.1626277533488376, "learning_rate": 1.1810567533874728e-06, "loss": 0.7578, "step": 1977 }, { "epoch": 0.18249336870026525, "grad_norm": 2.357520483642952, "learning_rate": 1.1809708274244695e-06, "loss": 0.8202, "step": 1978 }, { "epoch": 0.18258563026179217, "grad_norm": 3.1136973651999953, "learning_rate": 1.1808848510785149e-06, "loss": 1.128, "step": 1979 }, { "epoch": 0.18267789182331912, "grad_norm": 2.472151221670113, "learning_rate": 1.1807988243574e-06, "loss": 0.9272, "step": 1980 }, { "epoch": 0.18267789182331912, "eval_GEN Loss": 0.4723505675792694, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3514373302459717, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8723557591438293, "eval_runtime": 55.8327, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 1980 }, { "epoch": 0.18277015338484603, "grad_norm": 1.7355618460112476, "learning_rate": 1.1807127472689208e-06, "loss": 0.6718, "step": 1981 }, { "epoch": 0.18286241494637298, "grad_norm": 1.7950478995183463, "learning_rate": 1.180626619820878e-06, "loss": 0.6722, "step": 1982 }, { "epoch": 0.1829546765078999, "grad_norm": 2.4822181820471343, "learning_rate": 1.180540442021076e-06, "loss": 0.8901, "step": 1983 }, { "epoch": 0.18304693806942682, "grad_norm": 1.6620784138258664, "learning_rate": 1.1804542138773247e-06, "loss": 0.7279, "step": 1984 }, { "epoch": 0.18313919963095376, "grad_norm": 1.669328072447358, "learning_rate": 1.1803679353974384e-06, "loss": 0.7729, "step": 1985 }, { "epoch": 0.18313919963095376, "eval_GEN Loss": 0.47229859232902527, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.35772424936294556, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8501201868057251, "eval_runtime": 56.0208, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 1985 }, { "epoch": 0.18323146119248068, "grad_norm": 1.334830857646573, "learning_rate": 1.1802816065892356e-06, "loss": 0.6131, "step": 1986 }, { "epoch": 0.1833237227540076, "grad_norm": 2.405568253699568, "learning_rate": 1.1801952274605397e-06, "loss": 0.7406, "step": 1987 }, { "epoch": 0.18341598431553455, "grad_norm": 2.1917242170043476, "learning_rate": 1.1801087980191784e-06, "loss": 0.7511, "step": 1988 }, { "epoch": 0.18350824587706147, "grad_norm": 2.554704922098671, "learning_rate": 1.1800223182729839e-06, "loss": 0.896, "step": 1989 }, { "epoch": 0.1836005074385884, "grad_norm": 2.3679975677847698, "learning_rate": 1.1799357882297934e-06, "loss": 0.9535, "step": 1990 }, { "epoch": 0.1836005074385884, "eval_GEN Loss": 0.47487273812294006, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8930817610062893, "eval_PRM F1 AUC": 0.819015191199581, "eval_PRM F1 Neg": 0.6792452830188679, "eval_PRM Loss": 0.3714655339717865, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9342105263157895, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.845973551273346, "eval_runtime": 55.9976, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 1990 }, { "epoch": 0.18369276900011533, "grad_norm": 1.6180444080504108, "learning_rate": 1.1798492078974484e-06, "loss": 0.6486, "step": 1991 }, { "epoch": 0.18378503056164225, "grad_norm": 1.683006147370453, "learning_rate": 1.1797625772837946e-06, "loss": 0.859, "step": 1992 }, { "epoch": 0.1838772921231692, "grad_norm": 2.2510671580043202, "learning_rate": 1.1796758963966828e-06, "loss": 0.7019, "step": 1993 }, { "epoch": 0.1839695536846961, "grad_norm": 1.8567289016022117, "learning_rate": 1.1795891652439684e-06, "loss": 0.8697, "step": 1994 }, { "epoch": 0.18406181524622303, "grad_norm": 2.422870701730181, "learning_rate": 1.1795023838335107e-06, "loss": 0.7371, "step": 1995 }, { "epoch": 0.18406181524622303, "eval_GEN Loss": 0.4758482873439789, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9, "eval_PRM F1 AUC": 0.8250392875851232, "eval_PRM F1 Neg": 0.6923076923076923, "eval_PRM Loss": 0.3763881325721741, "eval_PRM NPV": 0.6206896551724138, "eval_PRM Precision": 0.935064935064935, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8481971025466919, "eval_runtime": 55.8838, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 1995 }, { "epoch": 0.18415407680774998, "grad_norm": 1.8054001363809202, "learning_rate": 1.1794155521731744e-06, "loss": 0.6933, "step": 1996 }, { "epoch": 0.1842463383692769, "grad_norm": 1.5414872633375913, "learning_rate": 1.1793286702708279e-06, "loss": 0.8097, "step": 1997 }, { "epoch": 0.18433859993080384, "grad_norm": 2.322123260692024, "learning_rate": 1.1792417381343448e-06, "loss": 0.9594, "step": 1998 }, { "epoch": 0.18443086149233076, "grad_norm": 2.403147298475866, "learning_rate": 1.1791547557716031e-06, "loss": 0.6702, "step": 1999 }, { "epoch": 0.18452312305385768, "grad_norm": 1.8937608761817435, "learning_rate": 1.1790677231904852e-06, "loss": 0.7323, "step": 2000 }, { "epoch": 0.18452312305385768, "eval_GEN Loss": 0.47482290863990784, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9135802469135802, "eval_PRM F1 AUC": 0.8370874803562075, "eval_PRM F1 Neg": 0.72, "eval_PRM Loss": 0.34736916422843933, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9367088607594937, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8415865302085876, "eval_runtime": 55.9308, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2000 }, { "epoch": 0.18461538461538463, "grad_norm": 1.7218811898237494, "learning_rate": 1.1789806403988781e-06, "loss": 0.6016, "step": 2001 }, { "epoch": 0.18470764617691154, "grad_norm": 1.6092138907105, "learning_rate": 1.1788935074046735e-06, "loss": 0.8096, "step": 2002 }, { "epoch": 0.18479990773843846, "grad_norm": 1.5971983932629983, "learning_rate": 1.1788063242157671e-06, "loss": 0.7057, "step": 2003 }, { "epoch": 0.1848921692999654, "grad_norm": 1.3621746398913959, "learning_rate": 1.1787190908400602e-06, "loss": 0.5874, "step": 2004 }, { "epoch": 0.18498443086149233, "grad_norm": 3.8139246079298226, "learning_rate": 1.1786318072854574e-06, "loss": 0.8478, "step": 2005 }, { "epoch": 0.18498443086149233, "eval_GEN Loss": 0.47527387738227844, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33743923902511597, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8596153855323792, "eval_runtime": 56.9064, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2005 }, { "epoch": 0.18507669242301927, "grad_norm": 2.781499716829389, "learning_rate": 1.1785444735598692e-06, "loss": 0.8955, "step": 2006 }, { "epoch": 0.1851689539845462, "grad_norm": 2.206461851230783, "learning_rate": 1.1784570896712091e-06, "loss": 0.861, "step": 2007 }, { "epoch": 0.1852612155460731, "grad_norm": 1.6405028562717892, "learning_rate": 1.1783696556273966e-06, "loss": 0.7969, "step": 2008 }, { "epoch": 0.18535347710760006, "grad_norm": 1.937622062292657, "learning_rate": 1.1782821714363548e-06, "loss": 0.7386, "step": 2009 }, { "epoch": 0.18544573866912697, "grad_norm": 1.871704342430374, "learning_rate": 1.178194637106012e-06, "loss": 0.7642, "step": 2010 }, { "epoch": 0.18544573866912697, "eval_GEN Loss": 0.4762713313102722, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3472242057323456, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8661057949066162, "eval_runtime": 56.8425, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2010 }, { "epoch": 0.1855380002306539, "grad_norm": 1.300223142727639, "learning_rate": 1.1781070526443002e-06, "loss": 0.6246, "step": 2011 }, { "epoch": 0.18563026179218084, "grad_norm": 1.4839254987161208, "learning_rate": 1.1780194180591567e-06, "loss": 0.712, "step": 2012 }, { "epoch": 0.18572252335370776, "grad_norm": 1.3638374277079743, "learning_rate": 1.1779317333585232e-06, "loss": 0.5256, "step": 2013 }, { "epoch": 0.1858147849152347, "grad_norm": 3.1800809335198794, "learning_rate": 1.1778439985503456e-06, "loss": 0.781, "step": 2014 }, { "epoch": 0.18590704647676162, "grad_norm": 2.8899657971448702, "learning_rate": 1.1777562136425747e-06, "loss": 1.0692, "step": 2015 }, { "epoch": 0.18590704647676162, "eval_GEN Loss": 0.4769386053085327, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35975176095962524, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8862980604171753, "eval_runtime": 56.8541, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2015 }, { "epoch": 0.18599930803828854, "grad_norm": 2.145923227050257, "learning_rate": 1.1776683786431655e-06, "loss": 0.7344, "step": 2016 }, { "epoch": 0.1860915695998155, "grad_norm": 1.5044043557834834, "learning_rate": 1.1775804935600781e-06, "loss": 0.7167, "step": 2017 }, { "epoch": 0.1861838311613424, "grad_norm": 1.742271416763045, "learning_rate": 1.1774925584012766e-06, "loss": 0.7182, "step": 2018 }, { "epoch": 0.18627609272286932, "grad_norm": 2.3624915019513644, "learning_rate": 1.1774045731747299e-06, "loss": 0.8248, "step": 2019 }, { "epoch": 0.18636835428439627, "grad_norm": 2.1935117177206647, "learning_rate": 1.177316537888411e-06, "loss": 0.7486, "step": 2020 }, { "epoch": 0.18636835428439627, "eval_GEN Loss": 0.4771266579627991, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3712487518787384, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9055288434028625, "eval_runtime": 57.2909, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 2020 }, { "epoch": 0.1864606158459232, "grad_norm": 1.7514578539412164, "learning_rate": 1.1772284525502983e-06, "loss": 0.7124, "step": 2021 }, { "epoch": 0.1865528774074501, "grad_norm": 1.6268295502484904, "learning_rate": 1.177140317168374e-06, "loss": 0.6699, "step": 2022 }, { "epoch": 0.18664513896897705, "grad_norm": 1.7886518441477073, "learning_rate": 1.177052131750625e-06, "loss": 0.6993, "step": 2023 }, { "epoch": 0.18673740053050397, "grad_norm": 5.2219209888016325, "learning_rate": 1.1769638963050428e-06, "loss": 1.0932, "step": 2024 }, { "epoch": 0.18682966209203092, "grad_norm": 2.1651132863048232, "learning_rate": 1.1768756108396237e-06, "loss": 0.7829, "step": 2025 }, { "epoch": 0.18682966209203092, "eval_GEN Loss": 0.4762979745864868, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.37799975275993347, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9197115302085876, "eval_runtime": 56.8767, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2025 }, { "epoch": 0.18692192365355784, "grad_norm": 2.4120105181234504, "learning_rate": 1.176787275362368e-06, "loss": 0.9647, "step": 2026 }, { "epoch": 0.18701418521508476, "grad_norm": 1.4392912028263638, "learning_rate": 1.1766988898812808e-06, "loss": 0.7379, "step": 2027 }, { "epoch": 0.1871064467766117, "grad_norm": 1.59708899434638, "learning_rate": 1.176610454404372e-06, "loss": 0.7667, "step": 2028 }, { "epoch": 0.18719870833813862, "grad_norm": 1.3651238541526256, "learning_rate": 1.1765219689396553e-06, "loss": 0.6794, "step": 2029 }, { "epoch": 0.18729096989966554, "grad_norm": 2.079074025639708, "learning_rate": 1.17643343349515e-06, "loss": 0.8413, "step": 2030 }, { "epoch": 0.18729096989966554, "eval_GEN Loss": 0.47625789046287537, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3893580138683319, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9141826629638672, "eval_runtime": 56.9139, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2030 }, { "epoch": 0.18738323146119248, "grad_norm": 1.3647385935413638, "learning_rate": 1.1763448480788786e-06, "loss": 0.6232, "step": 2031 }, { "epoch": 0.1874754930227194, "grad_norm": 3.510711336384845, "learning_rate": 1.1762562126988696e-06, "loss": 1.1275, "step": 2032 }, { "epoch": 0.18756775458424635, "grad_norm": 1.7667114211392427, "learning_rate": 1.176167527363155e-06, "loss": 0.7605, "step": 2033 }, { "epoch": 0.18766001614577327, "grad_norm": 1.5509237422154474, "learning_rate": 1.176078792079771e-06, "loss": 0.7539, "step": 2034 }, { "epoch": 0.18775227770730019, "grad_norm": 1.929023562753418, "learning_rate": 1.1759900068567599e-06, "loss": 0.8275, "step": 2035 }, { "epoch": 0.18775227770730019, "eval_GEN Loss": 0.47494471073150635, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.40141040086746216, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9050480723381042, "eval_runtime": 55.9735, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2035 }, { "epoch": 0.18784453926882713, "grad_norm": 1.5786079669231259, "learning_rate": 1.1759011717021668e-06, "loss": 0.7178, "step": 2036 }, { "epoch": 0.18793680083035405, "grad_norm": 3.363351897038916, "learning_rate": 1.1758122866240425e-06, "loss": 0.9335, "step": 2037 }, { "epoch": 0.18802906239188097, "grad_norm": 1.7553134317965489, "learning_rate": 1.1757233516304419e-06, "loss": 0.7692, "step": 2038 }, { "epoch": 0.18812132395340792, "grad_norm": 1.5074484864053896, "learning_rate": 1.1756343667294243e-06, "loss": 0.841, "step": 2039 }, { "epoch": 0.18821358551493483, "grad_norm": 1.9001341763009556, "learning_rate": 1.1755453319290535e-06, "loss": 0.6041, "step": 2040 }, { "epoch": 0.18821358551493483, "eval_GEN Loss": 0.47478625178337097, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3914642632007599, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9007812738418579, "eval_runtime": 56.0471, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2040 }, { "epoch": 0.18830584707646178, "grad_norm": 1.887618824502614, "learning_rate": 1.1754562472373984e-06, "loss": 0.61, "step": 2041 }, { "epoch": 0.1883981086379887, "grad_norm": 2.537116970872114, "learning_rate": 1.1753671126625315e-06, "loss": 0.9013, "step": 2042 }, { "epoch": 0.18849037019951562, "grad_norm": 1.749885410614083, "learning_rate": 1.1752779282125307e-06, "loss": 0.7976, "step": 2043 }, { "epoch": 0.18858263176104256, "grad_norm": 1.7703292830260156, "learning_rate": 1.1751886938954779e-06, "loss": 0.691, "step": 2044 }, { "epoch": 0.18867489332256948, "grad_norm": 1.9204534035808125, "learning_rate": 1.1750994097194595e-06, "loss": 0.6879, "step": 2045 }, { "epoch": 0.18867489332256948, "eval_GEN Loss": 0.4729349613189697, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.37438541650772095, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8925480842590332, "eval_runtime": 55.9191, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2045 }, { "epoch": 0.1887671548840964, "grad_norm": 1.5905092183160414, "learning_rate": 1.175010075692567e-06, "loss": 0.7958, "step": 2046 }, { "epoch": 0.18885941644562335, "grad_norm": 2.599172986193549, "learning_rate": 1.1749206918228956e-06, "loss": 1.0229, "step": 2047 }, { "epoch": 0.18895167800715026, "grad_norm": 1.5407394588399215, "learning_rate": 1.1748312581185453e-06, "loss": 0.6175, "step": 2048 }, { "epoch": 0.1890439395686772, "grad_norm": 1.7075539827400186, "learning_rate": 1.1747417745876211e-06, "loss": 0.7414, "step": 2049 }, { "epoch": 0.18913620113020413, "grad_norm": 1.7729999806091692, "learning_rate": 1.174652241238232e-06, "loss": 0.8014, "step": 2050 }, { "epoch": 0.18913620113020413, "eval_GEN Loss": 0.4732709228992462, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3624724745750427, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.893750011920929, "eval_runtime": 56.1189, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 2050 }, { "epoch": 0.18922846269173105, "grad_norm": 1.3814801364156035, "learning_rate": 1.1745626580784916e-06, "loss": 0.7294, "step": 2051 }, { "epoch": 0.189320724253258, "grad_norm": 2.742469468717978, "learning_rate": 1.174473025116518e-06, "loss": 0.9501, "step": 2052 }, { "epoch": 0.1894129858147849, "grad_norm": 1.899074295936426, "learning_rate": 1.1743833423604344e-06, "loss": 0.6854, "step": 2053 }, { "epoch": 0.18950524737631183, "grad_norm": 1.805086519608829, "learning_rate": 1.1742936098183672e-06, "loss": 0.6486, "step": 2054 }, { "epoch": 0.18959750893783878, "grad_norm": 2.569618963834657, "learning_rate": 1.1742038274984485e-06, "loss": 0.7753, "step": 2055 }, { "epoch": 0.18959750893783878, "eval_GEN Loss": 0.47299501299858093, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36366239190101624, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8921874761581421, "eval_runtime": 56.0044, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2055 }, { "epoch": 0.1896897704993657, "grad_norm": 2.914152850560168, "learning_rate": 1.1741139954088147e-06, "loss": 0.8671, "step": 2056 }, { "epoch": 0.18978203206089264, "grad_norm": 1.4479355516929415, "learning_rate": 1.174024113557606e-06, "loss": 0.7495, "step": 2057 }, { "epoch": 0.18987429362241956, "grad_norm": 1.3999078074787001, "learning_rate": 1.1739341819529683e-06, "loss": 0.6818, "step": 2058 }, { "epoch": 0.18996655518394648, "grad_norm": 1.797137528146229, "learning_rate": 1.1738442006030507e-06, "loss": 0.6997, "step": 2059 }, { "epoch": 0.19005881674547342, "grad_norm": 2.181809965715182, "learning_rate": 1.173754169516008e-06, "loss": 0.9243, "step": 2060 }, { "epoch": 0.19005881674547342, "eval_GEN Loss": 0.47521984577178955, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.38565847277641296, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.893629789352417, "eval_runtime": 55.9352, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2060 }, { "epoch": 0.19015107830700034, "grad_norm": 1.6489695067822996, "learning_rate": 1.1736640886999987e-06, "loss": 0.8201, "step": 2061 }, { "epoch": 0.19024333986852726, "grad_norm": 2.2030014674323226, "learning_rate": 1.1735739581631858e-06, "loss": 0.8497, "step": 2062 }, { "epoch": 0.1903356014300542, "grad_norm": 2.391613576562548, "learning_rate": 1.1734837779137374e-06, "loss": 0.6548, "step": 2063 }, { "epoch": 0.19042786299158113, "grad_norm": 2.438905114414268, "learning_rate": 1.1733935479598258e-06, "loss": 0.8612, "step": 2064 }, { "epoch": 0.19052012455310807, "grad_norm": 1.907891784799133, "learning_rate": 1.1733032683096279e-06, "loss": 0.7451, "step": 2065 }, { "epoch": 0.19052012455310807, "eval_GEN Loss": 0.476781964302063, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.3958512544631958, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9001802802085876, "eval_runtime": 56.1362, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 2065 }, { "epoch": 0.190612386114635, "grad_norm": 1.412398127994599, "learning_rate": 1.1732129389713246e-06, "loss": 0.7208, "step": 2066 }, { "epoch": 0.1907046476761619, "grad_norm": 1.5377625095076017, "learning_rate": 1.1731225599531018e-06, "loss": 0.7473, "step": 2067 }, { "epoch": 0.19079690923768886, "grad_norm": 1.739774552853579, "learning_rate": 1.1730321312631499e-06, "loss": 0.7613, "step": 2068 }, { "epoch": 0.19088917079921577, "grad_norm": 1.5628178567314877, "learning_rate": 1.1729416529096635e-06, "loss": 0.6486, "step": 2069 }, { "epoch": 0.1909814323607427, "grad_norm": 1.8349339622653353, "learning_rate": 1.1728511249008424e-06, "loss": 0.9405, "step": 2070 }, { "epoch": 0.1909814323607427, "eval_GEN Loss": 0.47572657465934753, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3906554877758026, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9009014368057251, "eval_runtime": 55.8639, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2070 }, { "epoch": 0.19107369392226964, "grad_norm": 1.6341536898808608, "learning_rate": 1.1727605472448899e-06, "loss": 0.641, "step": 2071 }, { "epoch": 0.19116595548379656, "grad_norm": 1.5734194760396665, "learning_rate": 1.1726699199500142e-06, "loss": 0.6824, "step": 2072 }, { "epoch": 0.1912582170453235, "grad_norm": 1.899392202542072, "learning_rate": 1.1725792430244286e-06, "loss": 0.8438, "step": 2073 }, { "epoch": 0.19135047860685042, "grad_norm": 1.4655415320012528, "learning_rate": 1.17248851647635e-06, "loss": 0.7546, "step": 2074 }, { "epoch": 0.19144274016837734, "grad_norm": 1.5406032119092525, "learning_rate": 1.1723977403140002e-06, "loss": 0.7013, "step": 2075 }, { "epoch": 0.19144274016837734, "eval_GEN Loss": 0.4752981960773468, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3990924656391144, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9125601053237915, "eval_runtime": 55.9667, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2075 }, { "epoch": 0.1915350017299043, "grad_norm": 2.1057681799535932, "learning_rate": 1.1723069145456055e-06, "loss": 0.7732, "step": 2076 }, { "epoch": 0.1916272632914312, "grad_norm": 1.8863658332607263, "learning_rate": 1.172216039179397e-06, "loss": 0.7382, "step": 2077 }, { "epoch": 0.19171952485295812, "grad_norm": 2.2750369010593197, "learning_rate": 1.1721251142236095e-06, "loss": 0.713, "step": 2078 }, { "epoch": 0.19181178641448507, "grad_norm": 2.5443842796035256, "learning_rate": 1.172034139686483e-06, "loss": 0.7111, "step": 2079 }, { "epoch": 0.191904047976012, "grad_norm": 2.0015549144460234, "learning_rate": 1.1719431155762617e-06, "loss": 0.8692, "step": 2080 }, { "epoch": 0.191904047976012, "eval_GEN Loss": 0.4749683737754822, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.4088994860649109, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9153845906257629, "eval_runtime": 56.0366, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2080 }, { "epoch": 0.19199630953753893, "grad_norm": 1.723692974059648, "learning_rate": 1.1718520419011943e-06, "loss": 0.7381, "step": 2081 }, { "epoch": 0.19208857109906585, "grad_norm": 1.6204546727085558, "learning_rate": 1.171760918669534e-06, "loss": 0.6291, "step": 2082 }, { "epoch": 0.19218083266059277, "grad_norm": 1.7591591876718784, "learning_rate": 1.171669745889539e-06, "loss": 0.6556, "step": 2083 }, { "epoch": 0.19227309422211972, "grad_norm": 1.6837994993989869, "learning_rate": 1.1715785235694709e-06, "loss": 0.5594, "step": 2084 }, { "epoch": 0.19236535578364664, "grad_norm": 2.1498111899108165, "learning_rate": 1.1714872517175967e-06, "loss": 0.976, "step": 2085 }, { "epoch": 0.19236535578364664, "eval_GEN Loss": 0.47523412108421326, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.4029233455657959, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9121394157409668, "eval_runtime": 55.9498, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2085 }, { "epoch": 0.19245761734517355, "grad_norm": 1.594466370015717, "learning_rate": 1.1713959303421877e-06, "loss": 0.7225, "step": 2086 }, { "epoch": 0.1925498789067005, "grad_norm": 1.2921041280679968, "learning_rate": 1.1713045594515194e-06, "loss": 0.6543, "step": 2087 }, { "epoch": 0.19264214046822742, "grad_norm": 1.603007946484057, "learning_rate": 1.171213139053872e-06, "loss": 0.757, "step": 2088 }, { "epoch": 0.19273440202975436, "grad_norm": 2.7035496344344776, "learning_rate": 1.1711216691575302e-06, "loss": 0.9921, "step": 2089 }, { "epoch": 0.19282666359128128, "grad_norm": 2.627501808473552, "learning_rate": 1.171030149770783e-06, "loss": 0.7437, "step": 2090 }, { "epoch": 0.19282666359128128, "eval_GEN Loss": 0.47421345114707947, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.37928611040115356, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9138821959495544, "eval_runtime": 55.8172, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2090 }, { "epoch": 0.1929189251528082, "grad_norm": 2.939675116898713, "learning_rate": 1.1709385809019243e-06, "loss": 0.9881, "step": 2091 }, { "epoch": 0.19301118671433515, "grad_norm": 1.5382624829545013, "learning_rate": 1.170846962559252e-06, "loss": 0.5454, "step": 2092 }, { "epoch": 0.19310344827586207, "grad_norm": 2.412140666845858, "learning_rate": 1.1707552947510689e-06, "loss": 0.8449, "step": 2093 }, { "epoch": 0.19319570983738898, "grad_norm": 2.050495972674451, "learning_rate": 1.170663577485682e-06, "loss": 0.8667, "step": 2094 }, { "epoch": 0.19328797139891593, "grad_norm": 2.412449004816114, "learning_rate": 1.1705718107714025e-06, "loss": 0.8212, "step": 2095 }, { "epoch": 0.19328797139891593, "eval_GEN Loss": 0.47555992007255554, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.37556973099708557, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9121994972229004, "eval_runtime": 56.066, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 2095 }, { "epoch": 0.19338023296044285, "grad_norm": 1.8618620941503157, "learning_rate": 1.1704799946165471e-06, "loss": 0.9453, "step": 2096 }, { "epoch": 0.1934724945219698, "grad_norm": 1.7248835980945905, "learning_rate": 1.1703881290294357e-06, "loss": 0.6785, "step": 2097 }, { "epoch": 0.19356475608349671, "grad_norm": 2.42521747941105, "learning_rate": 1.1702962140183938e-06, "loss": 0.9181, "step": 2098 }, { "epoch": 0.19365701764502363, "grad_norm": 1.6569213548155524, "learning_rate": 1.1702042495917507e-06, "loss": 0.4116, "step": 2099 }, { "epoch": 0.19374927920655058, "grad_norm": 2.445742982708023, "learning_rate": 1.1701122357578402e-06, "loss": 0.8711, "step": 2100 }, { "epoch": 0.19374927920655058, "eval_GEN Loss": 0.47657743096351624, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38126426935195923, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.904026448726654, "eval_runtime": 55.9303, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2100 }, { "epoch": 0.1938415407680775, "grad_norm": 2.489860100516864, "learning_rate": 1.170020172525001e-06, "loss": 0.8869, "step": 2101 }, { "epoch": 0.19393380232960442, "grad_norm": 1.7185828996157118, "learning_rate": 1.1699280599015758e-06, "loss": 0.8002, "step": 2102 }, { "epoch": 0.19402606389113136, "grad_norm": 1.730053667769409, "learning_rate": 1.1698358978959121e-06, "loss": 0.6431, "step": 2103 }, { "epoch": 0.19411832545265828, "grad_norm": 2.210130976296359, "learning_rate": 1.1697436865163617e-06, "loss": 0.8812, "step": 2104 }, { "epoch": 0.19421058701418523, "grad_norm": 1.7501335028584264, "learning_rate": 1.1696514257712812e-06, "loss": 0.6264, "step": 2105 }, { "epoch": 0.19421058701418523, "eval_GEN Loss": 0.47559112310409546, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37901872396469116, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9000601172447205, "eval_runtime": 55.8737, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2105 }, { "epoch": 0.19430284857571214, "grad_norm": 1.518035137093612, "learning_rate": 1.169559115669031e-06, "loss": 0.8045, "step": 2106 }, { "epoch": 0.19439511013723906, "grad_norm": 1.8605848033256487, "learning_rate": 1.1694667562179766e-06, "loss": 0.7365, "step": 2107 }, { "epoch": 0.194487371698766, "grad_norm": 2.2692257263639997, "learning_rate": 1.1693743474264879e-06, "loss": 0.8885, "step": 2108 }, { "epoch": 0.19457963326029293, "grad_norm": 1.7389934815117432, "learning_rate": 1.1692818893029386e-06, "loss": 0.61, "step": 2109 }, { "epoch": 0.19467189482181985, "grad_norm": 1.8801892562984148, "learning_rate": 1.1691893818557081e-06, "loss": 0.7616, "step": 2110 }, { "epoch": 0.19467189482181985, "eval_GEN Loss": 0.4751238226890564, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3778570294380188, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8924880027770996, "eval_runtime": 56.1755, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 2110 }, { "epoch": 0.1947641563833468, "grad_norm": 2.9935999868900574, "learning_rate": 1.1690968250931793e-06, "loss": 0.8215, "step": 2111 }, { "epoch": 0.1948564179448737, "grad_norm": 1.240026989214338, "learning_rate": 1.1690042190237397e-06, "loss": 0.7554, "step": 2112 }, { "epoch": 0.19494867950640066, "grad_norm": 1.663347006712576, "learning_rate": 1.1689115636557817e-06, "loss": 0.7469, "step": 2113 }, { "epoch": 0.19504094106792758, "grad_norm": 2.1324165398294737, "learning_rate": 1.1688188589977012e-06, "loss": 0.878, "step": 2114 }, { "epoch": 0.1951332026294545, "grad_norm": 1.5318585856133733, "learning_rate": 1.1687261050578999e-06, "loss": 0.7284, "step": 2115 }, { "epoch": 0.1951332026294545, "eval_GEN Loss": 0.47557395696640015, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38053131103515625, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8861178159713745, "eval_runtime": 55.9378, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2115 }, { "epoch": 0.19522546419098144, "grad_norm": 1.9406484809626303, "learning_rate": 1.1686333018447831e-06, "loss": 0.7447, "step": 2116 }, { "epoch": 0.19531772575250836, "grad_norm": 1.4661856513402853, "learning_rate": 1.168540449366761e-06, "loss": 0.7673, "step": 2117 }, { "epoch": 0.19540998731403528, "grad_norm": 1.5532965239645762, "learning_rate": 1.1684475476322477e-06, "loss": 0.6529, "step": 2118 }, { "epoch": 0.19550224887556222, "grad_norm": 1.7328866001668306, "learning_rate": 1.1683545966496624e-06, "loss": 0.7228, "step": 2119 }, { "epoch": 0.19559451043708914, "grad_norm": 2.653230913036073, "learning_rate": 1.1682615964274282e-06, "loss": 0.9043, "step": 2120 }, { "epoch": 0.19559451043708914, "eval_GEN Loss": 0.4752795100212097, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3887932300567627, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8825721144676208, "eval_runtime": 56.2164, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 2120 }, { "epoch": 0.1956867719986161, "grad_norm": 1.834892901245111, "learning_rate": 1.1681685469739728e-06, "loss": 0.736, "step": 2121 }, { "epoch": 0.195779033560143, "grad_norm": 2.268595314023195, "learning_rate": 1.168075448297729e-06, "loss": 0.7198, "step": 2122 }, { "epoch": 0.19587129512166992, "grad_norm": 2.8209869109637893, "learning_rate": 1.167982300407133e-06, "loss": 0.9889, "step": 2123 }, { "epoch": 0.19596355668319687, "grad_norm": 2.2758613417274995, "learning_rate": 1.1678891033106265e-06, "loss": 0.7325, "step": 2124 }, { "epoch": 0.1960558182447238, "grad_norm": 2.5891500558623437, "learning_rate": 1.167795857016655e-06, "loss": 0.7827, "step": 2125 }, { "epoch": 0.1960558182447238, "eval_GEN Loss": 0.4752276539802551, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3605865240097046, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8686298131942749, "eval_runtime": 56.9304, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2125 }, { "epoch": 0.1961480798062507, "grad_norm": 1.7321506869110495, "learning_rate": 1.1677025615336684e-06, "loss": 0.8529, "step": 2126 }, { "epoch": 0.19624034136777765, "grad_norm": 1.6446856506620964, "learning_rate": 1.1676092168701214e-06, "loss": 0.812, "step": 2127 }, { "epoch": 0.19633260292930457, "grad_norm": 2.035225255341396, "learning_rate": 1.1675158230344731e-06, "loss": 0.6864, "step": 2128 }, { "epoch": 0.19642486449083152, "grad_norm": 1.6727419464219047, "learning_rate": 1.1674223800351871e-06, "loss": 0.6947, "step": 2129 }, { "epoch": 0.19651712605235844, "grad_norm": 2.7270117150880293, "learning_rate": 1.1673288878807312e-06, "loss": 0.9565, "step": 2130 }, { "epoch": 0.19651712605235844, "eval_GEN Loss": 0.4728906452655792, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9146341463414634, "eval_PRM F1 AUC": 0.8213724463069669, "eval_PRM F1 Neg": 0.7083333333333334, "eval_PRM Loss": 0.34505847096443176, "eval_PRM NPV": 0.68, "eval_PRM Precision": 0.9259259259259259, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8583533763885498, "eval_runtime": 56.8477, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2130 }, { "epoch": 0.19660938761388536, "grad_norm": 2.315561439377134, "learning_rate": 1.1672353465795778e-06, "loss": 0.8579, "step": 2131 }, { "epoch": 0.1967016491754123, "grad_norm": 2.445484447216849, "learning_rate": 1.1671417561402037e-06, "loss": 0.7155, "step": 2132 }, { "epoch": 0.19679391073693922, "grad_norm": 1.4171824307104404, "learning_rate": 1.1670481165710906e-06, "loss": 0.786, "step": 2133 }, { "epoch": 0.19688617229846614, "grad_norm": 1.9530654960217884, "learning_rate": 1.1669544278807239e-06, "loss": 0.791, "step": 2134 }, { "epoch": 0.19697843385999309, "grad_norm": 1.9259482942527117, "learning_rate": 1.1668606900775936e-06, "loss": 0.855, "step": 2135 }, { "epoch": 0.19697843385999309, "eval_GEN Loss": 0.4720461666584015, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.34648963809013367, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8544471263885498, "eval_runtime": 56.7497, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2135 }, { "epoch": 0.19707069542152, "grad_norm": 1.7540937429449306, "learning_rate": 1.166766903170195e-06, "loss": 0.6871, "step": 2136 }, { "epoch": 0.19716295698304695, "grad_norm": 2.2431423540689486, "learning_rate": 1.1666730671670269e-06, "loss": 0.7345, "step": 2137 }, { "epoch": 0.19725521854457387, "grad_norm": 2.180562741419492, "learning_rate": 1.1665791820765926e-06, "loss": 0.6921, "step": 2138 }, { "epoch": 0.1973474801061008, "grad_norm": 1.869450975392008, "learning_rate": 1.1664852479074005e-06, "loss": 0.8264, "step": 2139 }, { "epoch": 0.19743974166762773, "grad_norm": 1.57533144178452, "learning_rate": 1.1663912646679628e-06, "loss": 0.6432, "step": 2140 }, { "epoch": 0.19743974166762773, "eval_GEN Loss": 0.47172442078590393, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.3543279767036438, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8531851172447205, "eval_runtime": 55.8033, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2140 }, { "epoch": 0.19753200322915465, "grad_norm": 1.2884555954442063, "learning_rate": 1.1662972323667967e-06, "loss": 0.5873, "step": 2141 }, { "epoch": 0.19762426479068157, "grad_norm": 2.5057557700609068, "learning_rate": 1.1662031510124233e-06, "loss": 0.7394, "step": 2142 }, { "epoch": 0.19771652635220852, "grad_norm": 2.1793536972246894, "learning_rate": 1.1661090206133686e-06, "loss": 0.8169, "step": 2143 }, { "epoch": 0.19780878791373543, "grad_norm": 1.7726817338950984, "learning_rate": 1.1660148411781625e-06, "loss": 0.824, "step": 2144 }, { "epoch": 0.19790104947526238, "grad_norm": 2.0722325893696443, "learning_rate": 1.16592061271534e-06, "loss": 0.5855, "step": 2145 }, { "epoch": 0.19790104947526238, "eval_GEN Loss": 0.4713197350502014, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3694514036178589, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8676682710647583, "eval_runtime": 55.8797, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2145 }, { "epoch": 0.1979933110367893, "grad_norm": 1.4638687069641676, "learning_rate": 1.1658263352334402e-06, "loss": 0.684, "step": 2146 }, { "epoch": 0.19808557259831622, "grad_norm": 1.3822063982717827, "learning_rate": 1.1657320087410068e-06, "loss": 0.6227, "step": 2147 }, { "epoch": 0.19817783415984316, "grad_norm": 1.709733050362052, "learning_rate": 1.1656376332465873e-06, "loss": 0.6928, "step": 2148 }, { "epoch": 0.19827009572137008, "grad_norm": 1.8248242738528617, "learning_rate": 1.1655432087587348e-06, "loss": 0.8613, "step": 2149 }, { "epoch": 0.198362357282897, "grad_norm": 1.9798829605323542, "learning_rate": 1.165448735286006e-06, "loss": 0.7774, "step": 2150 }, { "epoch": 0.198362357282897, "eval_GEN Loss": 0.4713093638420105, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3774649500846863, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8806490302085876, "eval_runtime": 55.8184, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2150 }, { "epoch": 0.19845461884442395, "grad_norm": 2.9023380907319134, "learning_rate": 1.1653542128369615e-06, "loss": 1.0227, "step": 2151 }, { "epoch": 0.19854688040595087, "grad_norm": 1.9566433766921913, "learning_rate": 1.1652596414201683e-06, "loss": 0.6662, "step": 2152 }, { "epoch": 0.1986391419674778, "grad_norm": 3.0263774573118845, "learning_rate": 1.1651650210441958e-06, "loss": 1.0691, "step": 2153 }, { "epoch": 0.19873140352900473, "grad_norm": 1.8388460908019544, "learning_rate": 1.1650703517176188e-06, "loss": 0.5693, "step": 2154 }, { "epoch": 0.19882366509053165, "grad_norm": 1.7077486572942435, "learning_rate": 1.1649756334490165e-06, "loss": 0.7307, "step": 2155 }, { "epoch": 0.19882366509053165, "eval_GEN Loss": 0.4734862446784973, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4129568040370941, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8912860751152039, "eval_runtime": 55.758, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 2155 }, { "epoch": 0.1989159266520586, "grad_norm": 2.1519996732380497, "learning_rate": 1.1648808662469725e-06, "loss": 0.7858, "step": 2156 }, { "epoch": 0.1990081882135855, "grad_norm": 2.8792455478180288, "learning_rate": 1.1647860501200744e-06, "loss": 0.8351, "step": 2157 }, { "epoch": 0.19910044977511243, "grad_norm": 2.5978872367652084, "learning_rate": 1.164691185076915e-06, "loss": 0.7649, "step": 2158 }, { "epoch": 0.19919271133663938, "grad_norm": 2.4542299987549216, "learning_rate": 1.1645962711260908e-06, "loss": 0.861, "step": 2159 }, { "epoch": 0.1992849728981663, "grad_norm": 1.826676457982078, "learning_rate": 1.1645013082762034e-06, "loss": 0.7304, "step": 2160 }, { "epoch": 0.1992849728981663, "eval_GEN Loss": 0.4735404849052429, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4202714264392853, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.899218738079071, "eval_runtime": 55.8929, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2160 }, { "epoch": 0.19937723445969324, "grad_norm": 2.0889619371874173, "learning_rate": 1.164406296535858e-06, "loss": 0.875, "step": 2161 }, { "epoch": 0.19946949602122016, "grad_norm": 2.213142481426363, "learning_rate": 1.1643112359136648e-06, "loss": 0.6971, "step": 2162 }, { "epoch": 0.19956175758274708, "grad_norm": 2.0919058344979153, "learning_rate": 1.1642161264182389e-06, "loss": 0.7692, "step": 2163 }, { "epoch": 0.19965401914427403, "grad_norm": 2.0040945903130782, "learning_rate": 1.1641209680581986e-06, "loss": 0.7919, "step": 2164 }, { "epoch": 0.19974628070580094, "grad_norm": 2.67666508515558, "learning_rate": 1.1640257608421679e-06, "loss": 1.0232, "step": 2165 }, { "epoch": 0.19974628070580094, "eval_GEN Loss": 0.4732702374458313, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.41842952370643616, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9045072197914124, "eval_runtime": 55.9137, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2165 }, { "epoch": 0.19983854226732786, "grad_norm": 2.211300331233957, "learning_rate": 1.163930504778774e-06, "loss": 0.8335, "step": 2166 }, { "epoch": 0.1999308038288548, "grad_norm": 2.2516906475534624, "learning_rate": 1.1638351998766495e-06, "loss": 1.0556, "step": 2167 }, { "epoch": 0.20002306539038173, "grad_norm": 1.854903417938329, "learning_rate": 1.1637398461444313e-06, "loss": 0.7604, "step": 2168 }, { "epoch": 0.20011532695190867, "grad_norm": 2.695239187375436, "learning_rate": 1.16364444359076e-06, "loss": 0.9138, "step": 2169 }, { "epoch": 0.2002075885134356, "grad_norm": 2.417092201907459, "learning_rate": 1.1635489922242816e-06, "loss": 0.8951, "step": 2170 }, { "epoch": 0.2002075885134356, "eval_GEN Loss": 0.47371259331703186, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4227430522441864, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9177283644676208, "eval_runtime": 55.7797, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2170 }, { "epoch": 0.2002998500749625, "grad_norm": 2.8940595211064455, "learning_rate": 1.1634534920536458e-06, "loss": 0.926, "step": 2171 }, { "epoch": 0.20039211163648946, "grad_norm": 1.5796208126736675, "learning_rate": 1.1633579430875067e-06, "loss": 0.8173, "step": 2172 }, { "epoch": 0.20048437319801637, "grad_norm": 2.2360021997772366, "learning_rate": 1.1632623453345238e-06, "loss": 0.8244, "step": 2173 }, { "epoch": 0.2005766347595433, "grad_norm": 1.9058751759846053, "learning_rate": 1.1631666988033595e-06, "loss": 0.7873, "step": 2174 }, { "epoch": 0.20066889632107024, "grad_norm": 1.637412668967031, "learning_rate": 1.1630710035026824e-06, "loss": 0.8754, "step": 2175 }, { "epoch": 0.20066889632107024, "eval_GEN Loss": 0.4731568992137909, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.3976535201072693, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9191105961799622, "eval_runtime": 55.7887, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2175 }, { "epoch": 0.20076115788259716, "grad_norm": 2.0792545831549614, "learning_rate": 1.1629752594411636e-06, "loss": 0.8187, "step": 2176 }, { "epoch": 0.2008534194441241, "grad_norm": 1.5427235907101737, "learning_rate": 1.1628794666274803e-06, "loss": 0.7435, "step": 2177 }, { "epoch": 0.20094568100565102, "grad_norm": 1.9341408509913365, "learning_rate": 1.1627836250703127e-06, "loss": 0.842, "step": 2178 }, { "epoch": 0.20103794256717794, "grad_norm": 2.5845751856843986, "learning_rate": 1.162687734778347e-06, "loss": 0.6199, "step": 2179 }, { "epoch": 0.2011302041287049, "grad_norm": 1.7097335293652327, "learning_rate": 1.1625917957602723e-06, "loss": 0.6996, "step": 2180 }, { "epoch": 0.2011302041287049, "eval_GEN Loss": 0.4752475619316101, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.40738368034362793, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9316105842590332, "eval_runtime": 55.9206, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2180 }, { "epoch": 0.2012224656902318, "grad_norm": 1.7254864136798387, "learning_rate": 1.1624958080247826e-06, "loss": 0.6264, "step": 2181 }, { "epoch": 0.20131472725175872, "grad_norm": 1.7315952013574136, "learning_rate": 1.1623997715805771e-06, "loss": 0.6824, "step": 2182 }, { "epoch": 0.20140698881328567, "grad_norm": 1.5971953206050904, "learning_rate": 1.1623036864363582e-06, "loss": 0.7546, "step": 2183 }, { "epoch": 0.2014992503748126, "grad_norm": 2.0592919744913183, "learning_rate": 1.1622075526008337e-06, "loss": 0.636, "step": 2184 }, { "epoch": 0.20159151193633953, "grad_norm": 1.4963490463559308, "learning_rate": 1.162111370082715e-06, "loss": 0.6686, "step": 2185 }, { "epoch": 0.20159151193633953, "eval_GEN Loss": 0.475746750831604, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3980647027492523, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9399038553237915, "eval_runtime": 56.1855, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 2185 }, { "epoch": 0.20168377349786645, "grad_norm": 1.7118715761439545, "learning_rate": 1.1620151388907186e-06, "loss": 0.8563, "step": 2186 }, { "epoch": 0.20177603505939337, "grad_norm": 1.8824076807560626, "learning_rate": 1.1619188590335651e-06, "loss": 0.9051, "step": 2187 }, { "epoch": 0.20186829662092032, "grad_norm": 1.502251399123566, "learning_rate": 1.1618225305199794e-06, "loss": 0.563, "step": 2188 }, { "epoch": 0.20196055818244724, "grad_norm": 2.339386555095602, "learning_rate": 1.161726153358691e-06, "loss": 0.9121, "step": 2189 }, { "epoch": 0.20205281974397415, "grad_norm": 1.9191486206770145, "learning_rate": 1.1616297275584338e-06, "loss": 0.8298, "step": 2190 }, { "epoch": 0.20205281974397415, "eval_GEN Loss": 0.4742852747440338, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3946433961391449, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9516226053237915, "eval_runtime": 56.8234, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2190 }, { "epoch": 0.2021450813055011, "grad_norm": 1.4872003622550216, "learning_rate": 1.1615332531279459e-06, "loss": 0.7534, "step": 2191 }, { "epoch": 0.20223734286702802, "grad_norm": 1.8293995126466744, "learning_rate": 1.1614367300759702e-06, "loss": 0.7144, "step": 2192 }, { "epoch": 0.20232960442855497, "grad_norm": 2.424816644760713, "learning_rate": 1.1613401584112535e-06, "loss": 0.9931, "step": 2193 }, { "epoch": 0.20242186599008188, "grad_norm": 1.4672034085405155, "learning_rate": 1.1612435381425478e-06, "loss": 0.6609, "step": 2194 }, { "epoch": 0.2025141275516088, "grad_norm": 3.1144754000810835, "learning_rate": 1.1611468692786083e-06, "loss": 0.8067, "step": 2195 }, { "epoch": 0.2025141275516088, "eval_GEN Loss": 0.47315630316734314, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.39846715331077576, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9524038434028625, "eval_runtime": 56.0352, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2195 }, { "epoch": 0.20260638911313575, "grad_norm": 1.5713749669294763, "learning_rate": 1.1610501518281957e-06, "loss": 0.9158, "step": 2196 }, { "epoch": 0.20269865067466267, "grad_norm": 2.8028927388889344, "learning_rate": 1.1609533858000747e-06, "loss": 0.7719, "step": 2197 }, { "epoch": 0.20279091223618959, "grad_norm": 1.6739765872226005, "learning_rate": 1.160856571203014e-06, "loss": 0.7266, "step": 2198 }, { "epoch": 0.20288317379771653, "grad_norm": 1.615812143284236, "learning_rate": 1.1607597080457876e-06, "loss": 0.8073, "step": 2199 }, { "epoch": 0.20297543535924345, "grad_norm": 2.141367380534688, "learning_rate": 1.160662796337173e-06, "loss": 0.8588, "step": 2200 }, { "epoch": 0.20297543535924345, "eval_GEN Loss": 0.4725123941898346, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.4200517237186432, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.940625011920929, "eval_runtime": 56.0489, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2200 }, { "epoch": 0.2030676969207704, "grad_norm": 1.8213880271221528, "learning_rate": 1.1605658360859528e-06, "loss": 0.6891, "step": 2201 }, { "epoch": 0.20315995848229731, "grad_norm": 1.656531375970182, "learning_rate": 1.1604688273009136e-06, "loss": 0.7833, "step": 2202 }, { "epoch": 0.20325222004382423, "grad_norm": 2.263318720055018, "learning_rate": 1.1603717699908461e-06, "loss": 0.7284, "step": 2203 }, { "epoch": 0.20334448160535118, "grad_norm": 2.576418203657882, "learning_rate": 1.1602746641645462e-06, "loss": 0.7333, "step": 2204 }, { "epoch": 0.2034367431668781, "grad_norm": 1.767694725912544, "learning_rate": 1.160177509830814e-06, "loss": 0.6952, "step": 2205 }, { "epoch": 0.2034367431668781, "eval_GEN Loss": 0.47379887104034424, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.44554200768470764, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9538461565971375, "eval_runtime": 55.7983, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2205 }, { "epoch": 0.20352900472840502, "grad_norm": 2.023565969537719, "learning_rate": 1.160080306998453e-06, "loss": 0.5573, "step": 2206 }, { "epoch": 0.20362126628993196, "grad_norm": 1.5327095711767684, "learning_rate": 1.1599830556762728e-06, "loss": 0.7337, "step": 2207 }, { "epoch": 0.20371352785145888, "grad_norm": 2.4388722426346257, "learning_rate": 1.1598857558730858e-06, "loss": 0.8009, "step": 2208 }, { "epoch": 0.20380578941298583, "grad_norm": 1.7281652578654474, "learning_rate": 1.1597884075977097e-06, "loss": 0.6855, "step": 2209 }, { "epoch": 0.20389805097451275, "grad_norm": 2.320746802377084, "learning_rate": 1.1596910108589665e-06, "loss": 0.864, "step": 2210 }, { "epoch": 0.20389805097451275, "eval_GEN Loss": 0.4759262502193451, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.4454600512981415, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9655048251152039, "eval_runtime": 55.8888, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2210 }, { "epoch": 0.20399031253603966, "grad_norm": 1.5772755489697625, "learning_rate": 1.1595935656656823e-06, "loss": 0.6484, "step": 2211 }, { "epoch": 0.2040825740975666, "grad_norm": 1.9593363728966164, "learning_rate": 1.1594960720266875e-06, "loss": 0.8232, "step": 2212 }, { "epoch": 0.20417483565909353, "grad_norm": 3.061828812767506, "learning_rate": 1.1593985299508173e-06, "loss": 0.7763, "step": 2213 }, { "epoch": 0.20426709722062045, "grad_norm": 2.034800705615405, "learning_rate": 1.1593009394469113e-06, "loss": 0.6538, "step": 2214 }, { "epoch": 0.2043593587821474, "grad_norm": 2.2677067288477204, "learning_rate": 1.1592033005238132e-06, "loss": 0.8398, "step": 2215 }, { "epoch": 0.2043593587821474, "eval_GEN Loss": 0.4771953225135803, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.42658737301826477, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9716346263885498, "eval_runtime": 57.2219, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 2215 }, { "epoch": 0.2044516203436743, "grad_norm": 1.8709461722271208, "learning_rate": 1.159105613190371e-06, "loss": 0.6145, "step": 2216 }, { "epoch": 0.20454388190520126, "grad_norm": 1.6362598916212179, "learning_rate": 1.1590078774554375e-06, "loss": 0.5606, "step": 2217 }, { "epoch": 0.20463614346672818, "grad_norm": 1.5807983911321843, "learning_rate": 1.1589100933278698e-06, "loss": 0.5946, "step": 2218 }, { "epoch": 0.2047284050282551, "grad_norm": 1.9108688609185664, "learning_rate": 1.158812260816529e-06, "loss": 0.5409, "step": 2219 }, { "epoch": 0.20482066658978204, "grad_norm": 1.9265345321607514, "learning_rate": 1.1587143799302806e-06, "loss": 0.6977, "step": 2220 }, { "epoch": 0.20482066658978204, "eval_GEN Loss": 0.4785206615924835, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.41944700479507446, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9948317408561707, "eval_runtime": 56.9385, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2220 }, { "epoch": 0.20491292815130896, "grad_norm": 2.395886053095591, "learning_rate": 1.1586164506779952e-06, "loss": 0.828, "step": 2221 }, { "epoch": 0.20500518971283588, "grad_norm": 2.119859533382076, "learning_rate": 1.1585184730685472e-06, "loss": 0.7004, "step": 2222 }, { "epoch": 0.20509745127436282, "grad_norm": 1.5753261897183282, "learning_rate": 1.1584204471108151e-06, "loss": 0.6569, "step": 2223 }, { "epoch": 0.20518971283588974, "grad_norm": 2.784071443294006, "learning_rate": 1.1583223728136828e-06, "loss": 0.8896, "step": 2224 }, { "epoch": 0.2052819743974167, "grad_norm": 3.5920705062442426, "learning_rate": 1.1582242501860375e-06, "loss": 0.9065, "step": 2225 }, { "epoch": 0.2052819743974167, "eval_GEN Loss": 0.4771478474140167, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.4128265082836151, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 1.0010817050933838, "eval_runtime": 56.9999, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 2225 }, { "epoch": 0.2053742359589436, "grad_norm": 2.849917161964412, "learning_rate": 1.1581260792367714e-06, "loss": 0.9079, "step": 2226 }, { "epoch": 0.20546649752047053, "grad_norm": 4.075805587999574, "learning_rate": 1.1580278599747807e-06, "loss": 0.9575, "step": 2227 }, { "epoch": 0.20555875908199747, "grad_norm": 1.5820298116715013, "learning_rate": 1.1579295924089665e-06, "loss": 0.5648, "step": 2228 }, { "epoch": 0.2056510206435244, "grad_norm": 1.8614520135578403, "learning_rate": 1.1578312765482335e-06, "loss": 0.874, "step": 2229 }, { "epoch": 0.2057432822050513, "grad_norm": 1.973629767428031, "learning_rate": 1.1577329124014918e-06, "loss": 0.8192, "step": 2230 }, { "epoch": 0.2057432822050513, "eval_GEN Loss": 0.4752151370048523, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.40567606687545776, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9876201748847961, "eval_runtime": 57.1134, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 2230 }, { "epoch": 0.20583554376657826, "grad_norm": 1.959528236745921, "learning_rate": 1.157634499977655e-06, "loss": 0.7145, "step": 2231 }, { "epoch": 0.20592780532810517, "grad_norm": 3.7674519565202194, "learning_rate": 1.1575360392856414e-06, "loss": 0.6961, "step": 2232 }, { "epoch": 0.20602006688963212, "grad_norm": 2.9903737460475868, "learning_rate": 1.1574375303343738e-06, "loss": 1.0235, "step": 2233 }, { "epoch": 0.20611232845115904, "grad_norm": 2.062107256056617, "learning_rate": 1.157338973132779e-06, "loss": 0.8793, "step": 2234 }, { "epoch": 0.20620459001268596, "grad_norm": 1.5714567565958513, "learning_rate": 1.1572403676897886e-06, "loss": 0.6572, "step": 2235 }, { "epoch": 0.20620459001268596, "eval_GEN Loss": 0.47319895029067993, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.41750359535217285, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9718149304389954, "eval_runtime": 56.9057, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2235 }, { "epoch": 0.2062968515742129, "grad_norm": 2.102201250010656, "learning_rate": 1.1571417140143384e-06, "loss": 0.8417, "step": 2236 }, { "epoch": 0.20638911313573982, "grad_norm": 1.4546035367495007, "learning_rate": 1.1570430121153683e-06, "loss": 0.6773, "step": 2237 }, { "epoch": 0.20648137469726674, "grad_norm": 2.257513931694606, "learning_rate": 1.1569442620018232e-06, "loss": 0.8263, "step": 2238 }, { "epoch": 0.20657363625879369, "grad_norm": 1.5450495346865374, "learning_rate": 1.1568454636826515e-06, "loss": 0.6472, "step": 2239 }, { "epoch": 0.2066658978203206, "grad_norm": 2.2640080839540087, "learning_rate": 1.1567466171668067e-06, "loss": 0.8704, "step": 2240 }, { "epoch": 0.2066658978203206, "eval_GEN Loss": 0.47217726707458496, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4422333836555481, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9549278616905212, "eval_runtime": 56.8929, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2240 }, { "epoch": 0.20675815938184755, "grad_norm": 1.9422457799858017, "learning_rate": 1.156647722463247e-06, "loss": 0.6511, "step": 2241 }, { "epoch": 0.20685042094337447, "grad_norm": 1.882138731890447, "learning_rate": 1.1565487795809334e-06, "loss": 0.7802, "step": 2242 }, { "epoch": 0.2069426825049014, "grad_norm": 2.08874878682335, "learning_rate": 1.1564497885288328e-06, "loss": 0.7902, "step": 2243 }, { "epoch": 0.20703494406642833, "grad_norm": 1.557435516696818, "learning_rate": 1.156350749315916e-06, "loss": 0.7547, "step": 2244 }, { "epoch": 0.20712720562795525, "grad_norm": 1.3826535986615829, "learning_rate": 1.1562516619511576e-06, "loss": 0.7163, "step": 2245 }, { "epoch": 0.20712720562795525, "eval_GEN Loss": 0.47124239802360535, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4405944049358368, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9440504908561707, "eval_runtime": 57.0393, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 2245 }, { "epoch": 0.20721946718948217, "grad_norm": 2.6485078662914034, "learning_rate": 1.1561525264435378e-06, "loss": 0.7523, "step": 2246 }, { "epoch": 0.20731172875100912, "grad_norm": 2.150377140764201, "learning_rate": 1.1560533428020398e-06, "loss": 0.9366, "step": 2247 }, { "epoch": 0.20740399031253604, "grad_norm": 1.5380322833366769, "learning_rate": 1.155954111035652e-06, "loss": 0.6323, "step": 2248 }, { "epoch": 0.20749625187406298, "grad_norm": 2.707062319921174, "learning_rate": 1.1558548311533671e-06, "loss": 1.0883, "step": 2249 }, { "epoch": 0.2075885134355899, "grad_norm": 1.7728842055382055, "learning_rate": 1.1557555031641815e-06, "loss": 0.8393, "step": 2250 }, { "epoch": 0.2075885134355899, "eval_GEN Loss": 0.46939241886138916, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4045702815055847, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9229567050933838, "eval_runtime": 56.2359, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 2250 }, { "epoch": 0.20768077499711682, "grad_norm": 1.9400906411710708, "learning_rate": 1.1556561270770971e-06, "loss": 0.8392, "step": 2251 }, { "epoch": 0.20777303655864376, "grad_norm": 1.713949094373851, "learning_rate": 1.155556702901119e-06, "loss": 0.6385, "step": 2252 }, { "epoch": 0.20786529812017068, "grad_norm": 1.4296639261220656, "learning_rate": 1.1554572306452575e-06, "loss": 0.5572, "step": 2253 }, { "epoch": 0.2079575596816976, "grad_norm": 2.0860711101621385, "learning_rate": 1.1553577103185268e-06, "loss": 0.6838, "step": 2254 }, { "epoch": 0.20804982124322455, "grad_norm": 1.2807061636561392, "learning_rate": 1.1552581419299455e-06, "loss": 0.7326, "step": 2255 }, { "epoch": 0.20804982124322455, "eval_GEN Loss": 0.46940556168556213, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.37396758794784546, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9145432710647583, "eval_runtime": 56.0935, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 2255 }, { "epoch": 0.20814208280475147, "grad_norm": 1.6619205021563814, "learning_rate": 1.1551585254885366e-06, "loss": 0.6068, "step": 2256 }, { "epoch": 0.2082343443662784, "grad_norm": 1.758571705646242, "learning_rate": 1.155058861003328e-06, "loss": 0.7124, "step": 2257 }, { "epoch": 0.20832660592780533, "grad_norm": 2.3864128225982273, "learning_rate": 1.1549591484833509e-06, "loss": 0.7266, "step": 2258 }, { "epoch": 0.20841886748933225, "grad_norm": 2.0267324513331517, "learning_rate": 1.1548593879376417e-06, "loss": 0.6844, "step": 2259 }, { "epoch": 0.2085111290508592, "grad_norm": 1.520344931273364, "learning_rate": 1.1547595793752404e-06, "loss": 0.6734, "step": 2260 }, { "epoch": 0.2085111290508592, "eval_GEN Loss": 0.4700671434402466, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3706658184528351, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9083533883094788, "eval_runtime": 56.1305, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 2260 }, { "epoch": 0.2086033906123861, "grad_norm": 1.5288111304880814, "learning_rate": 1.1546597228051924e-06, "loss": 0.5556, "step": 2261 }, { "epoch": 0.20869565217391303, "grad_norm": 1.6684899236360808, "learning_rate": 1.1545598182365467e-06, "loss": 0.6458, "step": 2262 }, { "epoch": 0.20878791373543998, "grad_norm": 1.6059246926166975, "learning_rate": 1.1544598656783566e-06, "loss": 0.7448, "step": 2263 }, { "epoch": 0.2088801752969669, "grad_norm": 1.6885814137936577, "learning_rate": 1.1543598651396803e-06, "loss": 0.6189, "step": 2264 }, { "epoch": 0.20897243685849384, "grad_norm": 2.0709593140019833, "learning_rate": 1.1542598166295795e-06, "loss": 0.8351, "step": 2265 }, { "epoch": 0.20897243685849384, "eval_GEN Loss": 0.47002270817756653, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3875349462032318, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9081730842590332, "eval_runtime": 56.9324, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2265 }, { "epoch": 0.20906469842002076, "grad_norm": 1.4131631275588865, "learning_rate": 1.1541597201571213e-06, "loss": 0.6641, "step": 2266 }, { "epoch": 0.20915695998154768, "grad_norm": 1.802653364706875, "learning_rate": 1.1540595757313762e-06, "loss": 0.6437, "step": 2267 }, { "epoch": 0.20924922154307463, "grad_norm": 1.5221604622967477, "learning_rate": 1.1539593833614197e-06, "loss": 0.5606, "step": 2268 }, { "epoch": 0.20934148310460154, "grad_norm": 2.8260828422142095, "learning_rate": 1.153859143056331e-06, "loss": 0.6902, "step": 2269 }, { "epoch": 0.20943374466612846, "grad_norm": 2.305636405276973, "learning_rate": 1.1537588548251949e-06, "loss": 0.6833, "step": 2270 }, { "epoch": 0.20943374466612846, "eval_GEN Loss": 0.46963343024253845, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.40641361474990845, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.918749988079071, "eval_runtime": 56.8849, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2270 }, { "epoch": 0.2095260062276554, "grad_norm": 3.34761906162355, "learning_rate": 1.1536585186770986e-06, "loss": 0.8558, "step": 2271 }, { "epoch": 0.20961826778918233, "grad_norm": 1.6061109119553205, "learning_rate": 1.1535581346211352e-06, "loss": 0.9361, "step": 2272 }, { "epoch": 0.20971052935070927, "grad_norm": 2.5392476724228845, "learning_rate": 1.153457702666402e-06, "loss": 0.9529, "step": 2273 }, { "epoch": 0.2098027909122362, "grad_norm": 1.9642139317507186, "learning_rate": 1.1533572228219998e-06, "loss": 0.6781, "step": 2274 }, { "epoch": 0.2098950524737631, "grad_norm": 2.1817493632736245, "learning_rate": 1.1532566950970344e-06, "loss": 0.7433, "step": 2275 }, { "epoch": 0.2098950524737631, "eval_GEN Loss": 0.4717455208301544, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.40705302357673645, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9230769276618958, "eval_runtime": 55.9526, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2275 }, { "epoch": 0.20998731403529006, "grad_norm": 2.07245401836506, "learning_rate": 1.1531561195006157e-06, "loss": 0.8597, "step": 2276 }, { "epoch": 0.21007957559681698, "grad_norm": 1.8762935610064746, "learning_rate": 1.1530554960418586e-06, "loss": 0.7134, "step": 2277 }, { "epoch": 0.2101718371583439, "grad_norm": 2.0624062792250513, "learning_rate": 1.1529548247298807e-06, "loss": 0.7134, "step": 2278 }, { "epoch": 0.21026409871987084, "grad_norm": 1.5135048395455495, "learning_rate": 1.152854105573806e-06, "loss": 0.5582, "step": 2279 }, { "epoch": 0.21035636028139776, "grad_norm": 1.8250532253357739, "learning_rate": 1.1527533385827611e-06, "loss": 0.6407, "step": 2280 }, { "epoch": 0.21035636028139776, "eval_GEN Loss": 0.4707697927951813, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3882807195186615, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9154447317123413, "eval_runtime": 56.2476, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 2280 }, { "epoch": 0.2104486218429247, "grad_norm": 2.1871585738069617, "learning_rate": 1.1526525237658781e-06, "loss": 0.7079, "step": 2281 }, { "epoch": 0.21054088340445162, "grad_norm": 4.136395112624742, "learning_rate": 1.1525516611322929e-06, "loss": 1.043, "step": 2282 }, { "epoch": 0.21063314496597854, "grad_norm": 1.7781751336623937, "learning_rate": 1.1524507506911457e-06, "loss": 0.9093, "step": 2283 }, { "epoch": 0.2107254065275055, "grad_norm": 1.468557325789731, "learning_rate": 1.1523497924515812e-06, "loss": 0.6357, "step": 2284 }, { "epoch": 0.2108176680890324, "grad_norm": 4.01144786534884, "learning_rate": 1.1522487864227485e-06, "loss": 1.1312, "step": 2285 }, { "epoch": 0.2108176680890324, "eval_GEN Loss": 0.47120070457458496, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3929106593132019, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9097355604171753, "eval_runtime": 55.9853, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2285 }, { "epoch": 0.21090992965055932, "grad_norm": 3.2513916000655785, "learning_rate": 1.152147732613801e-06, "loss": 0.6032, "step": 2286 }, { "epoch": 0.21100219121208627, "grad_norm": 1.460368053452147, "learning_rate": 1.1520466310338961e-06, "loss": 0.7242, "step": 2287 }, { "epoch": 0.2110944527736132, "grad_norm": 2.680184935014927, "learning_rate": 1.151945481692196e-06, "loss": 0.9445, "step": 2288 }, { "epoch": 0.21118671433514014, "grad_norm": 1.9445908018721438, "learning_rate": 1.1518442845978668e-06, "loss": 0.8572, "step": 2289 }, { "epoch": 0.21127897589666705, "grad_norm": 2.2245065211449035, "learning_rate": 1.1517430397600794e-06, "loss": 0.8897, "step": 2290 }, { "epoch": 0.21127897589666705, "eval_GEN Loss": 0.4726479649543762, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.42766568064689636, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9161959290504456, "eval_runtime": 56.8666, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2290 }, { "epoch": 0.21137123745819397, "grad_norm": 1.89519577801565, "learning_rate": 1.1516417471880083e-06, "loss": 0.7204, "step": 2291 }, { "epoch": 0.21146349901972092, "grad_norm": 2.519218451131417, "learning_rate": 1.1515404068908336e-06, "loss": 0.8184, "step": 2292 }, { "epoch": 0.21155576058124784, "grad_norm": 2.7804067284655263, "learning_rate": 1.151439018877738e-06, "loss": 0.9123, "step": 2293 }, { "epoch": 0.21164802214277476, "grad_norm": 1.5898426208901604, "learning_rate": 1.1513375831579102e-06, "loss": 0.7653, "step": 2294 }, { "epoch": 0.2117402837043017, "grad_norm": 1.475260349760314, "learning_rate": 1.1512360997405423e-06, "loss": 0.646, "step": 2295 }, { "epoch": 0.2117402837043017, "eval_GEN Loss": 0.47331321239471436, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8717948717948718, "eval_PRM F1 AUC": 0.8009429020429545, "eval_PRM F1 Neg": 0.6428571428571429, "eval_PRM Loss": 0.45182713866233826, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.9315068493150684, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9334735870361328, "eval_runtime": 56.8636, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2295 }, { "epoch": 0.21183254526582862, "grad_norm": 2.1198426529587864, "learning_rate": 1.1511345686348303e-06, "loss": 0.7455, "step": 2296 }, { "epoch": 0.21192480682735557, "grad_norm": 1.9830299211465507, "learning_rate": 1.1510329898499757e-06, "loss": 0.9839, "step": 2297 }, { "epoch": 0.21201706838888248, "grad_norm": 1.9188414390512405, "learning_rate": 1.1509313633951835e-06, "loss": 0.8163, "step": 2298 }, { "epoch": 0.2121093299504094, "grad_norm": 2.4727749001007933, "learning_rate": 1.1508296892796637e-06, "loss": 0.8645, "step": 2299 }, { "epoch": 0.21220159151193635, "grad_norm": 1.5287857215679712, "learning_rate": 1.1507279675126292e-06, "loss": 0.7882, "step": 2300 }, { "epoch": 0.21220159151193635, "eval_GEN Loss": 0.473702609539032, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.864516129032258, "eval_PRM F1 AUC": 0.7949188056574124, "eval_PRM F1 Neg": 0.631578947368421, "eval_PRM Loss": 0.449951171875, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.9305555555555556, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9365684986114502, "eval_runtime": 56.9733, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 2300 }, { "epoch": 0.21229385307346327, "grad_norm": 2.0629844309652077, "learning_rate": 1.1506261981032993e-06, "loss": 0.7907, "step": 2301 }, { "epoch": 0.2123861146349902, "grad_norm": 1.9978895455166346, "learning_rate": 1.1505243810608956e-06, "loss": 0.7675, "step": 2302 }, { "epoch": 0.21247837619651713, "grad_norm": 2.0449103375414825, "learning_rate": 1.1504225163946455e-06, "loss": 0.947, "step": 2303 }, { "epoch": 0.21257063775804405, "grad_norm": 1.7881179619619427, "learning_rate": 1.1503206041137798e-06, "loss": 0.7616, "step": 2304 }, { "epoch": 0.212662899319571, "grad_norm": 1.4617832613411683, "learning_rate": 1.1502186442275343e-06, "loss": 0.7394, "step": 2305 }, { "epoch": 0.212662899319571, "eval_GEN Loss": 0.4710967242717743, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4045696556568146, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9139423370361328, "eval_runtime": 56.7701, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2305 }, { "epoch": 0.21275516088109792, "grad_norm": 1.7463932326806049, "learning_rate": 1.1501166367451487e-06, "loss": 0.6597, "step": 2306 }, { "epoch": 0.21284742244262483, "grad_norm": 1.8822327415848314, "learning_rate": 1.1500145816758665e-06, "loss": 0.8181, "step": 2307 }, { "epoch": 0.21293968400415178, "grad_norm": 2.800533451323056, "learning_rate": 1.1499124790289366e-06, "loss": 0.6983, "step": 2308 }, { "epoch": 0.2130319455656787, "grad_norm": 2.5893522569938074, "learning_rate": 1.1498103288136117e-06, "loss": 0.8804, "step": 2309 }, { "epoch": 0.21312420712720562, "grad_norm": 2.004701548344563, "learning_rate": 1.1497081310391487e-06, "loss": 0.7371, "step": 2310 }, { "epoch": 0.21312420712720562, "eval_GEN Loss": 0.4717312753200531, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.38857412338256836, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9256009459495544, "eval_runtime": 56.7822, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2310 }, { "epoch": 0.21321646868873256, "grad_norm": 1.915192617305031, "learning_rate": 1.1496058857148092e-06, "loss": 0.6161, "step": 2311 }, { "epoch": 0.21330873025025948, "grad_norm": 2.398367890800583, "learning_rate": 1.1495035928498583e-06, "loss": 0.6897, "step": 2312 }, { "epoch": 0.21340099181178643, "grad_norm": 2.056290982286057, "learning_rate": 1.1494012524535663e-06, "loss": 0.9089, "step": 2313 }, { "epoch": 0.21349325337331335, "grad_norm": 1.5304632400591565, "learning_rate": 1.1492988645352076e-06, "loss": 0.6597, "step": 2314 }, { "epoch": 0.21358551493484026, "grad_norm": 1.6754110826954896, "learning_rate": 1.1491964291040603e-06, "loss": 0.6768, "step": 2315 }, { "epoch": 0.21358551493484026, "eval_GEN Loss": 0.4733254611492157, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4184282124042511, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9504807591438293, "eval_runtime": 57.0241, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 2315 }, { "epoch": 0.2136777764963672, "grad_norm": 1.7498588420362595, "learning_rate": 1.1490939461694076e-06, "loss": 0.6434, "step": 2316 }, { "epoch": 0.21377003805789413, "grad_norm": 1.828200640622191, "learning_rate": 1.1489914157405366e-06, "loss": 0.8032, "step": 2317 }, { "epoch": 0.21386229961942105, "grad_norm": 1.83234122485386, "learning_rate": 1.1488888378267386e-06, "loss": 0.7374, "step": 2318 }, { "epoch": 0.213954561180948, "grad_norm": 1.7295731226131061, "learning_rate": 1.1487862124373094e-06, "loss": 0.7779, "step": 2319 }, { "epoch": 0.2140468227424749, "grad_norm": 1.5441769824026699, "learning_rate": 1.1486835395815495e-06, "loss": 0.6952, "step": 2320 }, { "epoch": 0.2140468227424749, "eval_GEN Loss": 0.4737255573272705, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.4278686046600342, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9647836685180664, "eval_runtime": 55.8031, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2320 }, { "epoch": 0.21413908430400186, "grad_norm": 1.511777944246195, "learning_rate": 1.1485808192687628e-06, "loss": 0.5728, "step": 2321 }, { "epoch": 0.21423134586552878, "grad_norm": 2.1065699580074853, "learning_rate": 1.148478051508258e-06, "loss": 0.9463, "step": 2322 }, { "epoch": 0.2143236074270557, "grad_norm": 3.2278463260050407, "learning_rate": 1.1483752363093483e-06, "loss": 0.7803, "step": 2323 }, { "epoch": 0.21441586898858264, "grad_norm": 1.5233719435589255, "learning_rate": 1.1482723736813511e-06, "loss": 0.7441, "step": 2324 }, { "epoch": 0.21450813055010956, "grad_norm": 1.5885137468512758, "learning_rate": 1.1481694636335874e-06, "loss": 0.6965, "step": 2325 }, { "epoch": 0.21450813055010956, "eval_GEN Loss": 0.4758618175983429, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.4119797348976135, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9652644395828247, "eval_runtime": 55.8377, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2325 }, { "epoch": 0.21460039211163648, "grad_norm": 1.5039896057405835, "learning_rate": 1.1480665061753838e-06, "loss": 0.7052, "step": 2326 }, { "epoch": 0.21469265367316342, "grad_norm": 1.7498110914358747, "learning_rate": 1.1479635013160698e-06, "loss": 0.7319, "step": 2327 }, { "epoch": 0.21478491523469034, "grad_norm": 2.132755590620228, "learning_rate": 1.1478604490649802e-06, "loss": 0.7302, "step": 2328 }, { "epoch": 0.2148771767962173, "grad_norm": 2.5800827059678726, "learning_rate": 1.1477573494314536e-06, "loss": 0.9263, "step": 2329 }, { "epoch": 0.2149694383577442, "grad_norm": 1.5882991923459204, "learning_rate": 1.1476542024248335e-06, "loss": 0.7195, "step": 2330 }, { "epoch": 0.2149694383577442, "eval_GEN Loss": 0.4753049910068512, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.40260228514671326, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.960156261920929, "eval_runtime": 55.9356, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2330 }, { "epoch": 0.21506169991927113, "grad_norm": 1.7885748342602523, "learning_rate": 1.1475510080544665e-06, "loss": 0.7798, "step": 2331 }, { "epoch": 0.21515396148079807, "grad_norm": 1.480208733609352, "learning_rate": 1.147447766329705e-06, "loss": 0.6837, "step": 2332 }, { "epoch": 0.215246223042325, "grad_norm": 1.895530242420699, "learning_rate": 1.1473444772599045e-06, "loss": 0.783, "step": 2333 }, { "epoch": 0.2153384846038519, "grad_norm": 2.431044283870173, "learning_rate": 1.1472411408544252e-06, "loss": 0.6952, "step": 2334 }, { "epoch": 0.21543074616537886, "grad_norm": 1.7642384605238612, "learning_rate": 1.1471377571226316e-06, "loss": 0.6747, "step": 2335 }, { "epoch": 0.21543074616537886, "eval_GEN Loss": 0.47444283962249756, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4047582149505615, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9581730961799622, "eval_runtime": 55.8988, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2335 }, { "epoch": 0.21552300772690577, "grad_norm": 1.868259521679867, "learning_rate": 1.1470343260738928e-06, "loss": 0.7325, "step": 2336 }, { "epoch": 0.21561526928843272, "grad_norm": 2.4300969412096998, "learning_rate": 1.1469308477175817e-06, "loss": 0.825, "step": 2337 }, { "epoch": 0.21570753084995964, "grad_norm": 1.993711784578015, "learning_rate": 1.1468273220630756e-06, "loss": 0.7888, "step": 2338 }, { "epoch": 0.21579979241148656, "grad_norm": 1.6353502032591918, "learning_rate": 1.1467237491197559e-06, "loss": 0.7462, "step": 2339 }, { "epoch": 0.2158920539730135, "grad_norm": 3.1713808076121976, "learning_rate": 1.146620128897009e-06, "loss": 0.9708, "step": 2340 }, { "epoch": 0.2158920539730135, "eval_GEN Loss": 0.47516658902168274, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM Loss": 0.42991694808006287, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9573917984962463, "eval_runtime": 55.8666, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2340 }, { "epoch": 0.21598431553454042, "grad_norm": 1.9589790408647827, "learning_rate": 1.1465164614042251e-06, "loss": 0.7606, "step": 2341 }, { "epoch": 0.21607657709606734, "grad_norm": 2.0162196837094744, "learning_rate": 1.1464127466507987e-06, "loss": 0.6981, "step": 2342 }, { "epoch": 0.2161688386575943, "grad_norm": 2.2410233024067265, "learning_rate": 1.1463089846461283e-06, "loss": 0.8722, "step": 2343 }, { "epoch": 0.2162611002191212, "grad_norm": 1.8122832657732915, "learning_rate": 1.1462051753996172e-06, "loss": 0.8332, "step": 2344 }, { "epoch": 0.21635336178064815, "grad_norm": 1.8244146059988295, "learning_rate": 1.1461013189206728e-06, "loss": 0.8179, "step": 2345 }, { "epoch": 0.21635336178064815, "eval_GEN Loss": 0.4750309884548187, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8535031847133758, "eval_PRM F1 AUC": 0.751440544787847, "eval_PRM F1 Neg": 0.5818181818181818, "eval_PRM Loss": 0.4460814893245697, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9054054054054054, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9593148827552795, "eval_runtime": 55.9823, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2345 }, { "epoch": 0.21644562334217507, "grad_norm": 1.4819709836535895, "learning_rate": 1.1459974152187064e-06, "loss": 0.6879, "step": 2346 }, { "epoch": 0.216537884903702, "grad_norm": 2.5475880117354106, "learning_rate": 1.1458934643031344e-06, "loss": 0.6995, "step": 2347 }, { "epoch": 0.21663014646522893, "grad_norm": 1.7298597891054333, "learning_rate": 1.1457894661833767e-06, "loss": 0.6828, "step": 2348 }, { "epoch": 0.21672240802675585, "grad_norm": 1.5181012040835442, "learning_rate": 1.1456854208688578e-06, "loss": 0.7195, "step": 2349 }, { "epoch": 0.21681466958828277, "grad_norm": 1.906492177727322, "learning_rate": 1.1455813283690064e-06, "loss": 0.7811, "step": 2350 }, { "epoch": 0.21681466958828277, "eval_GEN Loss": 0.47427472472190857, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8535031847133758, "eval_PRM F1 AUC": 0.751440544787847, "eval_PRM F1 Neg": 0.5818181818181818, "eval_PRM Loss": 0.4521903991699219, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9054054054054054, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9660456776618958, "eval_runtime": 56.8725, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2350 }, { "epoch": 0.21690693114980972, "grad_norm": 2.0952804451135987, "learning_rate": 1.145477188693256e-06, "loss": 0.684, "step": 2351 }, { "epoch": 0.21699919271133664, "grad_norm": 2.386165354308659, "learning_rate": 1.145373001851043e-06, "loss": 0.8854, "step": 2352 }, { "epoch": 0.21709145427286355, "grad_norm": 1.8874466244002326, "learning_rate": 1.1452687678518097e-06, "loss": 0.6785, "step": 2353 }, { "epoch": 0.2171837158343905, "grad_norm": 2.0608842425595477, "learning_rate": 1.1451644867050022e-06, "loss": 0.804, "step": 2354 }, { "epoch": 0.21727597739591742, "grad_norm": 2.022665852118557, "learning_rate": 1.1450601584200696e-06, "loss": 0.7699, "step": 2355 }, { "epoch": 0.21727597739591742, "eval_GEN Loss": 0.47283825278282166, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.43678930401802063, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9777644276618958, "eval_runtime": 56.002, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2355 }, { "epoch": 0.21736823895744437, "grad_norm": 2.0400495938169145, "learning_rate": 1.144955783006467e-06, "loss": 0.9566, "step": 2356 }, { "epoch": 0.21746050051897128, "grad_norm": 2.1740673572995015, "learning_rate": 1.144851360473653e-06, "loss": 0.8656, "step": 2357 }, { "epoch": 0.2175527620804982, "grad_norm": 2.42001296340199, "learning_rate": 1.1447468908310904e-06, "loss": 0.7008, "step": 2358 }, { "epoch": 0.21764502364202515, "grad_norm": 1.9788688615523606, "learning_rate": 1.1446423740882464e-06, "loss": 0.8722, "step": 2359 }, { "epoch": 0.21773728520355207, "grad_norm": 2.5999805764933424, "learning_rate": 1.1445378102545926e-06, "loss": 0.7861, "step": 2360 }, { "epoch": 0.21773728520355207, "eval_GEN Loss": 0.4706652760505676, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.42590969800949097, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9721153974533081, "eval_runtime": 56.1296, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 2360 }, { "epoch": 0.21782954676507899, "grad_norm": 1.559569118407366, "learning_rate": 1.1444331993396046e-06, "loss": 0.7351, "step": 2361 }, { "epoch": 0.21792180832660593, "grad_norm": 2.1665835047710367, "learning_rate": 1.1443285413527626e-06, "loss": 0.8115, "step": 2362 }, { "epoch": 0.21801406988813285, "grad_norm": 1.5822610252059668, "learning_rate": 1.1442238363035506e-06, "loss": 0.7499, "step": 2363 }, { "epoch": 0.2181063314496598, "grad_norm": 1.5238898164541468, "learning_rate": 1.1441190842014574e-06, "loss": 0.7761, "step": 2364 }, { "epoch": 0.21819859301118671, "grad_norm": 1.985694895982136, "learning_rate": 1.1440142850559758e-06, "loss": 0.7319, "step": 2365 }, { "epoch": 0.21819859301118671, "eval_GEN Loss": 0.468374639749527, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.4251801371574402, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9659855961799622, "eval_runtime": 55.9352, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2365 }, { "epoch": 0.21829085457271363, "grad_norm": 1.808616661632616, "learning_rate": 1.1439094388766026e-06, "loss": 0.6165, "step": 2366 }, { "epoch": 0.21838311613424058, "grad_norm": 1.8714653109491266, "learning_rate": 1.1438045456728392e-06, "loss": 0.682, "step": 2367 }, { "epoch": 0.2184753776957675, "grad_norm": 2.3334762045797404, "learning_rate": 1.1436996054541912e-06, "loss": 1.0488, "step": 2368 }, { "epoch": 0.21856763925729442, "grad_norm": 1.553192305658262, "learning_rate": 1.1435946182301686e-06, "loss": 0.8035, "step": 2369 }, { "epoch": 0.21865990081882136, "grad_norm": 1.6675862371845878, "learning_rate": 1.1434895840102856e-06, "loss": 0.6578, "step": 2370 }, { "epoch": 0.21865990081882136, "eval_GEN Loss": 0.46896758675575256, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.42500072717666626, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9605769515037537, "eval_runtime": 55.8721, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2370 }, { "epoch": 0.21875216238034828, "grad_norm": 1.6936454210685636, "learning_rate": 1.1433845028040603e-06, "loss": 0.7876, "step": 2371 }, { "epoch": 0.21884442394187523, "grad_norm": 3.188558427741426, "learning_rate": 1.1432793746210152e-06, "loss": 0.9185, "step": 2372 }, { "epoch": 0.21893668550340215, "grad_norm": 2.0587332732713484, "learning_rate": 1.1431741994706776e-06, "loss": 0.8059, "step": 2373 }, { "epoch": 0.21902894706492906, "grad_norm": 2.838131575363757, "learning_rate": 1.1430689773625783e-06, "loss": 0.8441, "step": 2374 }, { "epoch": 0.219121208626456, "grad_norm": 2.296253791344834, "learning_rate": 1.1429637083062528e-06, "loss": 0.5491, "step": 2375 }, { "epoch": 0.219121208626456, "eval_GEN Loss": 0.4697877764701843, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.41090792417526245, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9453125, "eval_runtime": 55.8973, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2375 }, { "epoch": 0.21921347018798293, "grad_norm": 2.1846944804918462, "learning_rate": 1.142858392311241e-06, "loss": 0.6736, "step": 2376 }, { "epoch": 0.21930573174950985, "grad_norm": 1.9274668959793566, "learning_rate": 1.1427530293870865e-06, "loss": 0.793, "step": 2377 }, { "epoch": 0.2193979933110368, "grad_norm": 1.5422715509371179, "learning_rate": 1.1426476195433372e-06, "loss": 0.684, "step": 2378 }, { "epoch": 0.2194902548725637, "grad_norm": 1.502657644965345, "learning_rate": 1.142542162789546e-06, "loss": 0.6823, "step": 2379 }, { "epoch": 0.21958251643409066, "grad_norm": 1.7822182835928675, "learning_rate": 1.1424366591352694e-06, "loss": 0.7874, "step": 2380 }, { "epoch": 0.21958251643409066, "eval_GEN Loss": 0.46932539343833923, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.38606709241867065, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9384615421295166, "eval_runtime": 55.9097, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2380 }, { "epoch": 0.21967477799561758, "grad_norm": 1.7523445852540822, "learning_rate": 1.1423311085900684e-06, "loss": 0.7415, "step": 2381 }, { "epoch": 0.2197670395571445, "grad_norm": 1.7913442418646242, "learning_rate": 1.142225511163508e-06, "loss": 0.8646, "step": 2382 }, { "epoch": 0.21985930111867144, "grad_norm": 1.761396358655263, "learning_rate": 1.1421198668651579e-06, "loss": 0.884, "step": 2383 }, { "epoch": 0.21995156268019836, "grad_norm": 2.0539365928270605, "learning_rate": 1.1420141757045911e-06, "loss": 0.591, "step": 2384 }, { "epoch": 0.22004382424172528, "grad_norm": 2.3418539255499304, "learning_rate": 1.141908437691386e-06, "loss": 0.9255, "step": 2385 }, { "epoch": 0.22004382424172528, "eval_GEN Loss": 0.4676920473575592, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3769882023334503, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9442908763885498, "eval_runtime": 56.1242, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 2385 }, { "epoch": 0.22013608580325222, "grad_norm": 1.5027133667777839, "learning_rate": 1.1418026528351248e-06, "loss": 0.6969, "step": 2386 }, { "epoch": 0.22022834736477914, "grad_norm": 1.8817816249958745, "learning_rate": 1.1416968211453934e-06, "loss": 0.8139, "step": 2387 }, { "epoch": 0.2203206089263061, "grad_norm": 1.7124071370104497, "learning_rate": 1.1415909426317832e-06, "loss": 0.8992, "step": 2388 }, { "epoch": 0.220412870487833, "grad_norm": 1.978229345626964, "learning_rate": 1.1414850173038885e-06, "loss": 0.5924, "step": 2389 }, { "epoch": 0.22050513204935993, "grad_norm": 1.6016314739029147, "learning_rate": 1.1413790451713085e-06, "loss": 0.6232, "step": 2390 }, { "epoch": 0.22050513204935993, "eval_GEN Loss": 0.46786993741989136, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3706422448158264, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9359976053237915, "eval_runtime": 55.9104, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2390 }, { "epoch": 0.22059739361088687, "grad_norm": 2.2803210506354565, "learning_rate": 1.1412730262436467e-06, "loss": 0.8871, "step": 2391 }, { "epoch": 0.2206896551724138, "grad_norm": 1.7584831030043306, "learning_rate": 1.1411669605305107e-06, "loss": 0.6859, "step": 2392 }, { "epoch": 0.2207819167339407, "grad_norm": 2.260883576001255, "learning_rate": 1.141060848041512e-06, "loss": 0.7366, "step": 2393 }, { "epoch": 0.22087417829546765, "grad_norm": 1.6312673244843356, "learning_rate": 1.1409546887862671e-06, "loss": 0.5583, "step": 2394 }, { "epoch": 0.22096643985699457, "grad_norm": 1.6042762461377682, "learning_rate": 1.1408484827743963e-06, "loss": 0.7177, "step": 2395 }, { "epoch": 0.22096643985699457, "eval_GEN Loss": 0.4680069386959076, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.37928250432014465, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9259615540504456, "eval_runtime": 56.3175, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 2395 }, { "epoch": 0.22105870141852152, "grad_norm": 1.527794619670946, "learning_rate": 1.140742230015524e-06, "loss": 0.8465, "step": 2396 }, { "epoch": 0.22115096298004844, "grad_norm": 1.969434610489511, "learning_rate": 1.1406359305192789e-06, "loss": 0.6828, "step": 2397 }, { "epoch": 0.22124322454157536, "grad_norm": 1.5875569813257355, "learning_rate": 1.1405295842952944e-06, "loss": 0.7225, "step": 2398 }, { "epoch": 0.2213354861031023, "grad_norm": 2.4401147860126207, "learning_rate": 1.140423191353207e-06, "loss": 0.7447, "step": 2399 }, { "epoch": 0.22142774766462922, "grad_norm": 1.6427035393739329, "learning_rate": 1.1403167517026591e-06, "loss": 0.6974, "step": 2400 }, { "epoch": 0.22142774766462922, "eval_GEN Loss": 0.46850404143333435, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.38373351097106934, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9254807829856873, "eval_runtime": 55.9352, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2400 }, { "epoch": 0.22152000922615614, "grad_norm": 1.7451701920144373, "learning_rate": 1.1402102653532961e-06, "loss": 0.8668, "step": 2401 }, { "epoch": 0.22161227078768309, "grad_norm": 2.151270156869049, "learning_rate": 1.140103732314768e-06, "loss": 0.8334, "step": 2402 }, { "epoch": 0.22170453234921, "grad_norm": 1.6133499639668547, "learning_rate": 1.1399971525967285e-06, "loss": 0.5765, "step": 2403 }, { "epoch": 0.22179679391073695, "grad_norm": 1.2951764413763402, "learning_rate": 1.1398905262088366e-06, "loss": 0.5789, "step": 2404 }, { "epoch": 0.22188905547226387, "grad_norm": 1.9143571737959348, "learning_rate": 1.1397838531607548e-06, "loss": 0.8101, "step": 2405 }, { "epoch": 0.22188905547226387, "eval_GEN Loss": 0.46997690200805664, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3785282075405121, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9268629550933838, "eval_runtime": 55.9975, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2405 }, { "epoch": 0.2219813170337908, "grad_norm": 2.1369828854602892, "learning_rate": 1.1396771334621499e-06, "loss": 0.7544, "step": 2406 }, { "epoch": 0.22207357859531773, "grad_norm": 1.3784225486612767, "learning_rate": 1.1395703671226932e-06, "loss": 0.7144, "step": 2407 }, { "epoch": 0.22216584015684465, "grad_norm": 1.6688989208818583, "learning_rate": 1.1394635541520598e-06, "loss": 0.6259, "step": 2408 }, { "epoch": 0.22225810171837157, "grad_norm": 1.8506620044841888, "learning_rate": 1.1393566945599293e-06, "loss": 0.7966, "step": 2409 }, { "epoch": 0.22235036327989852, "grad_norm": 2.238252442399522, "learning_rate": 1.1392497883559853e-06, "loss": 0.8908, "step": 2410 }, { "epoch": 0.22235036327989852, "eval_GEN Loss": 0.4711766839027405, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.37810245156288147, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9131009578704834, "eval_runtime": 55.9686, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2410 }, { "epoch": 0.22244262484142543, "grad_norm": 1.6627933985265864, "learning_rate": 1.1391428355499163e-06, "loss": 0.7435, "step": 2411 }, { "epoch": 0.22253488640295238, "grad_norm": 1.6940717176891962, "learning_rate": 1.1390358361514143e-06, "loss": 0.8278, "step": 2412 }, { "epoch": 0.2226271479644793, "grad_norm": 2.7938614253432323, "learning_rate": 1.1389287901701757e-06, "loss": 0.7211, "step": 2413 }, { "epoch": 0.22271940952600622, "grad_norm": 1.690730641332566, "learning_rate": 1.1388216976159012e-06, "loss": 0.528, "step": 2414 }, { "epoch": 0.22281167108753316, "grad_norm": 2.131417765946894, "learning_rate": 1.1387145584982956e-06, "loss": 0.9121, "step": 2415 }, { "epoch": 0.22281167108753316, "eval_GEN Loss": 0.47082820534706116, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.38620659708976746, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.907932698726654, "eval_runtime": 56.9834, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 2415 }, { "epoch": 0.22290393264906008, "grad_norm": 1.665691644810356, "learning_rate": 1.1386073728270682e-06, "loss": 0.734, "step": 2416 }, { "epoch": 0.222996194210587, "grad_norm": 1.6187270870803299, "learning_rate": 1.1385001406119322e-06, "loss": 0.6109, "step": 2417 }, { "epoch": 0.22308845577211395, "grad_norm": 1.9602103537950144, "learning_rate": 1.1383928618626052e-06, "loss": 0.7229, "step": 2418 }, { "epoch": 0.22318071733364087, "grad_norm": 2.0472504753973286, "learning_rate": 1.138285536588809e-06, "loss": 0.7685, "step": 2419 }, { "epoch": 0.2232729788951678, "grad_norm": 2.481401439851354, "learning_rate": 1.1381781648002695e-06, "loss": 0.7794, "step": 2420 }, { "epoch": 0.2232729788951678, "eval_GEN Loss": 0.4718153476715088, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.39808425307273865, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9167668223381042, "eval_runtime": 56.8258, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2420 }, { "epoch": 0.22336524045669473, "grad_norm": 2.152102989463276, "learning_rate": 1.138070746506717e-06, "loss": 0.9804, "step": 2421 }, { "epoch": 0.22345750201822165, "grad_norm": 1.9955954711734134, "learning_rate": 1.1379632817178859e-06, "loss": 0.8168, "step": 2422 }, { "epoch": 0.2235497635797486, "grad_norm": 1.599732125977681, "learning_rate": 1.1378557704435147e-06, "loss": 0.5893, "step": 2423 }, { "epoch": 0.2236420251412755, "grad_norm": 2.055255500617136, "learning_rate": 1.1377482126933463e-06, "loss": 0.891, "step": 2424 }, { "epoch": 0.22373428670280243, "grad_norm": 2.0444524277785803, "learning_rate": 1.137640608477128e-06, "loss": 0.7909, "step": 2425 }, { "epoch": 0.22373428670280243, "eval_GEN Loss": 0.4728257954120636, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.4107135236263275, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9212139248847961, "eval_runtime": 56.9273, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2425 }, { "epoch": 0.22382654826432938, "grad_norm": 1.6192087375379063, "learning_rate": 1.1375329578046105e-06, "loss": 0.8534, "step": 2426 }, { "epoch": 0.2239188098258563, "grad_norm": 2.132404090605897, "learning_rate": 1.1374252606855498e-06, "loss": 0.7363, "step": 2427 }, { "epoch": 0.22401107138738324, "grad_norm": 2.1744719112179864, "learning_rate": 1.1373175171297055e-06, "loss": 0.8048, "step": 2428 }, { "epoch": 0.22410333294891016, "grad_norm": 1.6479747531841462, "learning_rate": 1.1372097271468413e-06, "loss": 0.9014, "step": 2429 }, { "epoch": 0.22419559451043708, "grad_norm": 1.7625154033683774, "learning_rate": 1.1371018907467256e-06, "loss": 0.855, "step": 2430 }, { "epoch": 0.22419559451043708, "eval_GEN Loss": 0.47299402952194214, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8589743589743589, "eval_PRM F1 AUC": 0.7731796752226295, "eval_PRM F1 Neg": 0.6071428571428571, "eval_PRM Loss": 0.43708139657974243, "eval_PRM NPV": 0.5151515151515151, "eval_PRM Precision": 0.9178082191780822, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9305288195610046, "eval_runtime": 56.8176, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2430 }, { "epoch": 0.22428785607196403, "grad_norm": 2.3010725350981294, "learning_rate": 1.1369940079391303e-06, "loss": 0.9764, "step": 2431 }, { "epoch": 0.22438011763349094, "grad_norm": 2.0818426827837357, "learning_rate": 1.136886078733832e-06, "loss": 0.719, "step": 2432 }, { "epoch": 0.22447237919501786, "grad_norm": 1.7541157290491092, "learning_rate": 1.1367781031406119e-06, "loss": 0.7939, "step": 2433 }, { "epoch": 0.2245646407565448, "grad_norm": 3.2390284510728558, "learning_rate": 1.1366700811692542e-06, "loss": 0.8502, "step": 2434 }, { "epoch": 0.22465690231807173, "grad_norm": 2.3228636799465607, "learning_rate": 1.1365620128295484e-06, "loss": 0.698, "step": 2435 }, { "epoch": 0.22465690231807173, "eval_GEN Loss": 0.47129055857658386, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8516129032258064, "eval_PRM F1 AUC": 0.7671555788370874, "eval_PRM F1 Neg": 0.5964912280701754, "eval_PRM Loss": 0.4372565746307373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9247596263885498, "eval_runtime": 56.8818, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2435 }, { "epoch": 0.22474916387959867, "grad_norm": 2.425877722634202, "learning_rate": 1.1364538981312879e-06, "loss": 0.6756, "step": 2436 }, { "epoch": 0.2248414254411256, "grad_norm": 2.361565498188788, "learning_rate": 1.13634573708427e-06, "loss": 0.656, "step": 2437 }, { "epoch": 0.2249336870026525, "grad_norm": 1.6936773950644115, "learning_rate": 1.1362375296982966e-06, "loss": 0.7373, "step": 2438 }, { "epoch": 0.22502594856417946, "grad_norm": 2.388291506864521, "learning_rate": 1.1361292759831738e-06, "loss": 0.7895, "step": 2439 }, { "epoch": 0.22511821012570638, "grad_norm": 2.4285604544608903, "learning_rate": 1.1360209759487112e-06, "loss": 0.8819, "step": 2440 }, { "epoch": 0.22511821012570638, "eval_GEN Loss": 0.4684344232082367, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.36903172731399536, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9042067527770996, "eval_runtime": 56.941, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2440 }, { "epoch": 0.2252104716872333, "grad_norm": 1.9214486009218754, "learning_rate": 1.1359126296047235e-06, "loss": 0.7505, "step": 2441 }, { "epoch": 0.22530273324876024, "grad_norm": 1.4059886334090042, "learning_rate": 1.1358042369610289e-06, "loss": 0.6201, "step": 2442 }, { "epoch": 0.22539499481028716, "grad_norm": 1.3026528887742264, "learning_rate": 1.1356957980274504e-06, "loss": 0.5657, "step": 2443 }, { "epoch": 0.2254872563718141, "grad_norm": 2.1622229210816104, "learning_rate": 1.135587312813815e-06, "loss": 0.6993, "step": 2444 }, { "epoch": 0.22557951793334102, "grad_norm": 1.5415557007956615, "learning_rate": 1.1354787813299536e-06, "loss": 0.6928, "step": 2445 }, { "epoch": 0.22557951793334102, "eval_GEN Loss": 0.469711035490036, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3571073114871979, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9175480604171753, "eval_runtime": 56.7865, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2445 }, { "epoch": 0.22567177949486794, "grad_norm": 1.3915882131267747, "learning_rate": 1.1353702035857017e-06, "loss": 0.7732, "step": 2446 }, { "epoch": 0.2257640410563949, "grad_norm": 2.878040973623829, "learning_rate": 1.1352615795908983e-06, "loss": 0.8507, "step": 2447 }, { "epoch": 0.2258563026179218, "grad_norm": 1.8932740611767567, "learning_rate": 1.1351529093553876e-06, "loss": 0.6389, "step": 2448 }, { "epoch": 0.22594856417944872, "grad_norm": 1.8058416639527972, "learning_rate": 1.1350441928890171e-06, "loss": 0.7784, "step": 2449 }, { "epoch": 0.22604082574097567, "grad_norm": 1.3383035069198335, "learning_rate": 1.134935430201639e-06, "loss": 0.6901, "step": 2450 }, { "epoch": 0.22604082574097567, "eval_GEN Loss": 0.4697313904762268, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3636733591556549, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9028846025466919, "eval_runtime": 56.8545, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2450 }, { "epoch": 0.2261330873025026, "grad_norm": 1.9378913317121984, "learning_rate": 1.1348266213031097e-06, "loss": 0.7741, "step": 2451 }, { "epoch": 0.22622534886402954, "grad_norm": 2.034692154429518, "learning_rate": 1.1347177662032894e-06, "loss": 0.8802, "step": 2452 }, { "epoch": 0.22631761042555645, "grad_norm": 1.5020953975044546, "learning_rate": 1.134608864912043e-06, "loss": 0.5675, "step": 2453 }, { "epoch": 0.22640987198708337, "grad_norm": 1.618387271348409, "learning_rate": 1.1344999174392388e-06, "loss": 0.7853, "step": 2454 }, { "epoch": 0.22650213354861032, "grad_norm": 1.4706788156565047, "learning_rate": 1.1343909237947504e-06, "loss": 0.634, "step": 2455 }, { "epoch": 0.22650213354861032, "eval_GEN Loss": 0.4696446359157562, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.36343905329704285, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8920673131942749, "eval_runtime": 56.955, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 2455 }, { "epoch": 0.22659439511013724, "grad_norm": 2.202525362172754, "learning_rate": 1.1342818839884548e-06, "loss": 0.6124, "step": 2456 }, { "epoch": 0.22668665667166416, "grad_norm": 2.554850650073834, "learning_rate": 1.134172798030233e-06, "loss": 0.9653, "step": 2457 }, { "epoch": 0.2267789182331911, "grad_norm": 1.410417704172557, "learning_rate": 1.1340636659299707e-06, "loss": 0.6578, "step": 2458 }, { "epoch": 0.22687117979471802, "grad_norm": 2.234493248027032, "learning_rate": 1.133954487697558e-06, "loss": 0.9514, "step": 2459 }, { "epoch": 0.22696344135624497, "grad_norm": 2.0401035606875633, "learning_rate": 1.1338452633428883e-06, "loss": 0.5441, "step": 2460 }, { "epoch": 0.22696344135624497, "eval_GEN Loss": 0.4691702723503113, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3740851879119873, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8882812261581421, "eval_runtime": 56.7323, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2460 }, { "epoch": 0.22705570291777188, "grad_norm": 1.7006937438662142, "learning_rate": 1.13373599287586e-06, "loss": 0.8534, "step": 2461 }, { "epoch": 0.2271479644792988, "grad_norm": 1.3400719713400748, "learning_rate": 1.1336266763063752e-06, "loss": 0.5771, "step": 2462 }, { "epoch": 0.22724022604082575, "grad_norm": 1.9203227243680183, "learning_rate": 1.1335173136443406e-06, "loss": 0.6458, "step": 2463 }, { "epoch": 0.22733248760235267, "grad_norm": 2.1478223804179666, "learning_rate": 1.1334079048996662e-06, "loss": 0.9295, "step": 2464 }, { "epoch": 0.22742474916387959, "grad_norm": 1.8610640901338107, "learning_rate": 1.1332984500822676e-06, "loss": 0.8251, "step": 2465 }, { "epoch": 0.22742474916387959, "eval_GEN Loss": 0.46802860498428345, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3707696497440338, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8885817527770996, "eval_runtime": 57.1267, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 2465 }, { "epoch": 0.22751701072540653, "grad_norm": 1.824966759349408, "learning_rate": 1.1331889492020634e-06, "loss": 0.8261, "step": 2466 }, { "epoch": 0.22760927228693345, "grad_norm": 1.4536672716986374, "learning_rate": 1.1330794022689764e-06, "loss": 0.6273, "step": 2467 }, { "epoch": 0.2277015338484604, "grad_norm": 2.0134294555857015, "learning_rate": 1.1329698092929345e-06, "loss": 0.8769, "step": 2468 }, { "epoch": 0.22779379540998732, "grad_norm": 1.9646142059554255, "learning_rate": 1.1328601702838688e-06, "loss": 0.7944, "step": 2469 }, { "epoch": 0.22788605697151423, "grad_norm": 1.5708958311354917, "learning_rate": 1.1327504852517152e-06, "loss": 0.6498, "step": 2470 }, { "epoch": 0.22788605697151423, "eval_GEN Loss": 0.4714735448360443, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.397542804479599, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9019230604171753, "eval_runtime": 56.9012, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2470 }, { "epoch": 0.22797831853304118, "grad_norm": 1.3681737730047887, "learning_rate": 1.1326407542064132e-06, "loss": 0.497, "step": 2471 }, { "epoch": 0.2280705800945681, "grad_norm": 1.97168956436627, "learning_rate": 1.1325309771579075e-06, "loss": 0.7414, "step": 2472 }, { "epoch": 0.22816284165609502, "grad_norm": 2.3031316138910194, "learning_rate": 1.1324211541161454e-06, "loss": 0.855, "step": 2473 }, { "epoch": 0.22825510321762196, "grad_norm": 2.1849471605093425, "learning_rate": 1.1323112850910794e-06, "loss": 0.7153, "step": 2474 }, { "epoch": 0.22834736477914888, "grad_norm": 2.230071753179375, "learning_rate": 1.1322013700926665e-06, "loss": 0.7911, "step": 2475 }, { "epoch": 0.22834736477914888, "eval_GEN Loss": 0.47294795513153076, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8589743589743589, "eval_PRM F1 AUC": 0.7731796752226295, "eval_PRM F1 Neg": 0.6071428571428571, "eval_PRM Loss": 0.4190768599510193, "eval_PRM NPV": 0.5151515151515151, "eval_PRM Precision": 0.9178082191780822, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9164663553237915, "eval_runtime": 56.9171, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2475 }, { "epoch": 0.22843962634067583, "grad_norm": 1.982015033997405, "learning_rate": 1.1320914091308672e-06, "loss": 0.816, "step": 2476 }, { "epoch": 0.22853188790220275, "grad_norm": 1.6435419692673323, "learning_rate": 1.1319814022156461e-06, "loss": 0.6268, "step": 2477 }, { "epoch": 0.22862414946372966, "grad_norm": 1.5840100620675945, "learning_rate": 1.1318713493569724e-06, "loss": 0.7047, "step": 2478 }, { "epoch": 0.2287164110252566, "grad_norm": 2.0689373763994925, "learning_rate": 1.131761250564819e-06, "loss": 0.6856, "step": 2479 }, { "epoch": 0.22880867258678353, "grad_norm": 2.643783420100991, "learning_rate": 1.1316511058491635e-06, "loss": 0.874, "step": 2480 }, { "epoch": 0.22880867258678353, "eval_GEN Loss": 0.47014084458351135, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8407643312101911, "eval_PRM F1 AUC": 0.7236773179675223, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM Loss": 0.419371634721756, "eval_PRM NPV": 0.46875, "eval_PRM Precision": 0.8918918918918919, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9097355604171753, "eval_runtime": 56.6946, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2480 }, { "epoch": 0.22890093414831045, "grad_norm": 1.4845504230546336, "learning_rate": 1.1315409152199875e-06, "loss": 0.6945, "step": 2481 }, { "epoch": 0.2289931957098374, "grad_norm": 1.3983407481004397, "learning_rate": 1.1314306786872764e-06, "loss": 0.6221, "step": 2482 }, { "epoch": 0.2290854572713643, "grad_norm": 1.5308073226456993, "learning_rate": 1.13132039626102e-06, "loss": 0.7287, "step": 2483 }, { "epoch": 0.22917771883289126, "grad_norm": 1.6513885081879696, "learning_rate": 1.1312100679512123e-06, "loss": 0.7563, "step": 2484 }, { "epoch": 0.22926998039441818, "grad_norm": 1.637595673797351, "learning_rate": 1.1310996937678514e-06, "loss": 0.6138, "step": 2485 }, { "epoch": 0.22926998039441818, "eval_GEN Loss": 0.46911635994911194, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3957677185535431, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9058894515037537, "eval_runtime": 56.8024, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2485 }, { "epoch": 0.2293622419559451, "grad_norm": 2.141175588712988, "learning_rate": 1.1309892737209398e-06, "loss": 0.6231, "step": 2486 }, { "epoch": 0.22945450351747204, "grad_norm": 3.5286845366659665, "learning_rate": 1.1308788078204837e-06, "loss": 0.7897, "step": 2487 }, { "epoch": 0.22954676507899896, "grad_norm": 2.3754392821441126, "learning_rate": 1.1307682960764937e-06, "loss": 0.9385, "step": 2488 }, { "epoch": 0.22963902664052588, "grad_norm": 2.075474213820218, "learning_rate": 1.1306577384989848e-06, "loss": 0.7251, "step": 2489 }, { "epoch": 0.22973128820205282, "grad_norm": 1.573113395506502, "learning_rate": 1.1305471350979755e-06, "loss": 0.6645, "step": 2490 }, { "epoch": 0.22973128820205282, "eval_GEN Loss": 0.4681898057460785, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.38737961649894714, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9082331657409668, "eval_runtime": 56.8407, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2490 }, { "epoch": 0.22982354976357974, "grad_norm": 1.7327869966982956, "learning_rate": 1.1304364858834894e-06, "loss": 0.5968, "step": 2491 }, { "epoch": 0.2299158113251067, "grad_norm": 1.546646575464143, "learning_rate": 1.1303257908655529e-06, "loss": 0.5915, "step": 2492 }, { "epoch": 0.2300080728866336, "grad_norm": 1.6666122378775579, "learning_rate": 1.130215050054198e-06, "loss": 0.793, "step": 2493 }, { "epoch": 0.23010033444816053, "grad_norm": 2.4377169421469485, "learning_rate": 1.1301042634594602e-06, "loss": 0.574, "step": 2494 }, { "epoch": 0.23019259600968747, "grad_norm": 1.894979391573054, "learning_rate": 1.129993431091379e-06, "loss": 0.6417, "step": 2495 }, { "epoch": 0.23019259600968747, "eval_GEN Loss": 0.4674574136734009, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.3983570337295532, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9028846025466919, "eval_runtime": 56.7877, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2495 }, { "epoch": 0.2302848575712144, "grad_norm": 2.3448281942223703, "learning_rate": 1.1298825529599983e-06, "loss": 0.8902, "step": 2496 }, { "epoch": 0.2303771191327413, "grad_norm": 1.7789743158712312, "learning_rate": 1.1297716290753657e-06, "loss": 0.6988, "step": 2497 }, { "epoch": 0.23046938069426826, "grad_norm": 1.518338773618905, "learning_rate": 1.1296606594475337e-06, "loss": 0.4898, "step": 2498 }, { "epoch": 0.23056164225579517, "grad_norm": 2.0993593440032865, "learning_rate": 1.1295496440865583e-06, "loss": 0.7423, "step": 2499 }, { "epoch": 0.23065390381732212, "grad_norm": 2.3951483049527615, "learning_rate": 1.1294385830025e-06, "loss": 0.7233, "step": 2500 }, { "epoch": 0.23065390381732212, "eval_GEN Loss": 0.468417227268219, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4037969708442688, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8917668461799622, "eval_runtime": 56.7159, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2500 }, { "epoch": 0.23074616537884904, "grad_norm": 2.212728059817675, "learning_rate": 1.1293274762054233e-06, "loss": 0.8199, "step": 2501 }, { "epoch": 0.23083842694037596, "grad_norm": 2.6001781670563138, "learning_rate": 1.129216323705397e-06, "loss": 1.0106, "step": 2502 }, { "epoch": 0.2309306885019029, "grad_norm": 1.6724983686291832, "learning_rate": 1.1291051255124937e-06, "loss": 0.7285, "step": 2503 }, { "epoch": 0.23102295006342982, "grad_norm": 2.6611634155114245, "learning_rate": 1.1289938816367903e-06, "loss": 0.6679, "step": 2504 }, { "epoch": 0.23111521162495674, "grad_norm": 2.067860591355526, "learning_rate": 1.1288825920883685e-06, "loss": 0.8011, "step": 2505 }, { "epoch": 0.23111521162495674, "eval_GEN Loss": 0.46988198161125183, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.38036635518074036, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8838942050933838, "eval_runtime": 56.0063, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2505 }, { "epoch": 0.2312074731864837, "grad_norm": 1.7813382417817287, "learning_rate": 1.1287712568773127e-06, "loss": 0.7122, "step": 2506 }, { "epoch": 0.2312997347480106, "grad_norm": 2.059914193923338, "learning_rate": 1.1286598760137126e-06, "loss": 0.796, "step": 2507 }, { "epoch": 0.23139199630953755, "grad_norm": 2.3880312965231476, "learning_rate": 1.128548449507662e-06, "loss": 0.831, "step": 2508 }, { "epoch": 0.23148425787106447, "grad_norm": 1.8289964252066055, "learning_rate": 1.1284369773692581e-06, "loss": 0.6621, "step": 2509 }, { "epoch": 0.2315765194325914, "grad_norm": 1.472177833646282, "learning_rate": 1.1283254596086031e-06, "loss": 0.655, "step": 2510 }, { "epoch": 0.2315765194325914, "eval_GEN Loss": 0.4698483645915985, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.362417072057724, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8776442408561707, "eval_runtime": 55.6801, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 2510 }, { "epoch": 0.23166878099411833, "grad_norm": 1.5573238422258162, "learning_rate": 1.1282138962358026e-06, "loss": 0.6579, "step": 2511 }, { "epoch": 0.23176104255564525, "grad_norm": 1.7342550230597888, "learning_rate": 1.1281022872609668e-06, "loss": 0.7244, "step": 2512 }, { "epoch": 0.23185330411717217, "grad_norm": 1.676035826200078, "learning_rate": 1.1279906326942097e-06, "loss": 0.4781, "step": 2513 }, { "epoch": 0.23194556567869912, "grad_norm": 1.630407863274102, "learning_rate": 1.12787893254565e-06, "loss": 0.6057, "step": 2514 }, { "epoch": 0.23203782724022604, "grad_norm": 2.1285004105290954, "learning_rate": 1.1277671868254097e-06, "loss": 0.6775, "step": 2515 }, { "epoch": 0.23203782724022604, "eval_GEN Loss": 0.4699053168296814, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.355672687292099, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8748798370361328, "eval_runtime": 55.7112, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 2515 }, { "epoch": 0.23213008880175298, "grad_norm": 1.9006796685899903, "learning_rate": 1.1276553955436155e-06, "loss": 0.7582, "step": 2516 }, { "epoch": 0.2322223503632799, "grad_norm": 1.582411726868668, "learning_rate": 1.1275435587103983e-06, "loss": 0.6562, "step": 2517 }, { "epoch": 0.23231461192480682, "grad_norm": 2.2044870251500774, "learning_rate": 1.1274316763358927e-06, "loss": 0.5809, "step": 2518 }, { "epoch": 0.23240687348633376, "grad_norm": 2.2165562061612465, "learning_rate": 1.1273197484302377e-06, "loss": 0.7458, "step": 2519 }, { "epoch": 0.23249913504786068, "grad_norm": 2.065663963935201, "learning_rate": 1.1272077750035767e-06, "loss": 0.723, "step": 2520 }, { "epoch": 0.23249913504786068, "eval_GEN Loss": 0.46835580468177795, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.354735404253006, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8722355961799622, "eval_runtime": 55.774, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2520 }, { "epoch": 0.2325913966093876, "grad_norm": 2.313014337748344, "learning_rate": 1.1270957560660563e-06, "loss": 0.8063, "step": 2521 }, { "epoch": 0.23268365817091455, "grad_norm": 3.635399712281739, "learning_rate": 1.1269836916278284e-06, "loss": 0.8438, "step": 2522 }, { "epoch": 0.23277591973244147, "grad_norm": 1.927833728108103, "learning_rate": 1.1268715816990483e-06, "loss": 0.7967, "step": 2523 }, { "epoch": 0.2328681812939684, "grad_norm": 1.9774224623083527, "learning_rate": 1.1267594262898754e-06, "loss": 0.7281, "step": 2524 }, { "epoch": 0.23296044285549533, "grad_norm": 1.4849486701625527, "learning_rate": 1.1266472254104735e-06, "loss": 0.7488, "step": 2525 }, { "epoch": 0.23296044285549533, "eval_GEN Loss": 0.46815571188926697, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.39794889092445374, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8714542984962463, "eval_runtime": 56.7078, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2525 }, { "epoch": 0.23305270441702225, "grad_norm": 2.052214522194372, "learning_rate": 1.1265349790710102e-06, "loss": 0.6389, "step": 2526 }, { "epoch": 0.2331449659785492, "grad_norm": 1.8405345488527973, "learning_rate": 1.126422687281658e-06, "loss": 0.7683, "step": 2527 }, { "epoch": 0.23323722754007611, "grad_norm": 1.7569126218126419, "learning_rate": 1.1263103500525927e-06, "loss": 0.6766, "step": 2528 }, { "epoch": 0.23332948910160303, "grad_norm": 2.2530742113486104, "learning_rate": 1.1261979673939942e-06, "loss": 0.9568, "step": 2529 }, { "epoch": 0.23342175066312998, "grad_norm": 2.326025848352322, "learning_rate": 1.1260855393160471e-06, "loss": 0.7399, "step": 2530 }, { "epoch": 0.23342175066312998, "eval_GEN Loss": 0.4674154818058014, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.41416069865226746, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8833533525466919, "eval_runtime": 56.7922, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2530 }, { "epoch": 0.2335140122246569, "grad_norm": 1.6557122109170073, "learning_rate": 1.1259730658289396e-06, "loss": 0.5562, "step": 2531 }, { "epoch": 0.23360627378618384, "grad_norm": 1.442127422746816, "learning_rate": 1.1258605469428643e-06, "loss": 0.718, "step": 2532 }, { "epoch": 0.23369853534771076, "grad_norm": 2.168232468969206, "learning_rate": 1.125747982668018e-06, "loss": 0.9217, "step": 2533 }, { "epoch": 0.23379079690923768, "grad_norm": 1.8672615603219742, "learning_rate": 1.1256353730146011e-06, "loss": 0.8414, "step": 2534 }, { "epoch": 0.23388305847076463, "grad_norm": 2.6723027112594555, "learning_rate": 1.125522717992819e-06, "loss": 0.9236, "step": 2535 }, { "epoch": 0.23388305847076463, "eval_GEN Loss": 0.4678378701210022, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4094238579273224, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8882211446762085, "eval_runtime": 57.3303, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 2535 }, { "epoch": 0.23397532003229154, "grad_norm": 2.5711676954810976, "learning_rate": 1.12541001761288e-06, "loss": 0.8562, "step": 2536 }, { "epoch": 0.23406758159381846, "grad_norm": 1.49570424655103, "learning_rate": 1.125297271884998e-06, "loss": 0.695, "step": 2537 }, { "epoch": 0.2341598431553454, "grad_norm": 3.4188011926568325, "learning_rate": 1.1251844808193895e-06, "loss": 0.8133, "step": 2538 }, { "epoch": 0.23425210471687233, "grad_norm": 2.772937083538868, "learning_rate": 1.125071644426276e-06, "loss": 0.8046, "step": 2539 }, { "epoch": 0.23434436627839927, "grad_norm": 1.4829643971961517, "learning_rate": 1.124958762715883e-06, "loss": 0.5224, "step": 2540 }, { "epoch": 0.23434436627839927, "eval_GEN Loss": 0.46604621410369873, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.39644289016723633, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8786057829856873, "eval_runtime": 56.8861, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2540 }, { "epoch": 0.2344366278399262, "grad_norm": 1.6763105657342332, "learning_rate": 1.1248458356984398e-06, "loss": 0.6448, "step": 2541 }, { "epoch": 0.2345288894014531, "grad_norm": 1.7961755994124575, "learning_rate": 1.1247328633841806e-06, "loss": 0.6953, "step": 2542 }, { "epoch": 0.23462115096298006, "grad_norm": 1.6026609778166998, "learning_rate": 1.1246198457833423e-06, "loss": 0.5873, "step": 2543 }, { "epoch": 0.23471341252450698, "grad_norm": 1.8692006613808, "learning_rate": 1.1245067829061675e-06, "loss": 0.9321, "step": 2544 }, { "epoch": 0.2348056740860339, "grad_norm": 1.6154700578899546, "learning_rate": 1.1243936747629017e-06, "loss": 0.6672, "step": 2545 }, { "epoch": 0.2348056740860339, "eval_GEN Loss": 0.4653279781341553, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.3707880973815918, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8753004670143127, "eval_runtime": 56.8048, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2545 }, { "epoch": 0.23489793564756084, "grad_norm": 1.9530299830184554, "learning_rate": 1.124280521363795e-06, "loss": 0.8186, "step": 2546 }, { "epoch": 0.23499019720908776, "grad_norm": 2.0571922856662845, "learning_rate": 1.1241673227191016e-06, "loss": 0.7337, "step": 2547 }, { "epoch": 0.2350824587706147, "grad_norm": 1.953611207398242, "learning_rate": 1.1240540788390798e-06, "loss": 0.7153, "step": 2548 }, { "epoch": 0.23517472033214162, "grad_norm": 1.9533462404809976, "learning_rate": 1.1239407897339915e-06, "loss": 0.5951, "step": 2549 }, { "epoch": 0.23526698189366854, "grad_norm": 4.451501371893454, "learning_rate": 1.1238274554141037e-06, "loss": 0.9408, "step": 2550 }, { "epoch": 0.23526698189366854, "eval_GEN Loss": 0.4650691747665405, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3606521785259247, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8812500238418579, "eval_runtime": 57.4661, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 2550 }, { "epoch": 0.2353592434551955, "grad_norm": 2.2577344799305603, "learning_rate": 1.123714075889687e-06, "loss": 0.7341, "step": 2551 }, { "epoch": 0.2354515050167224, "grad_norm": 1.935955057499266, "learning_rate": 1.1236006511710154e-06, "loss": 0.8388, "step": 2552 }, { "epoch": 0.23554376657824933, "grad_norm": 1.904958157934222, "learning_rate": 1.123487181268368e-06, "loss": 0.6223, "step": 2553 }, { "epoch": 0.23563602813977627, "grad_norm": 2.4034295050685004, "learning_rate": 1.1233736661920278e-06, "loss": 0.7952, "step": 2554 }, { "epoch": 0.2357282897013032, "grad_norm": 3.2878261423784254, "learning_rate": 1.1232601059522814e-06, "loss": 0.8085, "step": 2555 }, { "epoch": 0.2357282897013032, "eval_GEN Loss": 0.46591365337371826, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.3971644639968872, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8887619972229004, "eval_runtime": 56.7474, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2555 }, { "epoch": 0.23582055126283014, "grad_norm": 2.413711180678156, "learning_rate": 1.12314650055942e-06, "loss": 0.7785, "step": 2556 }, { "epoch": 0.23591281282435705, "grad_norm": 1.578646643660678, "learning_rate": 1.1230328500237386e-06, "loss": 0.7172, "step": 2557 }, { "epoch": 0.23600507438588397, "grad_norm": 1.7671334029133194, "learning_rate": 1.1229191543555363e-06, "loss": 0.85, "step": 2558 }, { "epoch": 0.23609733594741092, "grad_norm": 2.0075239914500527, "learning_rate": 1.1228054135651164e-06, "loss": 0.7113, "step": 2559 }, { "epoch": 0.23618959750893784, "grad_norm": 2.8377217672071002, "learning_rate": 1.1226916276627866e-06, "loss": 1.0561, "step": 2560 }, { "epoch": 0.23618959750893784, "eval_GEN Loss": 0.46483534574508667, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.42682313919067383, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9055288434028625, "eval_runtime": 56.6655, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 2560 }, { "epoch": 0.23628185907046476, "grad_norm": 1.7992243342898053, "learning_rate": 1.1225777966588582e-06, "loss": 0.7715, "step": 2561 }, { "epoch": 0.2363741206319917, "grad_norm": 1.5924146515434936, "learning_rate": 1.1224639205636465e-06, "loss": 0.7376, "step": 2562 }, { "epoch": 0.23646638219351862, "grad_norm": 2.5928456411016514, "learning_rate": 1.1223499993874712e-06, "loss": 0.7723, "step": 2563 }, { "epoch": 0.23655864375504557, "grad_norm": 2.432199496348407, "learning_rate": 1.1222360331406564e-06, "loss": 0.8685, "step": 2564 }, { "epoch": 0.23665090531657249, "grad_norm": 1.3741751143949394, "learning_rate": 1.1221220218335293e-06, "loss": 0.6125, "step": 2565 }, { "epoch": 0.23665090531657249, "eval_GEN Loss": 0.4643940031528473, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41885513067245483, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9077523946762085, "eval_runtime": 57.0156, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 2565 }, { "epoch": 0.2367431668780994, "grad_norm": 1.4487965371124216, "learning_rate": 1.1220079654764224e-06, "loss": 0.7297, "step": 2566 }, { "epoch": 0.23683542843962635, "grad_norm": 2.158227852156897, "learning_rate": 1.121893864079671e-06, "loss": 0.7006, "step": 2567 }, { "epoch": 0.23692769000115327, "grad_norm": 2.543070925070056, "learning_rate": 1.121779717653616e-06, "loss": 0.8689, "step": 2568 }, { "epoch": 0.2370199515626802, "grad_norm": 1.3737590732668938, "learning_rate": 1.1216655262086008e-06, "loss": 0.6451, "step": 2569 }, { "epoch": 0.23711221312420713, "grad_norm": 2.0399396054569614, "learning_rate": 1.1215512897549738e-06, "loss": 0.8344, "step": 2570 }, { "epoch": 0.23711221312420713, "eval_GEN Loss": 0.46495646238327026, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.3905562162399292, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9021634459495544, "eval_runtime": 56.7579, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2570 }, { "epoch": 0.23720447468573405, "grad_norm": 1.9272540358650754, "learning_rate": 1.1214370083030874e-06, "loss": 0.6872, "step": 2571 }, { "epoch": 0.237296736247261, "grad_norm": 2.0792286041612966, "learning_rate": 1.1213226818632979e-06, "loss": 0.9057, "step": 2572 }, { "epoch": 0.23738899780878792, "grad_norm": 1.7602523207797398, "learning_rate": 1.1212083104459656e-06, "loss": 0.7097, "step": 2573 }, { "epoch": 0.23748125937031483, "grad_norm": 2.7092024520314406, "learning_rate": 1.1210938940614554e-06, "loss": 1.0002, "step": 2574 }, { "epoch": 0.23757352093184178, "grad_norm": 2.213368663770566, "learning_rate": 1.1209794327201354e-06, "loss": 0.9512, "step": 2575 }, { "epoch": 0.23757352093184178, "eval_GEN Loss": 0.46629077196121216, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3744640648365021, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9001802802085876, "eval_runtime": 57.154, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 2575 }, { "epoch": 0.2376657824933687, "grad_norm": 2.2257461915290966, "learning_rate": 1.1208649264323787e-06, "loss": 0.7274, "step": 2576 }, { "epoch": 0.23775804405489562, "grad_norm": 2.0154960156775914, "learning_rate": 1.120750375208562e-06, "loss": 0.7006, "step": 2577 }, { "epoch": 0.23785030561642256, "grad_norm": 1.8514038743508354, "learning_rate": 1.1206357790590657e-06, "loss": 0.6589, "step": 2578 }, { "epoch": 0.23794256717794948, "grad_norm": 1.812508552994726, "learning_rate": 1.120521137994275e-06, "loss": 0.6732, "step": 2579 }, { "epoch": 0.23803482873947643, "grad_norm": 1.7726608492956808, "learning_rate": 1.1204064520245788e-06, "loss": 0.7692, "step": 2580 }, { "epoch": 0.23803482873947643, "eval_GEN Loss": 0.4679611623287201, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3795567750930786, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8996995091438293, "eval_runtime": 56.7412, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2580 }, { "epoch": 0.23812709030100335, "grad_norm": 1.9729873787395944, "learning_rate": 1.1202917211603703e-06, "loss": 0.8437, "step": 2581 }, { "epoch": 0.23821935186253027, "grad_norm": 1.8435487070001206, "learning_rate": 1.1201769454120464e-06, "loss": 0.7759, "step": 2582 }, { "epoch": 0.2383116134240572, "grad_norm": 2.0289952064123127, "learning_rate": 1.1200621247900083e-06, "loss": 0.6987, "step": 2583 }, { "epoch": 0.23840387498558413, "grad_norm": 2.0958208286160525, "learning_rate": 1.119947259304661e-06, "loss": 0.8447, "step": 2584 }, { "epoch": 0.23849613654711105, "grad_norm": 1.9227664424655957, "learning_rate": 1.1198323489664143e-06, "loss": 0.685, "step": 2585 }, { "epoch": 0.23849613654711105, "eval_GEN Loss": 0.4695647358894348, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4069802165031433, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9093149304389954, "eval_runtime": 55.9755, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2585 }, { "epoch": 0.238588398108638, "grad_norm": 2.6346044059746117, "learning_rate": 1.1197173937856812e-06, "loss": 0.8283, "step": 2586 }, { "epoch": 0.2386806596701649, "grad_norm": 2.2779477792534593, "learning_rate": 1.119602393772879e-06, "loss": 0.7428, "step": 2587 }, { "epoch": 0.23877292123169186, "grad_norm": 2.657376334867618, "learning_rate": 1.1194873489384294e-06, "loss": 0.874, "step": 2588 }, { "epoch": 0.23886518279321878, "grad_norm": 1.428451456630398, "learning_rate": 1.119372259292758e-06, "loss": 0.783, "step": 2589 }, { "epoch": 0.2389574443547457, "grad_norm": 1.778757753593459, "learning_rate": 1.1192571248462943e-06, "loss": 0.7061, "step": 2590 }, { "epoch": 0.2389574443547457, "eval_GEN Loss": 0.4712638258934021, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7888947092718702, "eval_PRM F1 Neg": 0.6206896551724138, "eval_PRM Loss": 0.45570430159568787, "eval_PRM NPV": 0.5142857142857142, "eval_PRM Precision": 0.9295774647887324, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9371995329856873, "eval_runtime": 55.6965, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 2590 }, { "epoch": 0.23904970591627264, "grad_norm": 1.735152051528127, "learning_rate": 1.1191419456094718e-06, "loss": 0.6781, "step": 2591 }, { "epoch": 0.23914196747779956, "grad_norm": 2.7383848006946643, "learning_rate": 1.1190267215927287e-06, "loss": 0.7268, "step": 2592 }, { "epoch": 0.23923422903932648, "grad_norm": 1.9042119975874754, "learning_rate": 1.1189114528065063e-06, "loss": 0.7572, "step": 2593 }, { "epoch": 0.23932649060085343, "grad_norm": 2.088345537741797, "learning_rate": 1.1187961392612506e-06, "loss": 0.7748, "step": 2594 }, { "epoch": 0.23941875216238034, "grad_norm": 2.757349713158077, "learning_rate": 1.1186807809674115e-06, "loss": 0.6148, "step": 2595 }, { "epoch": 0.23941875216238034, "eval_GEN Loss": 0.4711546003818512, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7888947092718702, "eval_PRM F1 Neg": 0.6206896551724138, "eval_PRM Loss": 0.45487111806869507, "eval_PRM NPV": 0.5142857142857142, "eval_PRM Precision": 0.9295774647887324, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9346153736114502, "eval_runtime": 56.6127, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 2595 }, { "epoch": 0.2395110137239073, "grad_norm": 1.808332122177196, "learning_rate": 1.118565377935443e-06, "loss": 0.7489, "step": 2596 }, { "epoch": 0.2396032752854342, "grad_norm": 1.417073802622359, "learning_rate": 1.1184499301758032e-06, "loss": 0.5061, "step": 2597 }, { "epoch": 0.23969553684696113, "grad_norm": 1.9466946699476475, "learning_rate": 1.1183344376989538e-06, "loss": 0.7785, "step": 2598 }, { "epoch": 0.23978779840848807, "grad_norm": 2.303712894332619, "learning_rate": 1.1182189005153612e-06, "loss": 0.9928, "step": 2599 }, { "epoch": 0.239880059970015, "grad_norm": 2.699353816427195, "learning_rate": 1.1181033186354957e-06, "loss": 0.7598, "step": 2600 }, { "epoch": 0.239880059970015, "eval_GEN Loss": 0.4719969928264618, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4061139225959778, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9103365540504456, "eval_runtime": 55.8192, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2600 }, { "epoch": 0.2399723215315419, "grad_norm": 1.3226400337027335, "learning_rate": 1.117987692069831e-06, "loss": 0.6029, "step": 2601 }, { "epoch": 0.24006458309306886, "grad_norm": 1.8055411209427468, "learning_rate": 1.117872020828846e-06, "loss": 0.8511, "step": 2602 }, { "epoch": 0.24015684465459577, "grad_norm": 2.523980707739512, "learning_rate": 1.1177563049230224e-06, "loss": 0.8335, "step": 2603 }, { "epoch": 0.24024910621612272, "grad_norm": 2.6537671700111254, "learning_rate": 1.117640544362847e-06, "loss": 0.8793, "step": 2604 }, { "epoch": 0.24034136777764964, "grad_norm": 2.6910494722363367, "learning_rate": 1.1175247391588097e-06, "loss": 0.6902, "step": 2605 }, { "epoch": 0.24034136777764964, "eval_GEN Loss": 0.4716975688934326, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3727628290653229, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9069110751152039, "eval_runtime": 55.7799, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2605 }, { "epoch": 0.24043362933917656, "grad_norm": 1.7087716381305673, "learning_rate": 1.1174088893214056e-06, "loss": 0.5984, "step": 2606 }, { "epoch": 0.2405258909007035, "grad_norm": 1.6349844486450962, "learning_rate": 1.117292994861133e-06, "loss": 0.751, "step": 2607 }, { "epoch": 0.24061815246223042, "grad_norm": 2.257379986588271, "learning_rate": 1.1171770557884942e-06, "loss": 0.6488, "step": 2608 }, { "epoch": 0.24071041402375734, "grad_norm": 1.4797117470245391, "learning_rate": 1.1170610721139957e-06, "loss": 0.6943, "step": 2609 }, { "epoch": 0.2408026755852843, "grad_norm": 3.203300606249343, "learning_rate": 1.1169450438481486e-06, "loss": 0.7245, "step": 2610 }, { "epoch": 0.2408026755852843, "eval_GEN Loss": 0.47212257981300354, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3651526868343353, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9094951748847961, "eval_runtime": 55.776, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2610 }, { "epoch": 0.2408949371468112, "grad_norm": 2.082562661039052, "learning_rate": 1.1168289710014673e-06, "loss": 0.6943, "step": 2611 }, { "epoch": 0.24098719870833815, "grad_norm": 1.3461386274799059, "learning_rate": 1.1167128535844705e-06, "loss": 0.7148, "step": 2612 }, { "epoch": 0.24107946026986507, "grad_norm": 1.7466275712776993, "learning_rate": 1.1165966916076807e-06, "loss": 0.8748, "step": 2613 }, { "epoch": 0.241171721831392, "grad_norm": 1.4778306964718693, "learning_rate": 1.116480485081625e-06, "loss": 0.6777, "step": 2614 }, { "epoch": 0.24126398339291893, "grad_norm": 1.5605011569521596, "learning_rate": 1.1163642340168342e-06, "loss": 0.696, "step": 2615 }, { "epoch": 0.24126398339291893, "eval_GEN Loss": 0.4711157977581024, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37030795216560364, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9044471383094788, "eval_runtime": 55.8132, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2615 }, { "epoch": 0.24135624495444585, "grad_norm": 2.2301855181418073, "learning_rate": 1.116247938423843e-06, "loss": 0.7758, "step": 2616 }, { "epoch": 0.24144850651597277, "grad_norm": 2.111904500075404, "learning_rate": 1.1161315983131907e-06, "loss": 0.6658, "step": 2617 }, { "epoch": 0.24154076807749972, "grad_norm": 1.5123236063854808, "learning_rate": 1.1160152136954198e-06, "loss": 0.7382, "step": 2618 }, { "epoch": 0.24163302963902664, "grad_norm": 1.7181890502465444, "learning_rate": 1.1158987845810771e-06, "loss": 0.622, "step": 2619 }, { "epoch": 0.24172529120055358, "grad_norm": 1.7510919721248044, "learning_rate": 1.115782310980714e-06, "loss": 0.7016, "step": 2620 }, { "epoch": 0.24172529120055358, "eval_GEN Loss": 0.47017866373062134, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37671229243278503, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9063100814819336, "eval_runtime": 55.8576, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2620 }, { "epoch": 0.2418175527620805, "grad_norm": 1.8378109776070277, "learning_rate": 1.1156657929048855e-06, "loss": 0.7029, "step": 2621 }, { "epoch": 0.24190981432360742, "grad_norm": 2.321164617975305, "learning_rate": 1.1155492303641503e-06, "loss": 0.692, "step": 2622 }, { "epoch": 0.24200207588513437, "grad_norm": 2.664759457326069, "learning_rate": 1.1154326233690718e-06, "loss": 0.7498, "step": 2623 }, { "epoch": 0.24209433744666128, "grad_norm": 2.6055498615935666, "learning_rate": 1.115315971930217e-06, "loss": 0.9187, "step": 2624 }, { "epoch": 0.2421865990081882, "grad_norm": 1.9355539873623118, "learning_rate": 1.1151992760581573e-06, "loss": 0.609, "step": 2625 }, { "epoch": 0.2421865990081882, "eval_GEN Loss": 0.47074583172798157, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.3882634937763214, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9135817289352417, "eval_runtime": 55.6479, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 2625 }, { "epoch": 0.24227886056971515, "grad_norm": 2.944471657945971, "learning_rate": 1.1150825357634672e-06, "loss": 0.8762, "step": 2626 }, { "epoch": 0.24237112213124207, "grad_norm": 2.200905130844562, "learning_rate": 1.1149657510567265e-06, "loss": 0.6878, "step": 2627 }, { "epoch": 0.242463383692769, "grad_norm": 2.28866226747744, "learning_rate": 1.1148489219485183e-06, "loss": 0.6965, "step": 2628 }, { "epoch": 0.24255564525429593, "grad_norm": 1.824038878062565, "learning_rate": 1.1147320484494299e-06, "loss": 0.7871, "step": 2629 }, { "epoch": 0.24264790681582285, "grad_norm": 1.7826891608940783, "learning_rate": 1.114615130570052e-06, "loss": 0.742, "step": 2630 }, { "epoch": 0.24264790681582285, "eval_GEN Loss": 0.4712772071361542, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.39751917123794556, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9146033525466919, "eval_runtime": 56.0668, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 2630 }, { "epoch": 0.2427401683773498, "grad_norm": 1.3443934187863702, "learning_rate": 1.1144981683209808e-06, "loss": 0.5388, "step": 2631 }, { "epoch": 0.24283242993887671, "grad_norm": 1.9350901119904973, "learning_rate": 1.1143811617128147e-06, "loss": 0.7367, "step": 2632 }, { "epoch": 0.24292469150040363, "grad_norm": 2.0198018563883497, "learning_rate": 1.1142641107561576e-06, "loss": 0.6642, "step": 2633 }, { "epoch": 0.24301695306193058, "grad_norm": 1.7564955951482246, "learning_rate": 1.1141470154616165e-06, "loss": 0.7376, "step": 2634 }, { "epoch": 0.2431092146234575, "grad_norm": 2.2912139567429244, "learning_rate": 1.1140298758398032e-06, "loss": 0.7932, "step": 2635 }, { "epoch": 0.2431092146234575, "eval_GEN Loss": 0.4723615348339081, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.4061235785484314, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9222956895828247, "eval_runtime": 55.6989, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 2635 }, { "epoch": 0.24320147618498444, "grad_norm": 2.6350049683050263, "learning_rate": 1.1139126919013327e-06, "loss": 0.7523, "step": 2636 }, { "epoch": 0.24329373774651136, "grad_norm": 2.6376997258443313, "learning_rate": 1.1137954636568243e-06, "loss": 0.9642, "step": 2637 }, { "epoch": 0.24338599930803828, "grad_norm": 1.5119685825236164, "learning_rate": 1.1136781911169018e-06, "loss": 0.5982, "step": 2638 }, { "epoch": 0.24347826086956523, "grad_norm": 1.713111181227738, "learning_rate": 1.1135608742921925e-06, "loss": 0.6589, "step": 2639 }, { "epoch": 0.24357052243109215, "grad_norm": 1.8382115876879144, "learning_rate": 1.1134435131933276e-06, "loss": 0.7064, "step": 2640 }, { "epoch": 0.24357052243109215, "eval_GEN Loss": 0.47442442178726196, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41116347908973694, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9266225695610046, "eval_runtime": 56.8658, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2640 }, { "epoch": 0.24366278399261906, "grad_norm": 1.517008188562679, "learning_rate": 1.1133261078309429e-06, "loss": 0.6288, "step": 2641 }, { "epoch": 0.243755045554146, "grad_norm": 1.6833885463981062, "learning_rate": 1.1132086582156775e-06, "loss": 0.8063, "step": 2642 }, { "epoch": 0.24384730711567293, "grad_norm": 1.9506178692626712, "learning_rate": 1.1130911643581752e-06, "loss": 0.9221, "step": 2643 }, { "epoch": 0.24393956867719988, "grad_norm": 1.711158475549289, "learning_rate": 1.1129736262690833e-06, "loss": 0.7147, "step": 2644 }, { "epoch": 0.2440318302387268, "grad_norm": 2.244195921152605, "learning_rate": 1.112856043959053e-06, "loss": 0.7238, "step": 2645 }, { "epoch": 0.2440318302387268, "eval_GEN Loss": 0.47486352920532227, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.40899932384490967, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9401442408561707, "eval_runtime": 56.5917, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 2645 }, { "epoch": 0.2441240918002537, "grad_norm": 1.6849552676106292, "learning_rate": 1.1127384174387405e-06, "loss": 0.5591, "step": 2646 }, { "epoch": 0.24421635336178066, "grad_norm": 2.903197551076138, "learning_rate": 1.1126207467188047e-06, "loss": 0.9402, "step": 2647 }, { "epoch": 0.24430861492330758, "grad_norm": 2.36574246101209, "learning_rate": 1.1125030318099092e-06, "loss": 0.7487, "step": 2648 }, { "epoch": 0.2444008764848345, "grad_norm": 1.5393744570309666, "learning_rate": 1.1123852727227218e-06, "loss": 0.8016, "step": 2649 }, { "epoch": 0.24449313804636144, "grad_norm": 1.868008692844655, "learning_rate": 1.1122674694679137e-06, "loss": 0.6475, "step": 2650 }, { "epoch": 0.24449313804636144, "eval_GEN Loss": 0.4760426878929138, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4073770344257355, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9487980604171753, "eval_runtime": 56.8027, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2650 }, { "epoch": 0.24458539960788836, "grad_norm": 2.734933908646507, "learning_rate": 1.1121496220561605e-06, "loss": 0.985, "step": 2651 }, { "epoch": 0.2446776611694153, "grad_norm": 2.0199063915080253, "learning_rate": 1.112031730498142e-06, "loss": 0.7998, "step": 2652 }, { "epoch": 0.24476992273094222, "grad_norm": 1.7830298994819749, "learning_rate": 1.1119137948045413e-06, "loss": 0.8221, "step": 2653 }, { "epoch": 0.24486218429246914, "grad_norm": 3.3780892989823603, "learning_rate": 1.1117958149860465e-06, "loss": 0.9432, "step": 2654 }, { "epoch": 0.2449544458539961, "grad_norm": 2.0519511551282648, "learning_rate": 1.1116777910533484e-06, "loss": 0.7193, "step": 2655 }, { "epoch": 0.2449544458539961, "eval_GEN Loss": 0.47731730341911316, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.43130752444267273, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9389122724533081, "eval_runtime": 55.7727, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2655 }, { "epoch": 0.245046707415523, "grad_norm": 1.7867197941851463, "learning_rate": 1.1115597230171427e-06, "loss": 0.6895, "step": 2656 }, { "epoch": 0.24513896897704993, "grad_norm": 1.8496498318116188, "learning_rate": 1.111441610888129e-06, "loss": 0.7608, "step": 2657 }, { "epoch": 0.24523123053857687, "grad_norm": 2.9975046480207412, "learning_rate": 1.111323454677011e-06, "loss": 0.6447, "step": 2658 }, { "epoch": 0.2453234921001038, "grad_norm": 2.435834494320346, "learning_rate": 1.1112052543944963e-06, "loss": 0.8602, "step": 2659 }, { "epoch": 0.24541575366163074, "grad_norm": 1.5755190483418144, "learning_rate": 1.1110870100512958e-06, "loss": 0.531, "step": 2660 }, { "epoch": 0.24541575366163074, "eval_GEN Loss": 0.4768896996974945, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.43830370903015137, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.934495210647583, "eval_runtime": 55.8348, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2660 }, { "epoch": 0.24550801522315766, "grad_norm": 1.7338215646981916, "learning_rate": 1.1109687216581255e-06, "loss": 0.666, "step": 2661 }, { "epoch": 0.24560027678468457, "grad_norm": 2.60583301671582, "learning_rate": 1.1108503892257048e-06, "loss": 0.7092, "step": 2662 }, { "epoch": 0.24569253834621152, "grad_norm": 2.6521807938255275, "learning_rate": 1.1107320127647567e-06, "loss": 1.0368, "step": 2663 }, { "epoch": 0.24578479990773844, "grad_norm": 1.9397235093993084, "learning_rate": 1.1106135922860093e-06, "loss": 0.8096, "step": 2664 }, { "epoch": 0.24587706146926536, "grad_norm": 1.4033374000064165, "learning_rate": 1.1104951278001937e-06, "loss": 0.7326, "step": 2665 }, { "epoch": 0.24587706146926536, "eval_GEN Loss": 0.4765397012233734, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4285373389720917, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9275240302085876, "eval_runtime": 55.7565, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 2665 }, { "epoch": 0.2459693230307923, "grad_norm": 2.164335109214383, "learning_rate": 1.1103766193180456e-06, "loss": 0.8181, "step": 2666 }, { "epoch": 0.24606158459231922, "grad_norm": 2.2196893197651812, "learning_rate": 1.1102580668503043e-06, "loss": 0.7924, "step": 2667 }, { "epoch": 0.24615384615384617, "grad_norm": 2.993252069894412, "learning_rate": 1.1101394704077132e-06, "loss": 0.9642, "step": 2668 }, { "epoch": 0.24624610771537309, "grad_norm": 2.27327253053909, "learning_rate": 1.1100208300010195e-06, "loss": 0.8564, "step": 2669 }, { "epoch": 0.2463383692769, "grad_norm": 2.3821446459764504, "learning_rate": 1.1099021456409748e-06, "loss": 0.7544, "step": 2670 }, { "epoch": 0.2463383692769, "eval_GEN Loss": 0.4759509563446045, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.42510223388671875, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9228966236114502, "eval_runtime": 56.0279, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2670 }, { "epoch": 0.24643063083842695, "grad_norm": 1.7964367007397872, "learning_rate": 1.1097834173383344e-06, "loss": 0.7891, "step": 2671 }, { "epoch": 0.24652289239995387, "grad_norm": 1.7203876762332726, "learning_rate": 1.1096646451038578e-06, "loss": 0.6537, "step": 2672 }, { "epoch": 0.2466151539614808, "grad_norm": 2.3866574552580597, "learning_rate": 1.109545828948308e-06, "loss": 0.7328, "step": 2673 }, { "epoch": 0.24670741552300773, "grad_norm": 1.7511228802379015, "learning_rate": 1.1094269688824526e-06, "loss": 0.8012, "step": 2674 }, { "epoch": 0.24679967708453465, "grad_norm": 1.6420429647856971, "learning_rate": 1.1093080649170626e-06, "loss": 0.7032, "step": 2675 }, { "epoch": 0.24679967708453465, "eval_GEN Loss": 0.4752283990383148, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.410010427236557, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.921875, "eval_runtime": 56.7526, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2675 }, { "epoch": 0.2468919386460616, "grad_norm": 2.92803193347504, "learning_rate": 1.1091891170629137e-06, "loss": 0.8658, "step": 2676 }, { "epoch": 0.24698420020758852, "grad_norm": 1.2843911845081415, "learning_rate": 1.1090701253307848e-06, "loss": 0.6142, "step": 2677 }, { "epoch": 0.24707646176911544, "grad_norm": 1.7815618811696259, "learning_rate": 1.1089510897314591e-06, "loss": 0.6174, "step": 2678 }, { "epoch": 0.24716872333064238, "grad_norm": 1.6848760870756567, "learning_rate": 1.108832010275724e-06, "loss": 0.7942, "step": 2679 }, { "epoch": 0.2472609848921693, "grad_norm": 2.0652980233879488, "learning_rate": 1.1087128869743704e-06, "loss": 0.8283, "step": 2680 }, { "epoch": 0.2472609848921693, "eval_GEN Loss": 0.4764530658721924, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.39405161142349243, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9256610870361328, "eval_runtime": 55.736, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 2680 }, { "epoch": 0.24735324645369622, "grad_norm": 1.4959808394336118, "learning_rate": 1.1085937198381938e-06, "loss": 0.7071, "step": 2681 }, { "epoch": 0.24744550801522316, "grad_norm": 1.5492094935392113, "learning_rate": 1.1084745088779932e-06, "loss": 0.6962, "step": 2682 }, { "epoch": 0.24753776957675008, "grad_norm": 1.5212333996460836, "learning_rate": 1.1083552541045715e-06, "loss": 0.6939, "step": 2683 }, { "epoch": 0.24763003113827703, "grad_norm": 1.6342928925896765, "learning_rate": 1.1082359555287359e-06, "loss": 0.7901, "step": 2684 }, { "epoch": 0.24772229269980395, "grad_norm": 2.1132965754143966, "learning_rate": 1.1081166131612971e-06, "loss": 0.8711, "step": 2685 }, { "epoch": 0.24772229269980395, "eval_GEN Loss": 0.47772204875946045, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3826387822628021, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9354567527770996, "eval_runtime": 55.8083, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2685 }, { "epoch": 0.24781455426133087, "grad_norm": 1.8408714340145624, "learning_rate": 1.1079972270130706e-06, "loss": 0.725, "step": 2686 }, { "epoch": 0.2479068158228578, "grad_norm": 2.1413222276832324, "learning_rate": 1.1078777970948751e-06, "loss": 0.6882, "step": 2687 }, { "epoch": 0.24799907738438473, "grad_norm": 1.8030187154881656, "learning_rate": 1.1077583234175338e-06, "loss": 0.7754, "step": 2688 }, { "epoch": 0.24809133894591165, "grad_norm": 1.5547666932982365, "learning_rate": 1.107638805991873e-06, "loss": 0.7013, "step": 2689 }, { "epoch": 0.2481836005074386, "grad_norm": 2.0074387054007024, "learning_rate": 1.1075192448287242e-06, "loss": 0.6715, "step": 2690 }, { "epoch": 0.2481836005074386, "eval_GEN Loss": 0.4780990481376648, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.37563762068748474, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9396634697914124, "eval_runtime": 55.9202, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2690 }, { "epoch": 0.2482758620689655, "grad_norm": 1.7498174218088007, "learning_rate": 1.1073996399389219e-06, "loss": 0.6374, "step": 2691 }, { "epoch": 0.24836812363049243, "grad_norm": 2.4867012202192145, "learning_rate": 1.1072799913333048e-06, "loss": 0.5798, "step": 2692 }, { "epoch": 0.24846038519201938, "grad_norm": 1.5050903166311473, "learning_rate": 1.1071602990227156e-06, "loss": 0.5502, "step": 2693 }, { "epoch": 0.2485526467535463, "grad_norm": 3.2452340997446245, "learning_rate": 1.1070405630180014e-06, "loss": 0.8691, "step": 2694 }, { "epoch": 0.24864490831507324, "grad_norm": 2.1210822441781514, "learning_rate": 1.1069207833300128e-06, "loss": 0.711, "step": 2695 }, { "epoch": 0.24864490831507324, "eval_GEN Loss": 0.47814249992370605, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.37390992045402527, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9502403736114502, "eval_runtime": 55.9602, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2695 }, { "epoch": 0.24873716987660016, "grad_norm": 2.8177571574365814, "learning_rate": 1.106800959969604e-06, "loss": 0.9125, "step": 2696 }, { "epoch": 0.24882943143812708, "grad_norm": 1.5027747160508305, "learning_rate": 1.106681092947634e-06, "loss": 0.5993, "step": 2697 }, { "epoch": 0.24892169299965403, "grad_norm": 2.1972824734459353, "learning_rate": 1.106561182274965e-06, "loss": 0.6126, "step": 2698 }, { "epoch": 0.24901395456118094, "grad_norm": 1.87921303262548, "learning_rate": 1.106441227962464e-06, "loss": 0.6475, "step": 2699 }, { "epoch": 0.24910621612270786, "grad_norm": 2.269059349742849, "learning_rate": 1.1063212300210007e-06, "loss": 0.7593, "step": 2700 }, { "epoch": 0.24910621612270786, "eval_GEN Loss": 0.4765802025794983, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3797445595264435, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9288461804389954, "eval_runtime": 55.8275, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2700 }, { "epoch": 0.2491984776842348, "grad_norm": 2.133584930517032, "learning_rate": 1.1062011884614502e-06, "loss": 0.7743, "step": 2701 }, { "epoch": 0.24929073924576173, "grad_norm": 2.759934439164502, "learning_rate": 1.1060811032946904e-06, "loss": 0.8687, "step": 2702 }, { "epoch": 0.24938300080728867, "grad_norm": 1.501543511252636, "learning_rate": 1.1059609745316038e-06, "loss": 0.5996, "step": 2703 }, { "epoch": 0.2494752623688156, "grad_norm": 2.765476358871736, "learning_rate": 1.105840802183077e-06, "loss": 0.8542, "step": 2704 }, { "epoch": 0.2495675239303425, "grad_norm": 2.192084663737546, "learning_rate": 1.1057205862599995e-06, "loss": 0.8602, "step": 2705 }, { "epoch": 0.2495675239303425, "eval_GEN Loss": 0.47709906101226807, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.40841448307037354, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.922656238079071, "eval_runtime": 55.886, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2705 }, { "epoch": 0.24965978549186946, "grad_norm": 1.82215323380972, "learning_rate": 1.1056003267732657e-06, "loss": 0.7283, "step": 2706 }, { "epoch": 0.24975204705339638, "grad_norm": 1.9918539551359982, "learning_rate": 1.105480023733774e-06, "loss": 0.7047, "step": 2707 }, { "epoch": 0.2498443086149233, "grad_norm": 2.1372829755698053, "learning_rate": 1.1053596771524263e-06, "loss": 0.7286, "step": 2708 }, { "epoch": 0.24993657017645024, "grad_norm": 3.666956765802162, "learning_rate": 1.1052392870401285e-06, "loss": 0.5377, "step": 2709 }, { "epoch": 0.2500288317379772, "grad_norm": 2.434505687115984, "learning_rate": 1.1051188534077906e-06, "loss": 0.669, "step": 2710 }, { "epoch": 0.2500288317379772, "eval_GEN Loss": 0.47733473777770996, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4218302369117737, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9270432591438293, "eval_runtime": 55.9367, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2710 }, { "epoch": 0.2501210932995041, "grad_norm": 2.58324077058937, "learning_rate": 1.1049983762663267e-06, "loss": 0.9696, "step": 2711 }, { "epoch": 0.250213354861031, "grad_norm": 1.8620362834184567, "learning_rate": 1.104877855626654e-06, "loss": 0.7172, "step": 2712 }, { "epoch": 0.25030561642255794, "grad_norm": 2.60333731709298, "learning_rate": 1.104757291499695e-06, "loss": 0.7288, "step": 2713 }, { "epoch": 0.25039787798408486, "grad_norm": 2.0264868894723147, "learning_rate": 1.104636683896375e-06, "loss": 0.7463, "step": 2714 }, { "epoch": 0.25049013954561183, "grad_norm": 2.05589004516307, "learning_rate": 1.1045160328276237e-06, "loss": 0.6319, "step": 2715 }, { "epoch": 0.25049013954561183, "eval_GEN Loss": 0.4764898121356964, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4027074873447418, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9216946959495544, "eval_runtime": 56.0182, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2715 }, { "epoch": 0.25058240110713875, "grad_norm": 2.5289463158075356, "learning_rate": 1.104395338304375e-06, "loss": 0.6668, "step": 2716 }, { "epoch": 0.25067466266866567, "grad_norm": 1.5864082678088869, "learning_rate": 1.1042746003375656e-06, "loss": 0.6903, "step": 2717 }, { "epoch": 0.2507669242301926, "grad_norm": 1.6947751046940056, "learning_rate": 1.104153818938138e-06, "loss": 0.7553, "step": 2718 }, { "epoch": 0.2508591857917195, "grad_norm": 2.44322897534241, "learning_rate": 1.104032994117037e-06, "loss": 0.851, "step": 2719 }, { "epoch": 0.2509514473532464, "grad_norm": 2.141264688497023, "learning_rate": 1.103912125885212e-06, "loss": 0.8212, "step": 2720 }, { "epoch": 0.2509514473532464, "eval_GEN Loss": 0.4742036759853363, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37442681193351746, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.924098551273346, "eval_runtime": 55.7235, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 2720 }, { "epoch": 0.2510437089147734, "grad_norm": 1.6571002455330712, "learning_rate": 1.1037912142536165e-06, "loss": 0.5541, "step": 2721 }, { "epoch": 0.2511359704763003, "grad_norm": 2.9809860574731837, "learning_rate": 1.1036702592332074e-06, "loss": 0.6998, "step": 2722 }, { "epoch": 0.25122823203782724, "grad_norm": 1.468966340414337, "learning_rate": 1.103549260834946e-06, "loss": 0.4936, "step": 2723 }, { "epoch": 0.25132049359935416, "grad_norm": 2.289771045783806, "learning_rate": 1.1034282190697973e-06, "loss": 0.8155, "step": 2724 }, { "epoch": 0.2514127551608811, "grad_norm": 1.5916603472113702, "learning_rate": 1.1033071339487305e-06, "loss": 0.7593, "step": 2725 }, { "epoch": 0.2514127551608811, "eval_GEN Loss": 0.4734470546245575, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37095266580581665, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9146033525466919, "eval_runtime": 55.9357, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2725 }, { "epoch": 0.25150501672240805, "grad_norm": 1.9223544384193163, "learning_rate": 1.1031860054827182e-06, "loss": 0.8488, "step": 2726 }, { "epoch": 0.25159727828393497, "grad_norm": 1.5396407340450482, "learning_rate": 1.1030648336827374e-06, "loss": 0.6941, "step": 2727 }, { "epoch": 0.2516895398454619, "grad_norm": 2.6191322420455068, "learning_rate": 1.1029436185597688e-06, "loss": 0.989, "step": 2728 }, { "epoch": 0.2517818014069888, "grad_norm": 1.4063027010558389, "learning_rate": 1.1028223601247974e-06, "loss": 0.7228, "step": 2729 }, { "epoch": 0.2518740629685157, "grad_norm": 1.7045344682664259, "learning_rate": 1.1027010583888115e-06, "loss": 0.6418, "step": 2730 }, { "epoch": 0.2518740629685157, "eval_GEN Loss": 0.4710525870323181, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.3637698292732239, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9052283763885498, "eval_runtime": 55.9242, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2730 }, { "epoch": 0.2519663245300427, "grad_norm": 1.687606690212869, "learning_rate": 1.102579713362804e-06, "loss": 0.7405, "step": 2731 }, { "epoch": 0.2520585860915696, "grad_norm": 2.197511379073901, "learning_rate": 1.1024583250577708e-06, "loss": 0.7448, "step": 2732 }, { "epoch": 0.25215084765309653, "grad_norm": 3.2422250647843427, "learning_rate": 1.1023368934847128e-06, "loss": 1.1846, "step": 2733 }, { "epoch": 0.25224310921462345, "grad_norm": 2.7578343184098104, "learning_rate": 1.1022154186546341e-06, "loss": 0.9751, "step": 2734 }, { "epoch": 0.25233537077615037, "grad_norm": 1.4020187852952832, "learning_rate": 1.102093900578543e-06, "loss": 0.707, "step": 2735 }, { "epoch": 0.25233537077615037, "eval_GEN Loss": 0.47052672505378723, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3734349310398102, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8960937261581421, "eval_runtime": 55.9148, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2735 }, { "epoch": 0.2524276323376773, "grad_norm": 2.546163967016158, "learning_rate": 1.1019723392674518e-06, "loss": 0.8057, "step": 2736 }, { "epoch": 0.25251989389920426, "grad_norm": 2.3967268437186138, "learning_rate": 1.1018507347323767e-06, "loss": 0.8003, "step": 2737 }, { "epoch": 0.2526121554607312, "grad_norm": 1.8438201721412526, "learning_rate": 1.101729086984337e-06, "loss": 0.7421, "step": 2738 }, { "epoch": 0.2527044170222581, "grad_norm": 1.6678431054044824, "learning_rate": 1.1016073960343573e-06, "loss": 0.7248, "step": 2739 }, { "epoch": 0.252796678583785, "grad_norm": 2.2137463759365152, "learning_rate": 1.101485661893465e-06, "loss": 0.6184, "step": 2740 }, { "epoch": 0.252796678583785, "eval_GEN Loss": 0.47182321548461914, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4018365740776062, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9039663672447205, "eval_runtime": 55.9513, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2740 }, { "epoch": 0.25288894014531194, "grad_norm": 1.864168833974342, "learning_rate": 1.1013638845726921e-06, "loss": 0.7604, "step": 2741 }, { "epoch": 0.2529812017068389, "grad_norm": 1.9727405405879306, "learning_rate": 1.1012420640830743e-06, "loss": 0.7417, "step": 2742 }, { "epoch": 0.25307346326836583, "grad_norm": 2.198680636928872, "learning_rate": 1.101120200435651e-06, "loss": 0.6413, "step": 2743 }, { "epoch": 0.25316572482989275, "grad_norm": 1.7728143302191022, "learning_rate": 1.1009982936414656e-06, "loss": 0.7255, "step": 2744 }, { "epoch": 0.25325798639141966, "grad_norm": 1.987240472964129, "learning_rate": 1.1008763437115657e-06, "loss": 0.6966, "step": 2745 }, { "epoch": 0.25325798639141966, "eval_GEN Loss": 0.4717996120452881, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3923601508140564, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9013221263885498, "eval_runtime": 55.8897, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2745 }, { "epoch": 0.2533502479529466, "grad_norm": 1.4273274115572978, "learning_rate": 1.1007543506570023e-06, "loss": 0.7564, "step": 2746 }, { "epoch": 0.25344250951447356, "grad_norm": 2.6709177785801677, "learning_rate": 1.100632314488831e-06, "loss": 0.6231, "step": 2747 }, { "epoch": 0.2535347710760005, "grad_norm": 1.7995659784526166, "learning_rate": 1.1005102352181106e-06, "loss": 0.7487, "step": 2748 }, { "epoch": 0.2536270326375274, "grad_norm": 1.6121025402103923, "learning_rate": 1.1003881128559043e-06, "loss": 0.682, "step": 2749 }, { "epoch": 0.2537192941990543, "grad_norm": 2.0586458948042443, "learning_rate": 1.1002659474132787e-06, "loss": 0.6513, "step": 2750 }, { "epoch": 0.2537192941990543, "eval_GEN Loss": 0.47003883123397827, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.36587613821029663, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8927283883094788, "eval_runtime": 56.0661, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 2750 }, { "epoch": 0.25381155576058123, "grad_norm": 1.7331050204059888, "learning_rate": 1.1001437389013052e-06, "loss": 0.7722, "step": 2751 }, { "epoch": 0.25390381732210815, "grad_norm": 1.563777794889261, "learning_rate": 1.100021487331058e-06, "loss": 0.5947, "step": 2752 }, { "epoch": 0.2539960788836351, "grad_norm": 1.8759858025217275, "learning_rate": 1.099899192713616e-06, "loss": 0.8462, "step": 2753 }, { "epoch": 0.25408834044516204, "grad_norm": 1.922353800268907, "learning_rate": 1.0997768550600615e-06, "loss": 0.693, "step": 2754 }, { "epoch": 0.25418060200668896, "grad_norm": 1.5572991964844718, "learning_rate": 1.0996544743814813e-06, "loss": 0.7165, "step": 2755 }, { "epoch": 0.25418060200668896, "eval_GEN Loss": 0.4701164662837982, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3527683615684509, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.897536039352417, "eval_runtime": 55.8188, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2755 }, { "epoch": 0.2542728635682159, "grad_norm": 1.6046248906656375, "learning_rate": 1.0995320506889654e-06, "loss": 0.6619, "step": 2756 }, { "epoch": 0.2543651251297428, "grad_norm": 1.4209949872231915, "learning_rate": 1.0994095839936081e-06, "loss": 0.6936, "step": 2757 }, { "epoch": 0.25445738669126977, "grad_norm": 1.534915694918809, "learning_rate": 1.0992870743065077e-06, "loss": 0.532, "step": 2758 }, { "epoch": 0.2545496482527967, "grad_norm": 1.8044306504046457, "learning_rate": 1.0991645216387661e-06, "loss": 0.7963, "step": 2759 }, { "epoch": 0.2546419098143236, "grad_norm": 1.4632734763269986, "learning_rate": 1.0990419260014891e-06, "loss": 0.5536, "step": 2760 }, { "epoch": 0.2546419098143236, "eval_GEN Loss": 0.47240176796913147, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.34533143043518066, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8927884697914124, "eval_runtime": 55.7199, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 2760 }, { "epoch": 0.2547341713758505, "grad_norm": 1.7222787821212286, "learning_rate": 1.0989192874057865e-06, "loss": 0.6526, "step": 2761 }, { "epoch": 0.25482643293737745, "grad_norm": 1.7703129961636446, "learning_rate": 1.0987966058627726e-06, "loss": 0.7849, "step": 2762 }, { "epoch": 0.2549186944989044, "grad_norm": 1.5422890636705469, "learning_rate": 1.098673881383564e-06, "loss": 0.6029, "step": 2763 }, { "epoch": 0.25501095606043134, "grad_norm": 1.6050379066340041, "learning_rate": 1.098551113979283e-06, "loss": 0.4569, "step": 2764 }, { "epoch": 0.25510321762195826, "grad_norm": 1.3368182001234166, "learning_rate": 1.0984283036610544e-06, "loss": 0.6307, "step": 2765 }, { "epoch": 0.25510321762195826, "eval_GEN Loss": 0.4736599028110504, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3503721356391907, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8943509459495544, "eval_runtime": 55.9476, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2765 }, { "epoch": 0.2551954791834852, "grad_norm": 2.679884884446318, "learning_rate": 1.0983054504400078e-06, "loss": 0.9728, "step": 2766 }, { "epoch": 0.2552877407450121, "grad_norm": 2.2610303912303893, "learning_rate": 1.0981825543272765e-06, "loss": 0.7604, "step": 2767 }, { "epoch": 0.255380002306539, "grad_norm": 2.6415929410892214, "learning_rate": 1.098059615333997e-06, "loss": 0.9016, "step": 2768 }, { "epoch": 0.255472263868066, "grad_norm": 1.8350088078906566, "learning_rate": 1.0979366334713108e-06, "loss": 0.7414, "step": 2769 }, { "epoch": 0.2555645254295929, "grad_norm": 1.7231897799566085, "learning_rate": 1.0978136087503625e-06, "loss": 0.727, "step": 2770 }, { "epoch": 0.2555645254295929, "eval_GEN Loss": 0.4734903573989868, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3658936619758606, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8900841474533081, "eval_runtime": 55.934, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2770 }, { "epoch": 0.2556567869911198, "grad_norm": 1.6561298745041995, "learning_rate": 1.0976905411823005e-06, "loss": 0.7006, "step": 2771 }, { "epoch": 0.25574904855264674, "grad_norm": 1.5465264004793344, "learning_rate": 1.097567430778278e-06, "loss": 0.6357, "step": 2772 }, { "epoch": 0.25584131011417366, "grad_norm": 1.4634836315657354, "learning_rate": 1.0974442775494506e-06, "loss": 0.7187, "step": 2773 }, { "epoch": 0.25593357167570063, "grad_norm": 2.37903174551299, "learning_rate": 1.0973210815069795e-06, "loss": 0.8919, "step": 2774 }, { "epoch": 0.25602583323722755, "grad_norm": 1.9867145247951667, "learning_rate": 1.0971978426620285e-06, "loss": 0.5644, "step": 2775 }, { "epoch": 0.25602583323722755, "eval_GEN Loss": 0.47412750124931335, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.37998804450035095, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8872596025466919, "eval_runtime": 56.6649, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 2775 }, { "epoch": 0.25611809479875447, "grad_norm": 1.6259013407828804, "learning_rate": 1.0970745610257657e-06, "loss": 0.8081, "step": 2776 }, { "epoch": 0.2562103563602814, "grad_norm": 1.7748196718121532, "learning_rate": 1.096951236609363e-06, "loss": 0.7647, "step": 2777 }, { "epoch": 0.2563026179218083, "grad_norm": 1.779199920781924, "learning_rate": 1.0968278694239965e-06, "loss": 0.7141, "step": 2778 }, { "epoch": 0.2563948794833353, "grad_norm": 1.8238775569929553, "learning_rate": 1.096704459480846e-06, "loss": 0.8336, "step": 2779 }, { "epoch": 0.2564871410448622, "grad_norm": 2.5219035745327996, "learning_rate": 1.0965810067910946e-06, "loss": 0.7671, "step": 2780 }, { "epoch": 0.2564871410448622, "eval_GEN Loss": 0.47480443120002747, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.38208648562431335, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8912860751152039, "eval_runtime": 55.9268, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2780 }, { "epoch": 0.2565794026063891, "grad_norm": 2.010591698276529, "learning_rate": 1.09645751136593e-06, "loss": 0.7778, "step": 2781 }, { "epoch": 0.25667166416791604, "grad_norm": 1.9932117067457162, "learning_rate": 1.096333973216544e-06, "loss": 0.9167, "step": 2782 }, { "epoch": 0.25676392572944295, "grad_norm": 1.6171203505033056, "learning_rate": 1.0962103923541311e-06, "loss": 0.8603, "step": 2783 }, { "epoch": 0.2568561872909699, "grad_norm": 2.4121571177480354, "learning_rate": 1.096086768789891e-06, "loss": 0.836, "step": 2784 }, { "epoch": 0.25694844885249685, "grad_norm": 1.5901849529773644, "learning_rate": 1.0959631025350264e-06, "loss": 0.6084, "step": 2785 }, { "epoch": 0.25694844885249685, "eval_GEN Loss": 0.47598758339881897, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.388836145401001, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8961538672447205, "eval_runtime": 56.9302, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2785 }, { "epoch": 0.25704071041402377, "grad_norm": 1.8847158556124448, "learning_rate": 1.0958393936007442e-06, "loss": 0.7882, "step": 2786 }, { "epoch": 0.2571329719755507, "grad_norm": 1.5407724113318073, "learning_rate": 1.0957156419982548e-06, "loss": 0.6125, "step": 2787 }, { "epoch": 0.2572252335370776, "grad_norm": 1.6609345073163515, "learning_rate": 1.0955918477387731e-06, "loss": 0.5919, "step": 2788 }, { "epoch": 0.2573174950986045, "grad_norm": 1.7724364631933782, "learning_rate": 1.0954680108335174e-06, "loss": 0.7188, "step": 2789 }, { "epoch": 0.2574097566601315, "grad_norm": 1.9579215759808466, "learning_rate": 1.0953441312937102e-06, "loss": 0.5865, "step": 2790 }, { "epoch": 0.2574097566601315, "eval_GEN Loss": 0.47702980041503906, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.39262256026268005, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9006009697914124, "eval_runtime": 56.8136, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2790 }, { "epoch": 0.2575020182216584, "grad_norm": 1.802557422520963, "learning_rate": 1.0952202091305774e-06, "loss": 0.8458, "step": 2791 }, { "epoch": 0.25759427978318533, "grad_norm": 1.54787936179994, "learning_rate": 1.0950962443553492e-06, "loss": 0.6077, "step": 2792 }, { "epoch": 0.25768654134471225, "grad_norm": 1.584416561131339, "learning_rate": 1.0949722369792592e-06, "loss": 0.6189, "step": 2793 }, { "epoch": 0.25777880290623917, "grad_norm": 2.352430888381316, "learning_rate": 1.0948481870135454e-06, "loss": 0.9219, "step": 2794 }, { "epoch": 0.25787106446776614, "grad_norm": 2.6680729850490867, "learning_rate": 1.0947240944694496e-06, "loss": 0.6239, "step": 2795 }, { "epoch": 0.25787106446776614, "eval_GEN Loss": 0.47783082723617554, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.37871477007865906, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9094350934028625, "eval_runtime": 55.8842, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2795 }, { "epoch": 0.25796332602929306, "grad_norm": 1.4334642233541819, "learning_rate": 1.0945999593582166e-06, "loss": 0.6609, "step": 2796 }, { "epoch": 0.25805558759082, "grad_norm": 1.348389367047391, "learning_rate": 1.0944757816910965e-06, "loss": 0.6109, "step": 2797 }, { "epoch": 0.2581478491523469, "grad_norm": 1.9822240292242792, "learning_rate": 1.0943515614793419e-06, "loss": 0.7317, "step": 2798 }, { "epoch": 0.2582401107138738, "grad_norm": 1.4757451030987536, "learning_rate": 1.0942272987342098e-06, "loss": 0.6135, "step": 2799 }, { "epoch": 0.25833237227540073, "grad_norm": 2.7201681269827813, "learning_rate": 1.0941029934669616e-06, "loss": 0.7775, "step": 2800 }, { "epoch": 0.25833237227540073, "eval_GEN Loss": 0.4769158661365509, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3735000193119049, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9156851172447205, "eval_runtime": 56.0778, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 2800 }, { "epoch": 0.2584246338369277, "grad_norm": 1.320850616664563, "learning_rate": 1.0939786456888616e-06, "loss": 0.5955, "step": 2801 }, { "epoch": 0.2585168953984546, "grad_norm": 1.9698847411133535, "learning_rate": 1.0938542554111788e-06, "loss": 0.6053, "step": 2802 }, { "epoch": 0.25860915695998155, "grad_norm": 2.674289754523188, "learning_rate": 1.093729822645185e-06, "loss": 0.8347, "step": 2803 }, { "epoch": 0.25870141852150846, "grad_norm": 1.9187299052654343, "learning_rate": 1.0936053474021573e-06, "loss": 0.8464, "step": 2804 }, { "epoch": 0.2587936800830354, "grad_norm": 1.7308216274669346, "learning_rate": 1.0934808296933753e-06, "loss": 0.6464, "step": 2805 }, { "epoch": 0.2587936800830354, "eval_GEN Loss": 0.4770454168319702, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3920973539352417, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9135817289352417, "eval_runtime": 55.8704, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2805 }, { "epoch": 0.25888594164456236, "grad_norm": 2.050243820309279, "learning_rate": 1.0933562695301228e-06, "loss": 0.749, "step": 2806 }, { "epoch": 0.2589782032060893, "grad_norm": 1.5088742536349635, "learning_rate": 1.0932316669236882e-06, "loss": 0.5941, "step": 2807 }, { "epoch": 0.2590704647676162, "grad_norm": 3.192567161532349, "learning_rate": 1.093107021885363e-06, "loss": 0.8434, "step": 2808 }, { "epoch": 0.2591627263291431, "grad_norm": 2.8380429039134536, "learning_rate": 1.0929823344264426e-06, "loss": 0.7969, "step": 2809 }, { "epoch": 0.25925498789067003, "grad_norm": 2.367740112491841, "learning_rate": 1.0928576045582266e-06, "loss": 0.6597, "step": 2810 }, { "epoch": 0.25925498789067003, "eval_GEN Loss": 0.4770470857620239, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4092256426811218, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9203125238418579, "eval_runtime": 55.8472, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2810 }, { "epoch": 0.259347249452197, "grad_norm": 1.665398423253935, "learning_rate": 1.0927328322920178e-06, "loss": 0.77, "step": 2811 }, { "epoch": 0.2594395110137239, "grad_norm": 1.750131626629132, "learning_rate": 1.0926080176391235e-06, "loss": 0.5612, "step": 2812 }, { "epoch": 0.25953177257525084, "grad_norm": 1.6182853219142004, "learning_rate": 1.0924831606108546e-06, "loss": 0.7637, "step": 2813 }, { "epoch": 0.25962403413677776, "grad_norm": 2.144579481980696, "learning_rate": 1.092358261218526e-06, "loss": 0.6083, "step": 2814 }, { "epoch": 0.2597162956983047, "grad_norm": 1.6875025106559716, "learning_rate": 1.0922333194734562e-06, "loss": 0.6488, "step": 2815 }, { "epoch": 0.2597162956983047, "eval_GEN Loss": 0.4769200384616852, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.42085930705070496, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9325721263885498, "eval_runtime": 55.7213, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 2815 }, { "epoch": 0.2598085572598316, "grad_norm": 2.162660529928559, "learning_rate": 1.0921083353869674e-06, "loss": 0.8474, "step": 2816 }, { "epoch": 0.25990081882135857, "grad_norm": 1.466975487936104, "learning_rate": 1.091983308970386e-06, "loss": 0.6649, "step": 2817 }, { "epoch": 0.2599930803828855, "grad_norm": 1.947681954358698, "learning_rate": 1.0918582402350421e-06, "loss": 0.7354, "step": 2818 }, { "epoch": 0.2600853419444124, "grad_norm": 1.4949756812404982, "learning_rate": 1.0917331291922698e-06, "loss": 0.5357, "step": 2819 }, { "epoch": 0.2601776035059393, "grad_norm": 1.7323684241199255, "learning_rate": 1.0916079758534067e-06, "loss": 0.6904, "step": 2820 }, { "epoch": 0.2601776035059393, "eval_GEN Loss": 0.47724971175193787, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.42346706986427307, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9420673251152039, "eval_runtime": 55.7956, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2820 }, { "epoch": 0.26026986506746624, "grad_norm": 2.285875956263543, "learning_rate": 1.0914827802297942e-06, "loss": 0.8076, "step": 2821 }, { "epoch": 0.2603621266289932, "grad_norm": 1.8603760629637214, "learning_rate": 1.091357542332778e-06, "loss": 0.7745, "step": 2822 }, { "epoch": 0.26045438819052014, "grad_norm": 2.7703884501992952, "learning_rate": 1.091232262173707e-06, "loss": 0.8429, "step": 2823 }, { "epoch": 0.26054664975204705, "grad_norm": 2.629327540371188, "learning_rate": 1.0911069397639349e-06, "loss": 0.9216, "step": 2824 }, { "epoch": 0.260638911313574, "grad_norm": 1.870606733976828, "learning_rate": 1.090981575114818e-06, "loss": 0.8966, "step": 2825 }, { "epoch": 0.260638911313574, "eval_GEN Loss": 0.4756940007209778, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.4186084568500519, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9485576748847961, "eval_runtime": 55.7228, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 2825 }, { "epoch": 0.2607311728751009, "grad_norm": 2.6340260628856034, "learning_rate": 1.0908561682377175e-06, "loss": 0.8419, "step": 2826 }, { "epoch": 0.26082343443662787, "grad_norm": 1.94939204128999, "learning_rate": 1.0907307191439977e-06, "loss": 0.7387, "step": 2827 }, { "epoch": 0.2609156959981548, "grad_norm": 1.5741812293126676, "learning_rate": 1.090605227845027e-06, "loss": 0.7373, "step": 2828 }, { "epoch": 0.2610079575596817, "grad_norm": 2.2443092110742726, "learning_rate": 1.0904796943521777e-06, "loss": 0.8435, "step": 2829 }, { "epoch": 0.2611002191212086, "grad_norm": 1.434500517995226, "learning_rate": 1.0903541186768257e-06, "loss": 0.6617, "step": 2830 }, { "epoch": 0.2611002191212086, "eval_GEN Loss": 0.47352904081344604, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.4016229212284088, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9518029093742371, "eval_runtime": 55.8548, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2830 }, { "epoch": 0.26119248068273554, "grad_norm": 1.7298664370626673, "learning_rate": 1.0902285008303513e-06, "loss": 0.7555, "step": 2831 }, { "epoch": 0.26128474224426246, "grad_norm": 1.4444042079177812, "learning_rate": 1.0901028408241377e-06, "loss": 0.5976, "step": 2832 }, { "epoch": 0.26137700380578943, "grad_norm": 1.6604419780132995, "learning_rate": 1.0899771386695726e-06, "loss": 0.6701, "step": 2833 }, { "epoch": 0.26146926536731635, "grad_norm": 3.146589065133363, "learning_rate": 1.0898513943780471e-06, "loss": 0.6214, "step": 2834 }, { "epoch": 0.26156152692884327, "grad_norm": 1.968668778021192, "learning_rate": 1.0897256079609567e-06, "loss": 0.6522, "step": 2835 }, { "epoch": 0.26156152692884327, "eval_GEN Loss": 0.4726296663284302, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3989977240562439, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9579927921295166, "eval_runtime": 55.89, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2835 }, { "epoch": 0.2616537884903702, "grad_norm": 3.026666023218241, "learning_rate": 1.0895997794297003e-06, "loss": 0.9134, "step": 2836 }, { "epoch": 0.2617460500518971, "grad_norm": 1.7298089701732546, "learning_rate": 1.0894739087956806e-06, "loss": 0.5006, "step": 2837 }, { "epoch": 0.2618383116134241, "grad_norm": 1.4286580177198507, "learning_rate": 1.089347996070304e-06, "loss": 0.5675, "step": 2838 }, { "epoch": 0.261930573174951, "grad_norm": 3.652190565418445, "learning_rate": 1.0892220412649814e-06, "loss": 0.8784, "step": 2839 }, { "epoch": 0.2620228347364779, "grad_norm": 1.7002966343821668, "learning_rate": 1.0890960443911265e-06, "loss": 0.6068, "step": 2840 }, { "epoch": 0.2620228347364779, "eval_GEN Loss": 0.4713214039802551, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.41650906205177307, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9401442408561707, "eval_runtime": 55.952, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2840 }, { "epoch": 0.26211509629800483, "grad_norm": 2.1625294193006255, "learning_rate": 1.0889700054601576e-06, "loss": 0.7479, "step": 2841 }, { "epoch": 0.26220735785953175, "grad_norm": 1.9285517920868451, "learning_rate": 1.0888439244834965e-06, "loss": 0.714, "step": 2842 }, { "epoch": 0.2622996194210587, "grad_norm": 1.5857584967914014, "learning_rate": 1.088717801472569e-06, "loss": 0.6862, "step": 2843 }, { "epoch": 0.26239188098258565, "grad_norm": 1.4191435423319874, "learning_rate": 1.0885916364388043e-06, "loss": 0.8066, "step": 2844 }, { "epoch": 0.26248414254411256, "grad_norm": 1.4633345884881437, "learning_rate": 1.0884654293936358e-06, "loss": 0.6089, "step": 2845 }, { "epoch": 0.26248414254411256, "eval_GEN Loss": 0.4720485210418701, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.426534503698349, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9353966116905212, "eval_runtime": 56.0563, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 2845 }, { "epoch": 0.2625764041056395, "grad_norm": 2.2858576838558835, "learning_rate": 1.0883391803485005e-06, "loss": 0.6386, "step": 2846 }, { "epoch": 0.2626686656671664, "grad_norm": 1.9808166992748992, "learning_rate": 1.0882128893148395e-06, "loss": 0.7891, "step": 2847 }, { "epoch": 0.2627609272286933, "grad_norm": 1.7137051599153532, "learning_rate": 1.0880865563040975e-06, "loss": 0.6102, "step": 2848 }, { "epoch": 0.2628531887902203, "grad_norm": 1.6459237540588072, "learning_rate": 1.0879601813277226e-06, "loss": 0.8092, "step": 2849 }, { "epoch": 0.2629454503517472, "grad_norm": 2.1743503929510166, "learning_rate": 1.0878337643971677e-06, "loss": 0.8703, "step": 2850 }, { "epoch": 0.2629454503517472, "eval_GEN Loss": 0.47063061594963074, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4229276776313782, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.931911051273346, "eval_runtime": 55.8547, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2850 }, { "epoch": 0.26303771191327413, "grad_norm": 2.0289772824087042, "learning_rate": 1.0877073055238883e-06, "loss": 0.9132, "step": 2851 }, { "epoch": 0.26312997347480105, "grad_norm": 2.0769986421133293, "learning_rate": 1.0875808047193444e-06, "loss": 0.7412, "step": 2852 }, { "epoch": 0.26322223503632797, "grad_norm": 1.6719285616073285, "learning_rate": 1.087454261995e-06, "loss": 0.5139, "step": 2853 }, { "epoch": 0.26331449659785494, "grad_norm": 1.7787465322995637, "learning_rate": 1.0873276773623227e-06, "loss": 0.8152, "step": 2854 }, { "epoch": 0.26340675815938186, "grad_norm": 2.1741799027194255, "learning_rate": 1.0872010508327833e-06, "loss": 0.8449, "step": 2855 }, { "epoch": 0.26340675815938186, "eval_GEN Loss": 0.47170206904411316, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.42667096853256226, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9335336685180664, "eval_runtime": 55.912, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2855 }, { "epoch": 0.2634990197209088, "grad_norm": 1.7974457261666446, "learning_rate": 1.0870743824178572e-06, "loss": 0.8676, "step": 2856 }, { "epoch": 0.2635912812824357, "grad_norm": 1.8658790318280039, "learning_rate": 1.086947672129023e-06, "loss": 0.8661, "step": 2857 }, { "epoch": 0.2636835428439626, "grad_norm": 2.184235811563245, "learning_rate": 1.086820919977764e-06, "loss": 0.7951, "step": 2858 }, { "epoch": 0.2637758044054896, "grad_norm": 2.122415369907746, "learning_rate": 1.0866941259755663e-06, "loss": 0.6642, "step": 2859 }, { "epoch": 0.2638680659670165, "grad_norm": 2.7901658251737365, "learning_rate": 1.0865672901339202e-06, "loss": 0.7244, "step": 2860 }, { "epoch": 0.2638680659670165, "eval_GEN Loss": 0.4719868302345276, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.42815595865249634, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9323317408561707, "eval_runtime": 55.8947, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2860 }, { "epoch": 0.2639603275285434, "grad_norm": 1.4985642027008574, "learning_rate": 1.0864404124643197e-06, "loss": 0.4886, "step": 2861 }, { "epoch": 0.26405258909007034, "grad_norm": 1.6611065077938427, "learning_rate": 1.0863134929782626e-06, "loss": 0.8357, "step": 2862 }, { "epoch": 0.26414485065159726, "grad_norm": 1.5424880746667047, "learning_rate": 1.0861865316872506e-06, "loss": 0.7578, "step": 2863 }, { "epoch": 0.2642371122131242, "grad_norm": 1.5086276870700677, "learning_rate": 1.0860595286027893e-06, "loss": 0.6162, "step": 2864 }, { "epoch": 0.26432937377465116, "grad_norm": 1.7995003060467978, "learning_rate": 1.0859324837363878e-06, "loss": 0.7894, "step": 2865 }, { "epoch": 0.26432937377465116, "eval_GEN Loss": 0.4730812609195709, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.42739221453666687, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9325721263885498, "eval_runtime": 55.8967, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2865 }, { "epoch": 0.2644216353361781, "grad_norm": 2.2670008145067673, "learning_rate": 1.085805397099559e-06, "loss": 0.7332, "step": 2866 }, { "epoch": 0.264513896897705, "grad_norm": 1.9072589631028012, "learning_rate": 1.08567826870382e-06, "loss": 0.6485, "step": 2867 }, { "epoch": 0.2646061584592319, "grad_norm": 1.600773972719319, "learning_rate": 1.0855510985606912e-06, "loss": 0.6992, "step": 2868 }, { "epoch": 0.26469842002075883, "grad_norm": 2.2154277191973315, "learning_rate": 1.0854238866816966e-06, "loss": 0.6674, "step": 2869 }, { "epoch": 0.2647906815822858, "grad_norm": 2.246468231463725, "learning_rate": 1.085296633078365e-06, "loss": 0.7329, "step": 2870 }, { "epoch": 0.2647906815822858, "eval_GEN Loss": 0.47351667284965515, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.41970211267471313, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.931370198726654, "eval_runtime": 55.7497, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 2870 }, { "epoch": 0.2648829431438127, "grad_norm": 2.0524643362930917, "learning_rate": 1.0851693377622276e-06, "loss": 0.765, "step": 2871 }, { "epoch": 0.26497520470533964, "grad_norm": 1.6777409247684603, "learning_rate": 1.085042000744821e-06, "loss": 0.7887, "step": 2872 }, { "epoch": 0.26506746626686656, "grad_norm": 2.9044502055453307, "learning_rate": 1.084914622037684e-06, "loss": 0.9233, "step": 2873 }, { "epoch": 0.2651597278283935, "grad_norm": 1.851984411139579, "learning_rate": 1.0847872016523598e-06, "loss": 0.6793, "step": 2874 }, { "epoch": 0.26525198938992045, "grad_norm": 1.7689138325551346, "learning_rate": 1.084659739600396e-06, "loss": 0.8068, "step": 2875 }, { "epoch": 0.26525198938992045, "eval_GEN Loss": 0.47261348366737366, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.41723376512527466, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9238581657409668, "eval_runtime": 56.662, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 2875 }, { "epoch": 0.26534425095144737, "grad_norm": 2.518988655945643, "learning_rate": 1.0845322358933429e-06, "loss": 0.8823, "step": 2876 }, { "epoch": 0.2654365125129743, "grad_norm": 1.6922890281696157, "learning_rate": 1.0844046905427552e-06, "loss": 0.6131, "step": 2877 }, { "epoch": 0.2655287740745012, "grad_norm": 1.5298582902353595, "learning_rate": 1.0842771035601916e-06, "loss": 0.5772, "step": 2878 }, { "epoch": 0.2656210356360281, "grad_norm": 2.140596771900157, "learning_rate": 1.0841494749572135e-06, "loss": 0.7481, "step": 2879 }, { "epoch": 0.26571329719755504, "grad_norm": 1.4039039760746899, "learning_rate": 1.0840218047453877e-06, "loss": 0.6066, "step": 2880 }, { "epoch": 0.26571329719755504, "eval_GEN Loss": 0.4720955193042755, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.38698023557662964, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9079927802085876, "eval_runtime": 56.5785, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 2880 }, { "epoch": 0.265805558759082, "grad_norm": 1.734679531546747, "learning_rate": 1.0838940929362832e-06, "loss": 0.7649, "step": 2881 }, { "epoch": 0.26589782032060894, "grad_norm": 1.4436070519957807, "learning_rate": 1.0837663395414737e-06, "loss": 0.5511, "step": 2882 }, { "epoch": 0.26599008188213585, "grad_norm": 1.5306854758668027, "learning_rate": 1.0836385445725366e-06, "loss": 0.8169, "step": 2883 }, { "epoch": 0.26608234344366277, "grad_norm": 2.209621320462489, "learning_rate": 1.0835107080410525e-06, "loss": 0.7476, "step": 2884 }, { "epoch": 0.2661746050051897, "grad_norm": 2.333483988165698, "learning_rate": 1.0833828299586064e-06, "loss": 0.8471, "step": 2885 }, { "epoch": 0.2661746050051897, "eval_GEN Loss": 0.4727107882499695, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37869298458099365, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9090144038200378, "eval_runtime": 56.8512, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2885 }, { "epoch": 0.26626686656671666, "grad_norm": 3.621223958701815, "learning_rate": 1.0832549103367868e-06, "loss": 0.9463, "step": 2886 }, { "epoch": 0.2663591281282436, "grad_norm": 2.5282885683733642, "learning_rate": 1.083126949187186e-06, "loss": 0.7999, "step": 2887 }, { "epoch": 0.2664513896897705, "grad_norm": 1.9973503048168053, "learning_rate": 1.0829989465213996e-06, "loss": 0.6615, "step": 2888 }, { "epoch": 0.2665436512512974, "grad_norm": 1.758681115083525, "learning_rate": 1.0828709023510282e-06, "loss": 0.7291, "step": 2889 }, { "epoch": 0.26663591281282434, "grad_norm": 1.7853998571874048, "learning_rate": 1.0827428166876746e-06, "loss": 0.7475, "step": 2890 }, { "epoch": 0.26663591281282434, "eval_GEN Loss": 0.4736158549785614, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3929135203361511, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9142428040504456, "eval_runtime": 56.6963, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2890 }, { "epoch": 0.2667281743743513, "grad_norm": 2.0202502120712547, "learning_rate": 1.0826146895429465e-06, "loss": 0.7987, "step": 2891 }, { "epoch": 0.26682043593587823, "grad_norm": 2.0584889741402552, "learning_rate": 1.082486520928455e-06, "loss": 0.7831, "step": 2892 }, { "epoch": 0.26691269749740515, "grad_norm": 1.7347886982583645, "learning_rate": 1.082358310855815e-06, "loss": 0.659, "step": 2893 }, { "epoch": 0.26700495905893207, "grad_norm": 2.2671950749564704, "learning_rate": 1.0822300593366446e-06, "loss": 0.87, "step": 2894 }, { "epoch": 0.267097220620459, "grad_norm": 1.6796338733481695, "learning_rate": 1.082101766382567e-06, "loss": 0.6606, "step": 2895 }, { "epoch": 0.267097220620459, "eval_GEN Loss": 0.4737313985824585, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4053592085838318, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9170072078704834, "eval_runtime": 56.834, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2895 }, { "epoch": 0.2671894821819859, "grad_norm": 1.8186297016083144, "learning_rate": 1.0819734320052077e-06, "loss": 0.6944, "step": 2896 }, { "epoch": 0.2672817437435129, "grad_norm": 2.2232199693453305, "learning_rate": 1.0818450562161966e-06, "loss": 0.7168, "step": 2897 }, { "epoch": 0.2673740053050398, "grad_norm": 2.4038255462991507, "learning_rate": 1.0817166390271674e-06, "loss": 0.7652, "step": 2898 }, { "epoch": 0.2674662668665667, "grad_norm": 1.9710086581823223, "learning_rate": 1.0815881804497576e-06, "loss": 0.823, "step": 2899 }, { "epoch": 0.26755852842809363, "grad_norm": 1.4910994291652362, "learning_rate": 1.081459680495608e-06, "loss": 0.7373, "step": 2900 }, { "epoch": 0.26755852842809363, "eval_GEN Loss": 0.47203004360198975, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.410864919424057, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9215144515037537, "eval_runtime": 56.7335, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 2900 }, { "epoch": 0.26765078998962055, "grad_norm": 2.1131906187932836, "learning_rate": 1.081331139176364e-06, "loss": 0.6806, "step": 2901 }, { "epoch": 0.2677430515511475, "grad_norm": 2.7948668407010326, "learning_rate": 1.0812025565036738e-06, "loss": 0.8329, "step": 2902 }, { "epoch": 0.26783531311267444, "grad_norm": 2.6533122459357092, "learning_rate": 1.0810739324891897e-06, "loss": 0.7192, "step": 2903 }, { "epoch": 0.26792757467420136, "grad_norm": 2.0983627377891305, "learning_rate": 1.080945267144568e-06, "loss": 0.7468, "step": 2904 }, { "epoch": 0.2680198362357283, "grad_norm": 3.007420205172924, "learning_rate": 1.0808165604814686e-06, "loss": 1.0453, "step": 2905 }, { "epoch": 0.2680198362357283, "eval_GEN Loss": 0.47039514780044556, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.4074372351169586, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9245192408561707, "eval_runtime": 56.786, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 2905 }, { "epoch": 0.2681120977972552, "grad_norm": 1.5998505247895043, "learning_rate": 1.0806878125115549e-06, "loss": 0.6214, "step": 2906 }, { "epoch": 0.2682043593587822, "grad_norm": 1.7106725387046147, "learning_rate": 1.0805590232464944e-06, "loss": 0.7344, "step": 2907 }, { "epoch": 0.2682966209203091, "grad_norm": 1.9177576355349442, "learning_rate": 1.0804301926979584e-06, "loss": 0.6649, "step": 2908 }, { "epoch": 0.268388882481836, "grad_norm": 1.3196856273651647, "learning_rate": 1.0803013208776212e-06, "loss": 0.6409, "step": 2909 }, { "epoch": 0.26848114404336293, "grad_norm": 1.9568369630543458, "learning_rate": 1.0801724077971618e-06, "loss": 0.8207, "step": 2910 }, { "epoch": 0.26848114404336293, "eval_GEN Loss": 0.4692898094654083, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3971266746520996, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9300480484962463, "eval_runtime": 56.8504, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2910 }, { "epoch": 0.26857340560488985, "grad_norm": 2.3157908592391068, "learning_rate": 1.0800434534682623e-06, "loss": 0.8243, "step": 2911 }, { "epoch": 0.26866566716641677, "grad_norm": 1.613711002272769, "learning_rate": 1.0799144579026087e-06, "loss": 0.6867, "step": 2912 }, { "epoch": 0.26875792872794374, "grad_norm": 2.4738510202088015, "learning_rate": 1.0797854211118911e-06, "loss": 0.7694, "step": 2913 }, { "epoch": 0.26885019028947066, "grad_norm": 2.2261598878042395, "learning_rate": 1.0796563431078027e-06, "loss": 0.8152, "step": 2914 }, { "epoch": 0.2689424518509976, "grad_norm": 1.761019883546548, "learning_rate": 1.0795272239020407e-06, "loss": 0.8802, "step": 2915 }, { "epoch": 0.2689424518509976, "eval_GEN Loss": 0.46886858344078064, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.39003583788871765, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9323918223381042, "eval_runtime": 56.6345, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 2915 }, { "epoch": 0.2690347134125245, "grad_norm": 2.6407705364832723, "learning_rate": 1.0793980635063064e-06, "loss": 0.8825, "step": 2916 }, { "epoch": 0.2691269749740514, "grad_norm": 1.7562121403030946, "learning_rate": 1.0792688619323042e-06, "loss": 0.7568, "step": 2917 }, { "epoch": 0.2692192365355784, "grad_norm": 1.8160496091454899, "learning_rate": 1.0791396191917429e-06, "loss": 0.747, "step": 2918 }, { "epoch": 0.2693114980971053, "grad_norm": 1.4703350220943332, "learning_rate": 1.0790103352963343e-06, "loss": 0.687, "step": 2919 }, { "epoch": 0.2694037596586322, "grad_norm": 2.53177968868352, "learning_rate": 1.0788810102577946e-06, "loss": 0.6893, "step": 2920 }, { "epoch": 0.2694037596586322, "eval_GEN Loss": 0.4682959020137787, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.39357900619506836, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9245192408561707, "eval_runtime": 56.8544, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 2920 }, { "epoch": 0.26949602122015914, "grad_norm": 1.8516885475416047, "learning_rate": 1.0787516440878435e-06, "loss": 0.7163, "step": 2921 }, { "epoch": 0.26958828278168606, "grad_norm": 2.1160565704273266, "learning_rate": 1.0786222367982037e-06, "loss": 0.8189, "step": 2922 }, { "epoch": 0.26968054434321304, "grad_norm": 1.9040697952784618, "learning_rate": 1.0784927884006032e-06, "loss": 0.7959, "step": 2923 }, { "epoch": 0.26977280590473995, "grad_norm": 1.4444408649716918, "learning_rate": 1.0783632989067725e-06, "loss": 0.6232, "step": 2924 }, { "epoch": 0.2698650674662669, "grad_norm": 1.3227319492381608, "learning_rate": 1.0782337683284457e-06, "loss": 0.5944, "step": 2925 }, { "epoch": 0.2698650674662669, "eval_GEN Loss": 0.4667108356952667, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.4003351628780365, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9219951629638672, "eval_runtime": 56.8948, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 2925 }, { "epoch": 0.2699573290277938, "grad_norm": 1.901285890344741, "learning_rate": 1.0781041966773615e-06, "loss": 0.8238, "step": 2926 }, { "epoch": 0.2700495905893207, "grad_norm": 1.880259543140357, "learning_rate": 1.077974583965262e-06, "loss": 0.8227, "step": 2927 }, { "epoch": 0.27014185215084763, "grad_norm": 1.6942444576860036, "learning_rate": 1.0778449302038925e-06, "loss": 0.8278, "step": 2928 }, { "epoch": 0.2702341137123746, "grad_norm": 1.7801397377465484, "learning_rate": 1.0777152354050026e-06, "loss": 0.6676, "step": 2929 }, { "epoch": 0.2703263752739015, "grad_norm": 2.2657342008091192, "learning_rate": 1.0775854995803456e-06, "loss": 0.7701, "step": 2930 }, { "epoch": 0.2703263752739015, "eval_GEN Loss": 0.4680368900299072, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.4020960330963135, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9251803159713745, "eval_runtime": 55.9556, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2930 }, { "epoch": 0.27041863683542844, "grad_norm": 1.6407330308061099, "learning_rate": 1.0774557227416783e-06, "loss": 0.5789, "step": 2931 }, { "epoch": 0.27051089839695536, "grad_norm": 1.6021232520345274, "learning_rate": 1.077325904900761e-06, "loss": 0.6688, "step": 2932 }, { "epoch": 0.2706031599584823, "grad_norm": 1.479719404476177, "learning_rate": 1.0771960460693588e-06, "loss": 0.7653, "step": 2933 }, { "epoch": 0.27069542152000925, "grad_norm": 1.4609981980198374, "learning_rate": 1.0770661462592385e-06, "loss": 0.6051, "step": 2934 }, { "epoch": 0.27078768308153617, "grad_norm": 1.0992705582228601, "learning_rate": 1.0769362054821728e-06, "loss": 0.5368, "step": 2935 }, { "epoch": 0.27078768308153617, "eval_GEN Loss": 0.4699912965297699, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.4076942801475525, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9277043342590332, "eval_runtime": 55.7894, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 2935 }, { "epoch": 0.2708799446430631, "grad_norm": 1.4378030605591086, "learning_rate": 1.0768062237499365e-06, "loss": 0.729, "step": 2936 }, { "epoch": 0.27097220620459, "grad_norm": 1.6161195381033198, "learning_rate": 1.0766762010743093e-06, "loss": 0.5311, "step": 2937 }, { "epoch": 0.2710644677661169, "grad_norm": 1.7086682571920622, "learning_rate": 1.0765461374670738e-06, "loss": 0.8596, "step": 2938 }, { "epoch": 0.2711567293276439, "grad_norm": 2.069676595962534, "learning_rate": 1.0764160329400167e-06, "loss": 0.5081, "step": 2939 }, { "epoch": 0.2712489908891708, "grad_norm": 1.7704229224283745, "learning_rate": 1.076285887504928e-06, "loss": 0.84, "step": 2940 }, { "epoch": 0.2712489908891708, "eval_GEN Loss": 0.47121885418891907, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.4136001765727997, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9354567527770996, "eval_runtime": 56.1669, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 2940 }, { "epoch": 0.27134125245069773, "grad_norm": 2.1653525888719827, "learning_rate": 1.0761557011736018e-06, "loss": 0.6645, "step": 2941 }, { "epoch": 0.27143351401222465, "grad_norm": 2.854016505791687, "learning_rate": 1.0760254739578358e-06, "loss": 0.9773, "step": 2942 }, { "epoch": 0.27152577557375157, "grad_norm": 1.657128474618374, "learning_rate": 1.0758952058694313e-06, "loss": 0.7026, "step": 2943 }, { "epoch": 0.2716180371352785, "grad_norm": 1.915486511031709, "learning_rate": 1.075764896920194e-06, "loss": 0.8005, "step": 2944 }, { "epoch": 0.27171029869680546, "grad_norm": 2.2045174048833958, "learning_rate": 1.0756345471219319e-06, "loss": 0.8616, "step": 2945 }, { "epoch": 0.27171029869680546, "eval_GEN Loss": 0.4716050326824188, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.4085181653499603, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9379807710647583, "eval_runtime": 55.8446, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 2945 }, { "epoch": 0.2718025602583324, "grad_norm": 1.9954431213998831, "learning_rate": 1.0755041564864577e-06, "loss": 0.678, "step": 2946 }, { "epoch": 0.2718948218198593, "grad_norm": 1.985754389146779, "learning_rate": 1.075373725025588e-06, "loss": 0.7281, "step": 2947 }, { "epoch": 0.2719870833813862, "grad_norm": 2.7574089347205066, "learning_rate": 1.0752432527511421e-06, "loss": 0.8584, "step": 2948 }, { "epoch": 0.27207934494291314, "grad_norm": 2.2764212700991937, "learning_rate": 1.0751127396749445e-06, "loss": 0.7423, "step": 2949 }, { "epoch": 0.2721716065044401, "grad_norm": 1.6483397800493493, "learning_rate": 1.0749821858088215e-06, "loss": 0.7096, "step": 2950 }, { "epoch": 0.2721716065044401, "eval_GEN Loss": 0.4714268743991852, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.4028923511505127, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9395432472229004, "eval_runtime": 55.8972, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 2950 }, { "epoch": 0.27226386806596703, "grad_norm": 2.456810661767572, "learning_rate": 1.0748515911646047e-06, "loss": 0.8599, "step": 2951 }, { "epoch": 0.27235612962749395, "grad_norm": 1.614728262049482, "learning_rate": 1.0747209557541286e-06, "loss": 0.5507, "step": 2952 }, { "epoch": 0.27244839118902087, "grad_norm": 2.3540574691967384, "learning_rate": 1.0745902795892315e-06, "loss": 0.7493, "step": 2953 }, { "epoch": 0.2725406527505478, "grad_norm": 2.230432170743013, "learning_rate": 1.0744595626817557e-06, "loss": 0.763, "step": 2954 }, { "epoch": 0.27263291431207476, "grad_norm": 2.2265999218489303, "learning_rate": 1.074328805043547e-06, "loss": 0.7823, "step": 2955 }, { "epoch": 0.27263291431207476, "eval_GEN Loss": 0.470962792634964, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.40174680948257446, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9305288195610046, "eval_runtime": 56.1549, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 2955 }, { "epoch": 0.2727251758736017, "grad_norm": 1.8371295485989962, "learning_rate": 1.0741980066864545e-06, "loss": 0.6203, "step": 2956 }, { "epoch": 0.2728174374351286, "grad_norm": 2.1076505355641943, "learning_rate": 1.0740671676223319e-06, "loss": 0.8231, "step": 2957 }, { "epoch": 0.2729096989966555, "grad_norm": 1.6193518676565852, "learning_rate": 1.0739362878630355e-06, "loss": 0.5592, "step": 2958 }, { "epoch": 0.27300196055818243, "grad_norm": 1.6979882137639126, "learning_rate": 1.073805367420426e-06, "loss": 0.6869, "step": 2959 }, { "epoch": 0.27309422211970935, "grad_norm": 1.3944447627316257, "learning_rate": 1.073674406306368e-06, "loss": 0.517, "step": 2960 }, { "epoch": 0.27309422211970935, "eval_GEN Loss": 0.4710898995399475, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3922373950481415, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9268028736114502, "eval_runtime": 56.0061, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 2960 }, { "epoch": 0.2731864836812363, "grad_norm": 2.980974654172515, "learning_rate": 1.0735434045327287e-06, "loss": 0.7722, "step": 2961 }, { "epoch": 0.27327874524276324, "grad_norm": 1.8456992095491502, "learning_rate": 1.07341236211138e-06, "loss": 0.7864, "step": 2962 }, { "epoch": 0.27337100680429016, "grad_norm": 1.8784025473858066, "learning_rate": 1.0732812790541977e-06, "loss": 0.721, "step": 2963 }, { "epoch": 0.2734632683658171, "grad_norm": 2.066693689693836, "learning_rate": 1.07315015537306e-06, "loss": 0.8374, "step": 2964 }, { "epoch": 0.273555529927344, "grad_norm": 1.7295788004467523, "learning_rate": 1.0730189910798497e-06, "loss": 0.446, "step": 2965 }, { "epoch": 0.273555529927344, "eval_GEN Loss": 0.4710273742675781, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3842709958553314, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9241586327552795, "eval_runtime": 55.947, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 2965 }, { "epoch": 0.273647791488871, "grad_norm": 1.9123825715438492, "learning_rate": 1.0728877861864534e-06, "loss": 0.8068, "step": 2966 }, { "epoch": 0.2737400530503979, "grad_norm": 2.253684877950857, "learning_rate": 1.072756540704761e-06, "loss": 0.7399, "step": 2967 }, { "epoch": 0.2738323146119248, "grad_norm": 2.3267420812374087, "learning_rate": 1.0726252546466659e-06, "loss": 0.6644, "step": 2968 }, { "epoch": 0.27392457617345173, "grad_norm": 2.1594839660895744, "learning_rate": 1.072493928024066e-06, "loss": 0.9195, "step": 2969 }, { "epoch": 0.27401683773497865, "grad_norm": 1.615247046523298, "learning_rate": 1.0723625608488617e-06, "loss": 0.6362, "step": 2970 }, { "epoch": 0.27401683773497865, "eval_GEN Loss": 0.4714062213897705, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9146341463414634, "eval_PRM F1 AUC": 0.8213724463069669, "eval_PRM F1 Neg": 0.7083333333333334, "eval_PRM Loss": 0.3864392936229706, "eval_PRM NPV": 0.68, "eval_PRM Precision": 0.9259259259259259, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9131009578704834, "eval_runtime": 56.0699, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 2970 }, { "epoch": 0.2741090992965056, "grad_norm": 3.6703664972373864, "learning_rate": 1.072231153132958e-06, "loss": 1.1565, "step": 2971 }, { "epoch": 0.27420136085803254, "grad_norm": 1.665237552315827, "learning_rate": 1.0720997048882632e-06, "loss": 0.5983, "step": 2972 }, { "epoch": 0.27429362241955946, "grad_norm": 3.053703069908747, "learning_rate": 1.0719682161266894e-06, "loss": 0.5336, "step": 2973 }, { "epoch": 0.2743858839810864, "grad_norm": 1.7050088474819154, "learning_rate": 1.0718366868601526e-06, "loss": 0.8571, "step": 2974 }, { "epoch": 0.2744781455426133, "grad_norm": 1.8257498753652626, "learning_rate": 1.0717051171005715e-06, "loss": 0.8708, "step": 2975 }, { "epoch": 0.2744781455426133, "eval_GEN Loss": 0.4726153016090393, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.41426679491996765, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.915745198726654, "eval_runtime": 56.6605, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 2975 }, { "epoch": 0.2745704071041402, "grad_norm": 2.0781769843727673, "learning_rate": 1.0715735068598698e-06, "loss": 0.9534, "step": 2976 }, { "epoch": 0.2746626686656672, "grad_norm": 1.3498716611053658, "learning_rate": 1.071441856149974e-06, "loss": 0.6658, "step": 2977 }, { "epoch": 0.2747549302271941, "grad_norm": 2.3352739141914896, "learning_rate": 1.0713101649828143e-06, "loss": 0.8961, "step": 2978 }, { "epoch": 0.274847191788721, "grad_norm": 1.893398868696727, "learning_rate": 1.0711784333703252e-06, "loss": 0.827, "step": 2979 }, { "epoch": 0.27493945335024794, "grad_norm": 2.4254582277827876, "learning_rate": 1.071046661324444e-06, "loss": 0.7849, "step": 2980 }, { "epoch": 0.27493945335024794, "eval_GEN Loss": 0.47261038422584534, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4217749238014221, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9133413434028625, "eval_runtime": 56.6778, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 2980 }, { "epoch": 0.27503171491177486, "grad_norm": 2.051485330504249, "learning_rate": 1.0709148488571123e-06, "loss": 0.6959, "step": 2981 }, { "epoch": 0.27512397647330183, "grad_norm": 1.8124372530176573, "learning_rate": 1.070782995980275e-06, "loss": 0.6654, "step": 2982 }, { "epoch": 0.27521623803482875, "grad_norm": 1.789274532211207, "learning_rate": 1.070651102705881e-06, "loss": 0.8282, "step": 2983 }, { "epoch": 0.27530849959635567, "grad_norm": 2.4247167739441218, "learning_rate": 1.0705191690458826e-06, "loss": 0.6691, "step": 2984 }, { "epoch": 0.2754007611578826, "grad_norm": 1.9362840055640174, "learning_rate": 1.0703871950122362e-06, "loss": 0.7744, "step": 2985 }, { "epoch": 0.2754007611578826, "eval_GEN Loss": 0.4706338346004486, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.4156058728694916, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9146634340286255, "eval_runtime": 56.5735, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 2985 }, { "epoch": 0.2754930227194095, "grad_norm": 1.7661738455074483, "learning_rate": 1.0702551806169009e-06, "loss": 0.6302, "step": 2986 }, { "epoch": 0.2755852842809365, "grad_norm": 2.179368130907011, "learning_rate": 1.07012312587184e-06, "loss": 0.826, "step": 2987 }, { "epoch": 0.2756775458424634, "grad_norm": 1.3227171925333114, "learning_rate": 1.0699910307890213e-06, "loss": 0.5974, "step": 2988 }, { "epoch": 0.2757698074039903, "grad_norm": 1.5215068251231954, "learning_rate": 1.0698588953804146e-06, "loss": 0.7154, "step": 2989 }, { "epoch": 0.27586206896551724, "grad_norm": 1.8611650992188542, "learning_rate": 1.0697267196579946e-06, "loss": 0.7443, "step": 2990 }, { "epoch": 0.27586206896551724, "eval_GEN Loss": 0.4698081314563751, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3971595764160156, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9191105961799622, "eval_runtime": 56.8346, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 2990 }, { "epoch": 0.27595433052704416, "grad_norm": 1.5731395456884663, "learning_rate": 1.0695945036337394e-06, "loss": 0.5874, "step": 2991 }, { "epoch": 0.2760465920885711, "grad_norm": 1.8458591760521923, "learning_rate": 1.0694622473196303e-06, "loss": 0.8392, "step": 2992 }, { "epoch": 0.27613885365009805, "grad_norm": 1.5301326642721071, "learning_rate": 1.069329950727653e-06, "loss": 0.7545, "step": 2993 }, { "epoch": 0.27623111521162497, "grad_norm": 1.4687202099750942, "learning_rate": 1.0691976138697959e-06, "loss": 0.7071, "step": 2994 }, { "epoch": 0.2763233767731519, "grad_norm": 1.6107935879435766, "learning_rate": 1.069065236758052e-06, "loss": 0.5573, "step": 2995 }, { "epoch": 0.2763233767731519, "eval_GEN Loss": 0.47077441215515137, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3876074254512787, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9328725934028625, "eval_runtime": 56.6805, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 2995 }, { "epoch": 0.2764156383346788, "grad_norm": 3.191370588523095, "learning_rate": 1.0689328194044176e-06, "loss": 0.8169, "step": 2996 }, { "epoch": 0.2765078998962057, "grad_norm": 1.2001886420614896, "learning_rate": 1.0688003618208922e-06, "loss": 0.5587, "step": 2997 }, { "epoch": 0.2766001614577327, "grad_norm": 2.323862866865989, "learning_rate": 1.0686678640194791e-06, "loss": 0.7312, "step": 2998 }, { "epoch": 0.2766924230192596, "grad_norm": 2.321497592497748, "learning_rate": 1.068535326012186e-06, "loss": 0.8557, "step": 2999 }, { "epoch": 0.27678468458078653, "grad_norm": 2.0297776260028892, "learning_rate": 1.0684027478110238e-06, "loss": 0.7923, "step": 3000 }, { "epoch": 0.27678468458078653, "eval_GEN Loss": 0.47090959548950195, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.38966938853263855, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9231970906257629, "eval_runtime": 56.8399, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3000 }, { "epoch": 0.27687694614231345, "grad_norm": 1.6618185518380078, "learning_rate": 1.0682701294280066e-06, "loss": 0.7444, "step": 3001 }, { "epoch": 0.27696920770384037, "grad_norm": 2.476708643456072, "learning_rate": 1.0681374708751525e-06, "loss": 0.901, "step": 3002 }, { "epoch": 0.27706146926536734, "grad_norm": 1.6390607184185797, "learning_rate": 1.0680047721644831e-06, "loss": 0.6479, "step": 3003 }, { "epoch": 0.27715373082689426, "grad_norm": 1.2077098188787156, "learning_rate": 1.0678720333080242e-06, "loss": 0.6578, "step": 3004 }, { "epoch": 0.2772459923884212, "grad_norm": 2.095117818126065, "learning_rate": 1.0677392543178045e-06, "loss": 0.8181, "step": 3005 }, { "epoch": 0.2772459923884212, "eval_GEN Loss": 0.47230812907218933, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.4182332158088684, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9130408763885498, "eval_runtime": 55.9194, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3005 }, { "epoch": 0.2773382539499481, "grad_norm": 2.6604775050617984, "learning_rate": 1.0676064352058566e-06, "loss": 0.6083, "step": 3006 }, { "epoch": 0.277430515511475, "grad_norm": 1.3858070793868345, "learning_rate": 1.0674735759842166e-06, "loss": 0.5896, "step": 3007 }, { "epoch": 0.27752277707300194, "grad_norm": 3.880363472013846, "learning_rate": 1.0673406766649252e-06, "loss": 0.8189, "step": 3008 }, { "epoch": 0.2776150386345289, "grad_norm": 2.310164277193226, "learning_rate": 1.067207737260025e-06, "loss": 0.7813, "step": 3009 }, { "epoch": 0.27770730019605583, "grad_norm": 2.441424253660931, "learning_rate": 1.067074757781564e-06, "loss": 0.7209, "step": 3010 }, { "epoch": 0.27770730019605583, "eval_GEN Loss": 0.4707789719104767, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.40797895193099976, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9105167984962463, "eval_runtime": 55.7052, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3010 }, { "epoch": 0.27779956175758275, "grad_norm": 1.7815883948680813, "learning_rate": 1.0669417382415923e-06, "loss": 0.7369, "step": 3011 }, { "epoch": 0.27789182331910967, "grad_norm": 1.5110397906159032, "learning_rate": 1.0668086786521648e-06, "loss": 0.6315, "step": 3012 }, { "epoch": 0.2779840848806366, "grad_norm": 1.9341888127529423, "learning_rate": 1.0666755790253393e-06, "loss": 0.6519, "step": 3013 }, { "epoch": 0.27807634644216356, "grad_norm": 1.9835501065707783, "learning_rate": 1.0665424393731777e-06, "loss": 0.7808, "step": 3014 }, { "epoch": 0.2781686080036905, "grad_norm": 2.3280147083623075, "learning_rate": 1.0664092597077455e-06, "loss": 0.8808, "step": 3015 }, { "epoch": 0.2781686080036905, "eval_GEN Loss": 0.4707986116409302, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.38820645213127136, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9114783406257629, "eval_runtime": 56.7691, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3015 }, { "epoch": 0.2782608695652174, "grad_norm": 2.8357232108307215, "learning_rate": 1.066276040041111e-06, "loss": 0.861, "step": 3016 }, { "epoch": 0.2783531311267443, "grad_norm": 1.8295674414500154, "learning_rate": 1.0661427803853473e-06, "loss": 0.6751, "step": 3017 }, { "epoch": 0.27844539268827123, "grad_norm": 2.2622370843638877, "learning_rate": 1.0660094807525305e-06, "loss": 0.7406, "step": 3018 }, { "epoch": 0.2785376542497982, "grad_norm": 2.195596812019375, "learning_rate": 1.0658761411547404e-06, "loss": 0.7446, "step": 3019 }, { "epoch": 0.2786299158113251, "grad_norm": 1.621731708015415, "learning_rate": 1.0657427616040605e-06, "loss": 0.6217, "step": 3020 }, { "epoch": 0.2786299158113251, "eval_GEN Loss": 0.47051486372947693, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.4024726450443268, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9075720906257629, "eval_runtime": 56.7361, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3020 }, { "epoch": 0.27872217737285204, "grad_norm": 2.049016492117123, "learning_rate": 1.0656093421125777e-06, "loss": 0.8602, "step": 3021 }, { "epoch": 0.27881443893437896, "grad_norm": 2.0497393145955685, "learning_rate": 1.0654758826923827e-06, "loss": 0.7315, "step": 3022 }, { "epoch": 0.2789067004959059, "grad_norm": 2.122846118333475, "learning_rate": 1.0653423833555701e-06, "loss": 0.7259, "step": 3023 }, { "epoch": 0.2789989620574328, "grad_norm": 2.1648262068114836, "learning_rate": 1.0652088441142375e-06, "loss": 0.6142, "step": 3024 }, { "epoch": 0.27909122361895977, "grad_norm": 1.8756445899355763, "learning_rate": 1.0650752649804866e-06, "loss": 0.818, "step": 3025 }, { "epoch": 0.27909122361895977, "eval_GEN Loss": 0.4718669354915619, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3990402817726135, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9111778736114502, "eval_runtime": 55.7786, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3025 }, { "epoch": 0.2791834851804867, "grad_norm": 1.4974941619338655, "learning_rate": 1.0649416459664224e-06, "loss": 0.6817, "step": 3026 }, { "epoch": 0.2792757467420136, "grad_norm": 2.7454544109571524, "learning_rate": 1.064807987084154e-06, "loss": 0.7396, "step": 3027 }, { "epoch": 0.2793680083035405, "grad_norm": 1.5025185893054946, "learning_rate": 1.0646742883457932e-06, "loss": 0.6328, "step": 3028 }, { "epoch": 0.27946026986506745, "grad_norm": 1.691085999858614, "learning_rate": 1.0645405497634566e-06, "loss": 0.6876, "step": 3029 }, { "epoch": 0.2795525314265944, "grad_norm": 3.3312380732250904, "learning_rate": 1.0644067713492635e-06, "loss": 0.8739, "step": 3030 }, { "epoch": 0.2795525314265944, "eval_GEN Loss": 0.4710805118083954, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3732966184616089, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9143028855323792, "eval_runtime": 55.7757, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3030 }, { "epoch": 0.27964479298812134, "grad_norm": 1.8158589611092544, "learning_rate": 1.064272953115337e-06, "loss": 0.7647, "step": 3031 }, { "epoch": 0.27973705454964826, "grad_norm": 3.9458975882161513, "learning_rate": 1.064139095073804e-06, "loss": 1.2141, "step": 3032 }, { "epoch": 0.2798293161111752, "grad_norm": 2.5882358601325253, "learning_rate": 1.0640051972367955e-06, "loss": 0.6481, "step": 3033 }, { "epoch": 0.2799215776727021, "grad_norm": 1.9084181803913842, "learning_rate": 1.0638712596164445e-06, "loss": 0.6903, "step": 3034 }, { "epoch": 0.280013839234229, "grad_norm": 2.644414617579794, "learning_rate": 1.0637372822248892e-06, "loss": 0.9132, "step": 3035 }, { "epoch": 0.280013839234229, "eval_GEN Loss": 0.46965330839157104, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9047619047619048, "eval_PRM F1 AUC": 0.7621791513881613, "eval_PRM F1 Neg": 0.6363636363636364, "eval_PRM Loss": 0.36662760376930237, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.8941176470588236, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9252403974533081, "eval_runtime": 55.7503, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 3035 }, { "epoch": 0.280106100795756, "grad_norm": 1.9822324253651207, "learning_rate": 1.063603265074271e-06, "loss": 0.6281, "step": 3036 }, { "epoch": 0.2801983623572829, "grad_norm": 1.923125657012463, "learning_rate": 1.0634692081767344e-06, "loss": 0.7492, "step": 3037 }, { "epoch": 0.2802906239188098, "grad_norm": 2.3429376529638755, "learning_rate": 1.0633351115444281e-06, "loss": 0.8975, "step": 3038 }, { "epoch": 0.28038288548033674, "grad_norm": 2.050496352175447, "learning_rate": 1.063200975189504e-06, "loss": 0.5983, "step": 3039 }, { "epoch": 0.28047514704186366, "grad_norm": 2.4762319883475437, "learning_rate": 1.0630667991241178e-06, "loss": 1.0166, "step": 3040 }, { "epoch": 0.28047514704186366, "eval_GEN Loss": 0.46793049573898315, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3690236210823059, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9129807949066162, "eval_runtime": 56.4612, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 3040 }, { "epoch": 0.28056740860339063, "grad_norm": 2.302922509664043, "learning_rate": 1.0629325833604288e-06, "loss": 0.6984, "step": 3041 }, { "epoch": 0.28065967016491755, "grad_norm": 1.7904631579843462, "learning_rate": 1.0627983279105996e-06, "loss": 0.7855, "step": 3042 }, { "epoch": 0.28075193172644447, "grad_norm": 1.7484699054593347, "learning_rate": 1.062664032786797e-06, "loss": 0.6728, "step": 3043 }, { "epoch": 0.2808441932879714, "grad_norm": 2.1338057527343115, "learning_rate": 1.0625296980011909e-06, "loss": 0.8728, "step": 3044 }, { "epoch": 0.2809364548494983, "grad_norm": 1.4213221012684427, "learning_rate": 1.0623953235659547e-06, "loss": 0.6779, "step": 3045 }, { "epoch": 0.2809364548494983, "eval_GEN Loss": 0.4686720371246338, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.381797730922699, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9061899185180664, "eval_runtime": 56.9058, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3045 }, { "epoch": 0.2810287164110253, "grad_norm": 2.1135693186589215, "learning_rate": 1.0622609094932658e-06, "loss": 0.7909, "step": 3046 }, { "epoch": 0.2811209779725522, "grad_norm": 1.7274339732855157, "learning_rate": 1.0621264557953052e-06, "loss": 0.6717, "step": 3047 }, { "epoch": 0.2812132395340791, "grad_norm": 1.9125030429274472, "learning_rate": 1.061991962484257e-06, "loss": 0.6906, "step": 3048 }, { "epoch": 0.28130550109560604, "grad_norm": 2.144051575041993, "learning_rate": 1.0618574295723095e-06, "loss": 0.6694, "step": 3049 }, { "epoch": 0.28139776265713295, "grad_norm": 1.84832154181422, "learning_rate": 1.0617228570716538e-06, "loss": 0.5958, "step": 3050 }, { "epoch": 0.28139776265713295, "eval_GEN Loss": 0.4657774865627289, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.38704806566238403, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.900661051273346, "eval_runtime": 56.6353, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 3050 }, { "epoch": 0.2814900242186599, "grad_norm": 2.31598315278293, "learning_rate": 1.0615882449944856e-06, "loss": 0.7841, "step": 3051 }, { "epoch": 0.28158228578018685, "grad_norm": 2.1371664471350713, "learning_rate": 1.0614535933530033e-06, "loss": 0.7341, "step": 3052 }, { "epoch": 0.28167454734171377, "grad_norm": 2.4419606666641105, "learning_rate": 1.0613189021594096e-06, "loss": 0.9996, "step": 3053 }, { "epoch": 0.2817668089032407, "grad_norm": 2.1011073182541566, "learning_rate": 1.06118417142591e-06, "loss": 0.6853, "step": 3054 }, { "epoch": 0.2818590704647676, "grad_norm": 2.086353803274598, "learning_rate": 1.0610494011647143e-06, "loss": 0.6906, "step": 3055 }, { "epoch": 0.2818590704647676, "eval_GEN Loss": 0.4659087359905243, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3741576671600342, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9114783406257629, "eval_runtime": 56.863, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3055 }, { "epoch": 0.2819513320262945, "grad_norm": 2.871683684942679, "learning_rate": 1.0609145913880355e-06, "loss": 0.7057, "step": 3056 }, { "epoch": 0.2820435935878215, "grad_norm": 1.8595216782239863, "learning_rate": 1.0607797421080902e-06, "loss": 0.6267, "step": 3057 }, { "epoch": 0.2821358551493484, "grad_norm": 2.536029962732933, "learning_rate": 1.0606448533370988e-06, "loss": 0.7527, "step": 3058 }, { "epoch": 0.28222811671087533, "grad_norm": 1.487910259640829, "learning_rate": 1.0605099250872852e-06, "loss": 0.7512, "step": 3059 }, { "epoch": 0.28232037827240225, "grad_norm": 2.0658230844092147, "learning_rate": 1.0603749573708765e-06, "loss": 0.8208, "step": 3060 }, { "epoch": 0.28232037827240225, "eval_GEN Loss": 0.4652542173862457, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.375637412071228, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9095553159713745, "eval_runtime": 57.3191, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 3060 }, { "epoch": 0.28241263983392917, "grad_norm": 1.7626753024284254, "learning_rate": 1.060239950200104e-06, "loss": 0.8132, "step": 3061 }, { "epoch": 0.28250490139545614, "grad_norm": 1.451956880870587, "learning_rate": 1.0601049035872021e-06, "loss": 0.5288, "step": 3062 }, { "epoch": 0.28259716295698306, "grad_norm": 3.030208795825869, "learning_rate": 1.0599698175444092e-06, "loss": 0.7612, "step": 3063 }, { "epoch": 0.28268942451851, "grad_norm": 2.182971082205315, "learning_rate": 1.0598346920839664e-06, "loss": 0.6718, "step": 3064 }, { "epoch": 0.2827816860800369, "grad_norm": 1.7677658952444775, "learning_rate": 1.0596995272181195e-06, "loss": 0.7722, "step": 3065 }, { "epoch": 0.2827816860800369, "eval_GEN Loss": 0.46604636311531067, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.37874099612236023, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.907151460647583, "eval_runtime": 56.6518, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3065 }, { "epoch": 0.2828739476415638, "grad_norm": 2.2423082403953045, "learning_rate": 1.0595643229591174e-06, "loss": 0.675, "step": 3066 }, { "epoch": 0.28296620920309073, "grad_norm": 1.5534307236488345, "learning_rate": 1.059429079319212e-06, "loss": 0.6772, "step": 3067 }, { "epoch": 0.2830584707646177, "grad_norm": 1.9817521697600702, "learning_rate": 1.05929379631066e-06, "loss": 0.6152, "step": 3068 }, { "epoch": 0.2831507323261446, "grad_norm": 1.55341060271511, "learning_rate": 1.0591584739457203e-06, "loss": 0.7239, "step": 3069 }, { "epoch": 0.28324299388767155, "grad_norm": 2.2594796869473357, "learning_rate": 1.0590231122366565e-06, "loss": 0.7845, "step": 3070 }, { "epoch": 0.28324299388767155, "eval_GEN Loss": 0.4675382971763611, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3763037919998169, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9029446840286255, "eval_runtime": 56.8095, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3070 }, { "epoch": 0.28333525544919846, "grad_norm": 1.5711109656493212, "learning_rate": 1.0588877111957348e-06, "loss": 0.5559, "step": 3071 }, { "epoch": 0.2834275170107254, "grad_norm": 2.3612479186297133, "learning_rate": 1.0587522708352262e-06, "loss": 0.9523, "step": 3072 }, { "epoch": 0.28351977857225236, "grad_norm": 2.175565693130009, "learning_rate": 1.058616791167404e-06, "loss": 0.7909, "step": 3073 }, { "epoch": 0.2836120401337793, "grad_norm": 1.7017775914052056, "learning_rate": 1.0584812722045455e-06, "loss": 0.7176, "step": 3074 }, { "epoch": 0.2837043016953062, "grad_norm": 2.6788065268577643, "learning_rate": 1.0583457139589317e-06, "loss": 0.9553, "step": 3075 }, { "epoch": 0.2837043016953062, "eval_GEN Loss": 0.46606746315956116, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3762892484664917, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9116586446762085, "eval_runtime": 56.7424, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3075 }, { "epoch": 0.2837965632568331, "grad_norm": 2.914097442064055, "learning_rate": 1.0582101164428474e-06, "loss": 0.869, "step": 3076 }, { "epoch": 0.28388882481836003, "grad_norm": 2.88039190454395, "learning_rate": 1.0580744796685804e-06, "loss": 0.9041, "step": 3077 }, { "epoch": 0.283981086379887, "grad_norm": 2.363975874657006, "learning_rate": 1.0579388036484223e-06, "loss": 0.932, "step": 3078 }, { "epoch": 0.2840733479414139, "grad_norm": 2.0158679523647995, "learning_rate": 1.0578030883946685e-06, "loss": 0.7301, "step": 3079 }, { "epoch": 0.28416560950294084, "grad_norm": 1.8537815026079734, "learning_rate": 1.0576673339196176e-06, "loss": 0.8477, "step": 3080 }, { "epoch": 0.28416560950294084, "eval_GEN Loss": 0.46597346663475037, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3801872730255127, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8949519395828247, "eval_runtime": 56.6931, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3080 }, { "epoch": 0.28425787106446776, "grad_norm": 1.8994480286322213, "learning_rate": 1.0575315402355718e-06, "loss": 0.6243, "step": 3081 }, { "epoch": 0.2843501326259947, "grad_norm": 3.2779745014244988, "learning_rate": 1.057395707354837e-06, "loss": 1.0052, "step": 3082 }, { "epoch": 0.2844423941875216, "grad_norm": 2.492639473823188, "learning_rate": 1.0572598352897227e-06, "loss": 0.8754, "step": 3083 }, { "epoch": 0.28453465574904857, "grad_norm": 1.900689999724326, "learning_rate": 1.0571239240525414e-06, "loss": 0.7231, "step": 3084 }, { "epoch": 0.2846269173105755, "grad_norm": 2.2859324540427357, "learning_rate": 1.0569879736556102e-06, "loss": 0.859, "step": 3085 }, { "epoch": 0.2846269173105755, "eval_GEN Loss": 0.46712419390678406, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.4000728130340576, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8842548131942749, "eval_runtime": 56.7942, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3085 }, { "epoch": 0.2847191788721024, "grad_norm": 2.1509835400542827, "learning_rate": 1.056851984111249e-06, "loss": 0.8304, "step": 3086 }, { "epoch": 0.2848114404336293, "grad_norm": 2.1363475596955626, "learning_rate": 1.056715955431781e-06, "loss": 0.5765, "step": 3087 }, { "epoch": 0.28490370199515624, "grad_norm": 1.7308635146031295, "learning_rate": 1.0565798876295337e-06, "loss": 0.6607, "step": 3088 }, { "epoch": 0.2849959635566832, "grad_norm": 1.582608132372354, "learning_rate": 1.0564437807168376e-06, "loss": 0.8734, "step": 3089 }, { "epoch": 0.28508822511821014, "grad_norm": 1.4671379084193517, "learning_rate": 1.0563076347060273e-06, "loss": 0.6062, "step": 3090 }, { "epoch": 0.28508822511821014, "eval_GEN Loss": 0.4661886692047119, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.38512077927589417, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8808293342590332, "eval_runtime": 56.7829, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3090 }, { "epoch": 0.28518048667973706, "grad_norm": 1.7688010433446533, "learning_rate": 1.0561714496094398e-06, "loss": 0.727, "step": 3091 }, { "epoch": 0.285272748241264, "grad_norm": 1.8775239804600636, "learning_rate": 1.056035225439417e-06, "loss": 0.6714, "step": 3092 }, { "epoch": 0.2853650098027909, "grad_norm": 1.9746959633598722, "learning_rate": 1.0558989622083038e-06, "loss": 0.8284, "step": 3093 }, { "epoch": 0.28545727136431787, "grad_norm": 1.5507223235366274, "learning_rate": 1.0557626599284481e-06, "loss": 0.6109, "step": 3094 }, { "epoch": 0.2855495329258448, "grad_norm": 1.7766831703362023, "learning_rate": 1.0556263186122022e-06, "loss": 0.8638, "step": 3095 }, { "epoch": 0.2855495329258448, "eval_GEN Loss": 0.4653873145580292, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3613568842411041, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8912259340286255, "eval_runtime": 55.9366, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3095 }, { "epoch": 0.2856417944873717, "grad_norm": 1.7554203841913272, "learning_rate": 1.0554899382719217e-06, "loss": 0.7518, "step": 3096 }, { "epoch": 0.2857340560488986, "grad_norm": 1.6844967445903287, "learning_rate": 1.0553535189199655e-06, "loss": 0.7656, "step": 3097 }, { "epoch": 0.28582631761042554, "grad_norm": 2.089667784863428, "learning_rate": 1.0552170605686957e-06, "loss": 0.8665, "step": 3098 }, { "epoch": 0.28591857917195246, "grad_norm": 1.6438299141886128, "learning_rate": 1.055080563230479e-06, "loss": 0.6618, "step": 3099 }, { "epoch": 0.28601084073347943, "grad_norm": 1.6914329780792354, "learning_rate": 1.0549440269176843e-06, "loss": 0.654, "step": 3100 }, { "epoch": 0.28601084073347943, "eval_GEN Loss": 0.4667896032333374, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3566409647464752, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8939903974533081, "eval_runtime": 55.8686, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3100 }, { "epoch": 0.28610310229500635, "grad_norm": 1.5334234556289796, "learning_rate": 1.0548074516426855e-06, "loss": 0.6701, "step": 3101 }, { "epoch": 0.28619536385653327, "grad_norm": 1.6714199493367639, "learning_rate": 1.0546708374178585e-06, "loss": 0.7958, "step": 3102 }, { "epoch": 0.2862876254180602, "grad_norm": 1.6422071550644641, "learning_rate": 1.0545341842555843e-06, "loss": 0.7805, "step": 3103 }, { "epoch": 0.2863798869795871, "grad_norm": 1.9429238807507643, "learning_rate": 1.0543974921682462e-06, "loss": 0.6407, "step": 3104 }, { "epoch": 0.2864721485411141, "grad_norm": 1.8132138305768448, "learning_rate": 1.0542607611682312e-06, "loss": 0.6952, "step": 3105 }, { "epoch": 0.2864721485411141, "eval_GEN Loss": 0.465804785490036, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.35782474279403687, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8822115659713745, "eval_runtime": 55.9472, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3105 }, { "epoch": 0.286564410102641, "grad_norm": 2.124122330337371, "learning_rate": 1.0541239912679306e-06, "loss": 0.6771, "step": 3106 }, { "epoch": 0.2866566716641679, "grad_norm": 1.554192333664422, "learning_rate": 1.0539871824797384e-06, "loss": 0.7065, "step": 3107 }, { "epoch": 0.28674893322569484, "grad_norm": 1.629955964226237, "learning_rate": 1.0538503348160523e-06, "loss": 0.7569, "step": 3108 }, { "epoch": 0.28684119478722175, "grad_norm": 1.5532291249377288, "learning_rate": 1.053713448289274e-06, "loss": 0.6305, "step": 3109 }, { "epoch": 0.2869334563487487, "grad_norm": 2.141857916910032, "learning_rate": 1.0535765229118084e-06, "loss": 0.7892, "step": 3110 }, { "epoch": 0.2869334563487487, "eval_GEN Loss": 0.4660208523273468, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.36910420656204224, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8732572197914124, "eval_runtime": 55.8231, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3110 }, { "epoch": 0.28702571791027565, "grad_norm": 2.1212484068932773, "learning_rate": 1.0534395586960634e-06, "loss": 0.7813, "step": 3111 }, { "epoch": 0.28711797947180256, "grad_norm": 2.087905572005798, "learning_rate": 1.0533025556544513e-06, "loss": 0.8203, "step": 3112 }, { "epoch": 0.2872102410333295, "grad_norm": 1.812317216913645, "learning_rate": 1.0531655137993876e-06, "loss": 0.7788, "step": 3113 }, { "epoch": 0.2873025025948564, "grad_norm": 1.8474439368782816, "learning_rate": 1.0530284331432911e-06, "loss": 0.7616, "step": 3114 }, { "epoch": 0.2873947641563833, "grad_norm": 1.8675715485348674, "learning_rate": 1.0528913136985841e-06, "loss": 0.8438, "step": 3115 }, { "epoch": 0.2873947641563833, "eval_GEN Loss": 0.46344852447509766, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38797926902770996, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8698317408561707, "eval_runtime": 56.3747, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 3115 }, { "epoch": 0.2874870257179103, "grad_norm": 2.0242343361431367, "learning_rate": 1.0527541554776926e-06, "loss": 0.7094, "step": 3116 }, { "epoch": 0.2875792872794372, "grad_norm": 1.9460536316360604, "learning_rate": 1.0526169584930464e-06, "loss": 0.5945, "step": 3117 }, { "epoch": 0.28767154884096413, "grad_norm": 1.9319594951384043, "learning_rate": 1.0524797227570785e-06, "loss": 0.6974, "step": 3118 }, { "epoch": 0.28776381040249105, "grad_norm": 1.719496726115059, "learning_rate": 1.0523424482822251e-06, "loss": 0.7208, "step": 3119 }, { "epoch": 0.28785607196401797, "grad_norm": 2.424005694128972, "learning_rate": 1.0522051350809265e-06, "loss": 0.7763, "step": 3120 }, { "epoch": 0.28785607196401797, "eval_GEN Loss": 0.4616316556930542, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38041043281555176, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.870312511920929, "eval_runtime": 56.6768, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3120 }, { "epoch": 0.28794833352554494, "grad_norm": 1.4211401390054537, "learning_rate": 1.0520677831656258e-06, "loss": 0.8117, "step": 3121 }, { "epoch": 0.28804059508707186, "grad_norm": 1.7596771331547327, "learning_rate": 1.0519303925487708e-06, "loss": 0.5949, "step": 3122 }, { "epoch": 0.2881328566485988, "grad_norm": 2.363982976402196, "learning_rate": 1.0517929632428113e-06, "loss": 0.7793, "step": 3123 }, { "epoch": 0.2882251182101257, "grad_norm": 1.9629677355913673, "learning_rate": 1.051655495260202e-06, "loss": 0.9329, "step": 3124 }, { "epoch": 0.2883173797716526, "grad_norm": 2.2197297120392405, "learning_rate": 1.0515179886134e-06, "loss": 0.8808, "step": 3125 }, { "epoch": 0.2883173797716526, "eval_GEN Loss": 0.45907220244407654, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3719245195388794, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8778846263885498, "eval_runtime": 55.6551, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 3125 }, { "epoch": 0.2884096413331796, "grad_norm": 1.4296998827142253, "learning_rate": 1.0513804433148664e-06, "loss": 0.6082, "step": 3126 }, { "epoch": 0.2885019028947065, "grad_norm": 2.0088710776882372, "learning_rate": 1.0512428593770662e-06, "loss": 0.8761, "step": 3127 }, { "epoch": 0.2885941644562334, "grad_norm": 2.556149882217034, "learning_rate": 1.051105236812467e-06, "loss": 0.8749, "step": 3128 }, { "epoch": 0.28868642601776034, "grad_norm": 1.8383744387669663, "learning_rate": 1.0509675756335404e-06, "loss": 0.9021, "step": 3129 }, { "epoch": 0.28877868757928726, "grad_norm": 1.8068564555818132, "learning_rate": 1.0508298758527617e-06, "loss": 0.7847, "step": 3130 }, { "epoch": 0.28877868757928726, "eval_GEN Loss": 0.4589958190917969, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.369075745344162, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.892848551273346, "eval_runtime": 55.9093, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3130 }, { "epoch": 0.2888709491408142, "grad_norm": 1.7482976395088272, "learning_rate": 1.0506921374826094e-06, "loss": 0.7627, "step": 3131 }, { "epoch": 0.28896321070234116, "grad_norm": 1.8152660651430073, "learning_rate": 1.0505543605355656e-06, "loss": 0.6659, "step": 3132 }, { "epoch": 0.2890554722638681, "grad_norm": 3.3737528732931783, "learning_rate": 1.0504165450241158e-06, "loss": 0.833, "step": 3133 }, { "epoch": 0.289147733825395, "grad_norm": 1.942320949150712, "learning_rate": 1.050278690960749e-06, "loss": 0.6873, "step": 3134 }, { "epoch": 0.2892399953869219, "grad_norm": 2.2186790493947837, "learning_rate": 1.050140798357958e-06, "loss": 0.7874, "step": 3135 }, { "epoch": 0.2892399953869219, "eval_GEN Loss": 0.45963695645332336, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.36822742223739624, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8883413672447205, "eval_runtime": 55.8123, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3135 }, { "epoch": 0.28933225694844883, "grad_norm": 1.8656051278043004, "learning_rate": 1.0500028672282384e-06, "loss": 0.623, "step": 3136 }, { "epoch": 0.2894245185099758, "grad_norm": 1.8888042933587164, "learning_rate": 1.0498648975840901e-06, "loss": 0.6907, "step": 3137 }, { "epoch": 0.2895167800715027, "grad_norm": 1.2742909023044926, "learning_rate": 1.049726889438016e-06, "loss": 0.5956, "step": 3138 }, { "epoch": 0.28960904163302964, "grad_norm": 1.7209415378099318, "learning_rate": 1.049588842802523e-06, "loss": 0.6488, "step": 3139 }, { "epoch": 0.28970130319455656, "grad_norm": 1.5859824419279278, "learning_rate": 1.0494507576901206e-06, "loss": 0.5687, "step": 3140 }, { "epoch": 0.28970130319455656, "eval_GEN Loss": 0.46031397581100464, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3708396553993225, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8823317289352417, "eval_runtime": 55.804, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3140 }, { "epoch": 0.2897935647560835, "grad_norm": 1.4086078227801055, "learning_rate": 1.0493126341133221e-06, "loss": 0.6124, "step": 3141 }, { "epoch": 0.28988582631761045, "grad_norm": 1.3737896057678165, "learning_rate": 1.049174472084645e-06, "loss": 0.756, "step": 3142 }, { "epoch": 0.28997808787913737, "grad_norm": 1.4575605104274383, "learning_rate": 1.0490362716166097e-06, "loss": 0.6639, "step": 3143 }, { "epoch": 0.2900703494406643, "grad_norm": 1.7526819456268004, "learning_rate": 1.04889803272174e-06, "loss": 0.7761, "step": 3144 }, { "epoch": 0.2901626110021912, "grad_norm": 2.067018200441921, "learning_rate": 1.0487597554125633e-06, "loss": 0.8508, "step": 3145 }, { "epoch": 0.2901626110021912, "eval_GEN Loss": 0.46307626366615295, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3669787645339966, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8828125, "eval_runtime": 55.9242, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3145 }, { "epoch": 0.2902548725637181, "grad_norm": 1.904528284618996, "learning_rate": 1.0486214397016107e-06, "loss": 0.5534, "step": 3146 }, { "epoch": 0.29034713412524504, "grad_norm": 1.9020526562960165, "learning_rate": 1.0484830856014162e-06, "loss": 0.848, "step": 3147 }, { "epoch": 0.290439395686772, "grad_norm": 2.155351680336442, "learning_rate": 1.048344693124518e-06, "loss": 0.7462, "step": 3148 }, { "epoch": 0.29053165724829894, "grad_norm": 2.550682080895001, "learning_rate": 1.0482062622834575e-06, "loss": 0.771, "step": 3149 }, { "epoch": 0.29062391880982585, "grad_norm": 1.8111298565882687, "learning_rate": 1.0480677930907792e-06, "loss": 0.7119, "step": 3150 }, { "epoch": 0.29062391880982585, "eval_GEN Loss": 0.4651535451412201, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.35730528831481934, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8854567408561707, "eval_runtime": 55.7264, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 3150 }, { "epoch": 0.2907161803713528, "grad_norm": 2.3965045367411784, "learning_rate": 1.0479292855590314e-06, "loss": 0.6272, "step": 3151 }, { "epoch": 0.2908084419328797, "grad_norm": 1.2022092351837308, "learning_rate": 1.0477907397007664e-06, "loss": 0.6686, "step": 3152 }, { "epoch": 0.29090070349440666, "grad_norm": 1.9397325181218765, "learning_rate": 1.047652155528539e-06, "loss": 0.7637, "step": 3153 }, { "epoch": 0.2909929650559336, "grad_norm": 1.5083879696158757, "learning_rate": 1.047513533054908e-06, "loss": 0.7001, "step": 3154 }, { "epoch": 0.2910852266174605, "grad_norm": 1.5808087887051612, "learning_rate": 1.0473748722924354e-06, "loss": 0.5169, "step": 3155 }, { "epoch": 0.2910852266174605, "eval_GEN Loss": 0.46677032113075256, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3591814935207367, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8782451748847961, "eval_runtime": 55.9761, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3155 }, { "epoch": 0.2911774881789874, "grad_norm": 1.6359547268654968, "learning_rate": 1.0472361732536874e-06, "loss": 0.7349, "step": 3156 }, { "epoch": 0.29126974974051434, "grad_norm": 1.8549432198455764, "learning_rate": 1.0470974359512324e-06, "loss": 0.6993, "step": 3157 }, { "epoch": 0.2913620113020413, "grad_norm": 1.653857682227101, "learning_rate": 1.0469586603976433e-06, "loss": 0.6384, "step": 3158 }, { "epoch": 0.29145427286356823, "grad_norm": 1.548072397896846, "learning_rate": 1.0468198466054965e-06, "loss": 0.5188, "step": 3159 }, { "epoch": 0.29154653442509515, "grad_norm": 5.077027236249122, "learning_rate": 1.0466809945873713e-06, "loss": 1.0489, "step": 3160 }, { "epoch": 0.29154653442509515, "eval_GEN Loss": 0.46819600462913513, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3675070106983185, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8615384697914124, "eval_runtime": 55.9124, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3160 }, { "epoch": 0.29163879598662207, "grad_norm": 1.4133852381883283, "learning_rate": 1.0465421043558505e-06, "loss": 0.7251, "step": 3161 }, { "epoch": 0.291731057548149, "grad_norm": 1.919934809858561, "learning_rate": 1.0464031759235207e-06, "loss": 0.7187, "step": 3162 }, { "epoch": 0.2918233191096759, "grad_norm": 1.986475543429513, "learning_rate": 1.046264209302972e-06, "loss": 0.6051, "step": 3163 }, { "epoch": 0.2919155806712029, "grad_norm": 1.4775431135751924, "learning_rate": 1.0461252045067972e-06, "loss": 0.6428, "step": 3164 }, { "epoch": 0.2920078422327298, "grad_norm": 2.4297431446091817, "learning_rate": 1.0459861615475936e-06, "loss": 0.8346, "step": 3165 }, { "epoch": 0.2920078422327298, "eval_GEN Loss": 0.4699571132659912, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.40065595507621765, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8694711327552795, "eval_runtime": 55.948, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3165 }, { "epoch": 0.2921001037942567, "grad_norm": 1.7331737289138733, "learning_rate": 1.0458470804379617e-06, "loss": 0.7742, "step": 3166 }, { "epoch": 0.29219236535578363, "grad_norm": 1.867585373874945, "learning_rate": 1.0457079611905047e-06, "loss": 0.6015, "step": 3167 }, { "epoch": 0.29228462691731055, "grad_norm": 2.1300608669779955, "learning_rate": 1.04556880381783e-06, "loss": 0.8298, "step": 3168 }, { "epoch": 0.2923768884788375, "grad_norm": 1.5229898910347492, "learning_rate": 1.0454296083325483e-06, "loss": 0.7539, "step": 3169 }, { "epoch": 0.29246915004036445, "grad_norm": 3.596303188964942, "learning_rate": 1.045290374747274e-06, "loss": 0.8435, "step": 3170 }, { "epoch": 0.29246915004036445, "eval_GEN Loss": 0.46960684657096863, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.39612385630607605, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8713341355323792, "eval_runtime": 55.9532, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3170 }, { "epoch": 0.29256141160189136, "grad_norm": 1.964153866959998, "learning_rate": 1.0451511030746242e-06, "loss": 0.7423, "step": 3171 }, { "epoch": 0.2926536731634183, "grad_norm": 2.411175488046264, "learning_rate": 1.0450117933272201e-06, "loss": 0.7087, "step": 3172 }, { "epoch": 0.2927459347249452, "grad_norm": 2.634525391910467, "learning_rate": 1.0448724455176862e-06, "loss": 0.8788, "step": 3173 }, { "epoch": 0.2928381962864722, "grad_norm": 1.7843384106790685, "learning_rate": 1.0447330596586504e-06, "loss": 0.7808, "step": 3174 }, { "epoch": 0.2929304578479991, "grad_norm": 1.966600069213244, "learning_rate": 1.044593635762744e-06, "loss": 0.6539, "step": 3175 }, { "epoch": 0.2929304578479991, "eval_GEN Loss": 0.46833521127700806, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.39416956901550293, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8832932710647583, "eval_runtime": 55.9285, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3175 }, { "epoch": 0.293022719409526, "grad_norm": 1.764432799519812, "learning_rate": 1.044454173842602e-06, "loss": 0.7885, "step": 3176 }, { "epoch": 0.29311498097105293, "grad_norm": 2.04802878259487, "learning_rate": 1.0443146739108625e-06, "loss": 0.6674, "step": 3177 }, { "epoch": 0.29320724253257985, "grad_norm": 1.4919837660601845, "learning_rate": 1.0441751359801673e-06, "loss": 0.5971, "step": 3178 }, { "epoch": 0.29329950409410677, "grad_norm": 1.957245487506922, "learning_rate": 1.0440355600631612e-06, "loss": 0.863, "step": 3179 }, { "epoch": 0.29339176565563374, "grad_norm": 2.3287094530422547, "learning_rate": 1.0438959461724934e-06, "loss": 0.7705, "step": 3180 }, { "epoch": 0.29339176565563374, "eval_GEN Loss": 0.4665025472640991, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3920274078845978, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8968750238418579, "eval_runtime": 55.9439, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3180 }, { "epoch": 0.29348402721716066, "grad_norm": 1.9833444517471517, "learning_rate": 1.0437562943208153e-06, "loss": 0.8876, "step": 3181 }, { "epoch": 0.2935762887786876, "grad_norm": 1.8946601399084904, "learning_rate": 1.0436166045207831e-06, "loss": 0.6933, "step": 3182 }, { "epoch": 0.2936685503402145, "grad_norm": 2.8117872189601822, "learning_rate": 1.0434768767850551e-06, "loss": 0.9753, "step": 3183 }, { "epoch": 0.2937608119017414, "grad_norm": 3.414644451572609, "learning_rate": 1.0433371111262938e-06, "loss": 1.0414, "step": 3184 }, { "epoch": 0.2938530734632684, "grad_norm": 1.705567029138378, "learning_rate": 1.043197307557165e-06, "loss": 0.6504, "step": 3185 }, { "epoch": 0.2938530734632684, "eval_GEN Loss": 0.46626728773117065, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.39432328939437866, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8966947197914124, "eval_runtime": 55.9209, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3185 }, { "epoch": 0.2939453350247953, "grad_norm": 2.3853810340231756, "learning_rate": 1.0430574660903379e-06, "loss": 0.826, "step": 3186 }, { "epoch": 0.2940375965863222, "grad_norm": 1.4601027958840533, "learning_rate": 1.0429175867384853e-06, "loss": 0.7381, "step": 3187 }, { "epoch": 0.29412985814784914, "grad_norm": 3.0209128877522353, "learning_rate": 1.042777669514283e-06, "loss": 0.8718, "step": 3188 }, { "epoch": 0.29422211970937606, "grad_norm": 2.85446344423048, "learning_rate": 1.0426377144304107e-06, "loss": 0.8125, "step": 3189 }, { "epoch": 0.29431438127090304, "grad_norm": 1.8311409864746164, "learning_rate": 1.0424977214995515e-06, "loss": 0.7096, "step": 3190 }, { "epoch": 0.29431438127090304, "eval_GEN Loss": 0.46524283289909363, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.39024388790130615, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8878605961799622, "eval_runtime": 55.9145, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3190 }, { "epoch": 0.29440664283242995, "grad_norm": 1.4732126770264173, "learning_rate": 1.0423576907343916e-06, "loss": 0.7715, "step": 3191 }, { "epoch": 0.2944989043939569, "grad_norm": 1.4891954160985086, "learning_rate": 1.0422176221476208e-06, "loss": 0.6787, "step": 3192 }, { "epoch": 0.2945911659554838, "grad_norm": 2.4310716826356407, "learning_rate": 1.0420775157519325e-06, "loss": 0.7358, "step": 3193 }, { "epoch": 0.2946834275170107, "grad_norm": 1.847219074555379, "learning_rate": 1.041937371560023e-06, "loss": 0.7859, "step": 3194 }, { "epoch": 0.29477568907853763, "grad_norm": 1.6234422563789452, "learning_rate": 1.0417971895845927e-06, "loss": 0.7301, "step": 3195 }, { "epoch": 0.29477568907853763, "eval_GEN Loss": 0.4664727747440338, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3986499607563019, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8802283406257629, "eval_runtime": 56.0516, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 3195 }, { "epoch": 0.2948679506400646, "grad_norm": 2.2291279703305173, "learning_rate": 1.0416569698383451e-06, "loss": 0.8245, "step": 3196 }, { "epoch": 0.2949602122015915, "grad_norm": 2.3734572538934553, "learning_rate": 1.041516712333987e-06, "loss": 0.8111, "step": 3197 }, { "epoch": 0.29505247376311844, "grad_norm": 1.7671502648734991, "learning_rate": 1.041376417084229e-06, "loss": 0.796, "step": 3198 }, { "epoch": 0.29514473532464536, "grad_norm": 1.883649292075704, "learning_rate": 1.0412360841017845e-06, "loss": 0.7656, "step": 3199 }, { "epoch": 0.2952369968861723, "grad_norm": 2.680206645958656, "learning_rate": 1.041095713399371e-06, "loss": 0.7452, "step": 3200 }, { "epoch": 0.2952369968861723, "eval_GEN Loss": 0.4674176573753357, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4074541926383972, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8787259459495544, "eval_runtime": 55.9267, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3200 }, { "epoch": 0.29532925844769925, "grad_norm": 1.9446061260422907, "learning_rate": 1.040955304989709e-06, "loss": 0.7373, "step": 3201 }, { "epoch": 0.29542152000922617, "grad_norm": 2.3552602313247095, "learning_rate": 1.0408148588855225e-06, "loss": 0.655, "step": 3202 }, { "epoch": 0.2955137815707531, "grad_norm": 2.6776142622557515, "learning_rate": 1.0406743750995388e-06, "loss": 0.6728, "step": 3203 }, { "epoch": 0.29560604313228, "grad_norm": 2.496971892181065, "learning_rate": 1.0405338536444893e-06, "loss": 0.8394, "step": 3204 }, { "epoch": 0.2956983046938069, "grad_norm": 2.0945994420792324, "learning_rate": 1.0403932945331078e-06, "loss": 0.6992, "step": 3205 }, { "epoch": 0.2956983046938069, "eval_GEN Loss": 0.46679702401161194, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.4008890986442566, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8759615421295166, "eval_runtime": 55.741, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 3205 }, { "epoch": 0.2957905662553339, "grad_norm": 1.4268433586044347, "learning_rate": 1.040252697778132e-06, "loss": 0.637, "step": 3206 }, { "epoch": 0.2958828278168608, "grad_norm": 1.9604369515361877, "learning_rate": 1.0401120633923031e-06, "loss": 0.7567, "step": 3207 }, { "epoch": 0.29597508937838773, "grad_norm": 2.050256242253183, "learning_rate": 1.0399713913883655e-06, "loss": 0.8661, "step": 3208 }, { "epoch": 0.29606735093991465, "grad_norm": 1.6955652138476502, "learning_rate": 1.0398306817790677e-06, "loss": 0.8202, "step": 3209 }, { "epoch": 0.29615961250144157, "grad_norm": 1.6589527435088736, "learning_rate": 1.0396899345771603e-06, "loss": 0.8077, "step": 3210 }, { "epoch": 0.29615961250144157, "eval_GEN Loss": 0.46665677428245544, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.4116832911968231, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8700721263885498, "eval_runtime": 56.2772, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 3210 }, { "epoch": 0.2962518740629685, "grad_norm": 2.179169601372341, "learning_rate": 1.039549149795398e-06, "loss": 0.7368, "step": 3211 }, { "epoch": 0.29634413562449546, "grad_norm": 2.490690970558911, "learning_rate": 1.0394083274465397e-06, "loss": 0.6379, "step": 3212 }, { "epoch": 0.2964363971860224, "grad_norm": 2.5464766250650746, "learning_rate": 1.0392674675433462e-06, "loss": 0.813, "step": 3213 }, { "epoch": 0.2965286587475493, "grad_norm": 1.8716356283686209, "learning_rate": 1.0391265700985827e-06, "loss": 0.7216, "step": 3214 }, { "epoch": 0.2966209203090762, "grad_norm": 1.7010034716123574, "learning_rate": 1.0389856351250178e-06, "loss": 0.647, "step": 3215 }, { "epoch": 0.2966209203090762, "eval_GEN Loss": 0.4681289494037628, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4168323874473572, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8778846263885498, "eval_runtime": 56.2273, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 3215 }, { "epoch": 0.29671318187060314, "grad_norm": 1.3811160230917578, "learning_rate": 1.038844662635423e-06, "loss": 0.5191, "step": 3216 }, { "epoch": 0.2968054434321301, "grad_norm": 1.5464390579174991, "learning_rate": 1.0387036526425734e-06, "loss": 0.7829, "step": 3217 }, { "epoch": 0.29689770499365703, "grad_norm": 2.517594632348134, "learning_rate": 1.0385626051592476e-06, "loss": 0.9745, "step": 3218 }, { "epoch": 0.29698996655518395, "grad_norm": 2.413440548805422, "learning_rate": 1.0384215201982275e-06, "loss": 0.8237, "step": 3219 }, { "epoch": 0.29708222811671087, "grad_norm": 1.6389357500069879, "learning_rate": 1.0382803977722986e-06, "loss": 0.5575, "step": 3220 }, { "epoch": 0.29708222811671087, "eval_GEN Loss": 0.4676324129104614, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.40068355202674866, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8912860751152039, "eval_runtime": 55.9035, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3220 }, { "epoch": 0.2971744896782378, "grad_norm": 2.1137986501791888, "learning_rate": 1.0381392378942495e-06, "loss": 0.735, "step": 3221 }, { "epoch": 0.29726675123976476, "grad_norm": 2.168557091076219, "learning_rate": 1.0379980405768726e-06, "loss": 0.7403, "step": 3222 }, { "epoch": 0.2973590128012917, "grad_norm": 3.216875359654587, "learning_rate": 1.0378568058329628e-06, "loss": 0.8687, "step": 3223 }, { "epoch": 0.2974512743628186, "grad_norm": 2.0052480433898565, "learning_rate": 1.0377155336753196e-06, "loss": 0.8577, "step": 3224 }, { "epoch": 0.2975435359243455, "grad_norm": 1.4313688871535097, "learning_rate": 1.0375742241167452e-06, "loss": 0.6885, "step": 3225 }, { "epoch": 0.2975435359243455, "eval_GEN Loss": 0.46804577112197876, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3963159918785095, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9114783406257629, "eval_runtime": 56.0151, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 3225 }, { "epoch": 0.29763579748587243, "grad_norm": 2.187857154681799, "learning_rate": 1.0374328771700452e-06, "loss": 0.865, "step": 3226 }, { "epoch": 0.29772805904739935, "grad_norm": 1.6542876255566346, "learning_rate": 1.0372914928480285e-06, "loss": 0.7568, "step": 3227 }, { "epoch": 0.2978203206089263, "grad_norm": 1.2735996968453465, "learning_rate": 1.0371500711635079e-06, "loss": 0.5604, "step": 3228 }, { "epoch": 0.29791258217045324, "grad_norm": 2.874541431609378, "learning_rate": 1.037008612129299e-06, "loss": 0.8126, "step": 3229 }, { "epoch": 0.29800484373198016, "grad_norm": 1.3027060538651356, "learning_rate": 1.0368671157582211e-06, "loss": 0.6454, "step": 3230 }, { "epoch": 0.29800484373198016, "eval_GEN Loss": 0.46702277660369873, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.38811028003692627, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9039062261581421, "eval_runtime": 56.1379, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 3230 }, { "epoch": 0.2980971052935071, "grad_norm": 1.3655562260481116, "learning_rate": 1.0367255820630972e-06, "loss": 0.74, "step": 3231 }, { "epoch": 0.298189366855034, "grad_norm": 1.7104187736498002, "learning_rate": 1.0365840110567528e-06, "loss": 0.6899, "step": 3232 }, { "epoch": 0.298281628416561, "grad_norm": 2.070311453084554, "learning_rate": 1.0364424027520175e-06, "loss": 0.6575, "step": 3233 }, { "epoch": 0.2983738899780879, "grad_norm": 1.3532262791037883, "learning_rate": 1.036300757161724e-06, "loss": 0.7087, "step": 3234 }, { "epoch": 0.2984661515396148, "grad_norm": 2.9280333355882613, "learning_rate": 1.0361590742987084e-06, "loss": 0.9321, "step": 3235 }, { "epoch": 0.2984661515396148, "eval_GEN Loss": 0.46798866987228394, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.38410934805870056, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8912259340286255, "eval_runtime": 55.8978, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3235 }, { "epoch": 0.29855841310114173, "grad_norm": 1.7575149604597236, "learning_rate": 1.0360173541758105e-06, "loss": 0.6251, "step": 3236 }, { "epoch": 0.29865067466266865, "grad_norm": 1.7941693097692035, "learning_rate": 1.035875596805873e-06, "loss": 0.7648, "step": 3237 }, { "epoch": 0.2987429362241956, "grad_norm": 1.422349157133686, "learning_rate": 1.0357338022017422e-06, "loss": 0.7285, "step": 3238 }, { "epoch": 0.29883519778572254, "grad_norm": 2.204233576169532, "learning_rate": 1.0355919703762677e-06, "loss": 0.6954, "step": 3239 }, { "epoch": 0.29892745934724946, "grad_norm": 2.9978934632184164, "learning_rate": 1.0354501013423023e-06, "loss": 0.776, "step": 3240 }, { "epoch": 0.29892745934724946, "eval_GEN Loss": 0.46850425004959106, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3801555633544922, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8795071840286255, "eval_runtime": 57.0482, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 3240 }, { "epoch": 0.2990197209087764, "grad_norm": 2.0307286634079444, "learning_rate": 1.035308195112703e-06, "loss": 0.7, "step": 3241 }, { "epoch": 0.2991119824703033, "grad_norm": 3.218966889947449, "learning_rate": 1.035166251700329e-06, "loss": 0.9292, "step": 3242 }, { "epoch": 0.2992042440318302, "grad_norm": 2.209032735963684, "learning_rate": 1.0350242711180439e-06, "loss": 0.8464, "step": 3243 }, { "epoch": 0.2992965055933572, "grad_norm": 2.379495123563452, "learning_rate": 1.0348822533787139e-06, "loss": 0.9501, "step": 3244 }, { "epoch": 0.2993887671548841, "grad_norm": 1.6734295398994734, "learning_rate": 1.0347401984952089e-06, "loss": 0.8336, "step": 3245 }, { "epoch": 0.2993887671548841, "eval_GEN Loss": 0.46801918745040894, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.40139010548591614, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.865504801273346, "eval_runtime": 56.979, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3245 }, { "epoch": 0.299481028716411, "grad_norm": 2.06947352453802, "learning_rate": 1.034598106480402e-06, "loss": 0.7311, "step": 3246 }, { "epoch": 0.29957329027793794, "grad_norm": 1.9702157908877436, "learning_rate": 1.03445597734717e-06, "loss": 0.8078, "step": 3247 }, { "epoch": 0.29966555183946486, "grad_norm": 1.6355725513816324, "learning_rate": 1.0343138111083931e-06, "loss": 0.7881, "step": 3248 }, { "epoch": 0.29975781340099183, "grad_norm": 2.2578121541255713, "learning_rate": 1.0341716077769543e-06, "loss": 0.8894, "step": 3249 }, { "epoch": 0.29985007496251875, "grad_norm": 1.9801506616358524, "learning_rate": 1.0340293673657402e-06, "loss": 0.7919, "step": 3250 }, { "epoch": 0.29985007496251875, "eval_GEN Loss": 0.46785077452659607, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41465696692466736, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8686298131942749, "eval_runtime": 56.6402, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 3250 }, { "epoch": 0.29994233652404567, "grad_norm": 3.444329472431624, "learning_rate": 1.0338870898876412e-06, "loss": 1.1695, "step": 3251 }, { "epoch": 0.3000345980855726, "grad_norm": 2.937429164958739, "learning_rate": 1.0337447753555504e-06, "loss": 0.7983, "step": 3252 }, { "epoch": 0.3001268596470995, "grad_norm": 2.2419866762563423, "learning_rate": 1.0336024237823647e-06, "loss": 0.9784, "step": 3253 }, { "epoch": 0.3002191212086265, "grad_norm": 1.8267692641547941, "learning_rate": 1.0334600351809842e-06, "loss": 0.695, "step": 3254 }, { "epoch": 0.3003113827701534, "grad_norm": 1.7169402593841039, "learning_rate": 1.0333176095643124e-06, "loss": 0.7023, "step": 3255 }, { "epoch": 0.3003113827701534, "eval_GEN Loss": 0.46702641248703003, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.38843604922294617, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8678485751152039, "eval_runtime": 55.8029, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3255 }, { "epoch": 0.3004036443316803, "grad_norm": 1.9036497474696479, "learning_rate": 1.0331751469452561e-06, "loss": 0.7492, "step": 3256 }, { "epoch": 0.30049590589320724, "grad_norm": 1.5382110250732495, "learning_rate": 1.0330326473367255e-06, "loss": 0.6062, "step": 3257 }, { "epoch": 0.30058816745473416, "grad_norm": 2.05641696513611, "learning_rate": 1.0328901107516342e-06, "loss": 0.7757, "step": 3258 }, { "epoch": 0.3006804290162611, "grad_norm": 2.116337995374133, "learning_rate": 1.032747537202899e-06, "loss": 1.0547, "step": 3259 }, { "epoch": 0.30077269057778805, "grad_norm": 1.9551700046569036, "learning_rate": 1.0326049267034403e-06, "loss": 0.7711, "step": 3260 }, { "epoch": 0.30077269057778805, "eval_GEN Loss": 0.4676561951637268, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3697621822357178, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8673076629638672, "eval_runtime": 55.946, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3260 }, { "epoch": 0.30086495213931497, "grad_norm": 1.6620577709301876, "learning_rate": 1.0324622792661813e-06, "loss": 0.647, "step": 3261 }, { "epoch": 0.3009572137008419, "grad_norm": 1.6303362595302524, "learning_rate": 1.0323195949040493e-06, "loss": 0.6007, "step": 3262 }, { "epoch": 0.3010494752623688, "grad_norm": 1.5566984769084449, "learning_rate": 1.0321768736299745e-06, "loss": 0.752, "step": 3263 }, { "epoch": 0.3011417368238957, "grad_norm": 1.900052620726974, "learning_rate": 1.0320341154568904e-06, "loss": 0.7988, "step": 3264 }, { "epoch": 0.3012339983854227, "grad_norm": 3.0201460667688313, "learning_rate": 1.0318913203977344e-06, "loss": 0.9369, "step": 3265 }, { "epoch": 0.3012339983854227, "eval_GEN Loss": 0.46747279167175293, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.3642984926700592, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8667067289352417, "eval_runtime": 55.6597, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 3265 }, { "epoch": 0.3013262599469496, "grad_norm": 1.5204419144766583, "learning_rate": 1.0317484884654464e-06, "loss": 0.7844, "step": 3266 }, { "epoch": 0.30141852150847653, "grad_norm": 2.310936576885017, "learning_rate": 1.03160561967297e-06, "loss": 0.8933, "step": 3267 }, { "epoch": 0.30151078307000345, "grad_norm": 1.820555318156068, "learning_rate": 1.0314627140332522e-06, "loss": 0.7743, "step": 3268 }, { "epoch": 0.30160304463153037, "grad_norm": 1.8115708513353699, "learning_rate": 1.0313197715592438e-06, "loss": 0.8415, "step": 3269 }, { "epoch": 0.30169530619305734, "grad_norm": 1.9909249657601442, "learning_rate": 1.0311767922638978e-06, "loss": 0.863, "step": 3270 }, { "epoch": 0.30169530619305734, "eval_GEN Loss": 0.4707719385623932, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.38755959272384644, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8667067289352417, "eval_runtime": 56.9362, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3270 }, { "epoch": 0.30178756775458426, "grad_norm": 1.244021862801661, "learning_rate": 1.0310337761601719e-06, "loss": 0.6429, "step": 3271 }, { "epoch": 0.3018798293161112, "grad_norm": 1.6657812673684578, "learning_rate": 1.0308907232610258e-06, "loss": 0.6845, "step": 3272 }, { "epoch": 0.3019720908776381, "grad_norm": 1.9383551294255283, "learning_rate": 1.0307476335794237e-06, "loss": 0.7033, "step": 3273 }, { "epoch": 0.302064352439165, "grad_norm": 1.5038797483073527, "learning_rate": 1.0306045071283321e-06, "loss": 0.6858, "step": 3274 }, { "epoch": 0.30215661400069194, "grad_norm": 1.6482822932377652, "learning_rate": 1.030461343920722e-06, "loss": 0.7536, "step": 3275 }, { "epoch": 0.30215661400069194, "eval_GEN Loss": 0.4728904962539673, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.39366382360458374, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8687499761581421, "eval_runtime": 56.7359, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3275 }, { "epoch": 0.3022488755622189, "grad_norm": 1.9541821455417878, "learning_rate": 1.0303181439695664e-06, "loss": 0.7107, "step": 3276 }, { "epoch": 0.30234113712374583, "grad_norm": 1.7631724194084861, "learning_rate": 1.0301749072878428e-06, "loss": 0.7293, "step": 3277 }, { "epoch": 0.30243339868527275, "grad_norm": 1.956013345066894, "learning_rate": 1.0300316338885314e-06, "loss": 0.7992, "step": 3278 }, { "epoch": 0.30252566024679967, "grad_norm": 1.9077567510106757, "learning_rate": 1.0298883237846157e-06, "loss": 0.8802, "step": 3279 }, { "epoch": 0.3026179218083266, "grad_norm": 1.6983129042163072, "learning_rate": 1.0297449769890827e-06, "loss": 0.7191, "step": 3280 }, { "epoch": 0.3026179218083266, "eval_GEN Loss": 0.4703946113586426, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.3676469624042511, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8661658763885498, "eval_runtime": 56.9354, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3280 }, { "epoch": 0.30271018336985356, "grad_norm": 2.4167596748010736, "learning_rate": 1.029601593514923e-06, "loss": 0.8724, "step": 3281 }, { "epoch": 0.3028024449313805, "grad_norm": 1.9284718370881728, "learning_rate": 1.02945817337513e-06, "loss": 0.771, "step": 3282 }, { "epoch": 0.3028947064929074, "grad_norm": 2.0896592797305265, "learning_rate": 1.0293147165827005e-06, "loss": 0.726, "step": 3283 }, { "epoch": 0.3029869680544343, "grad_norm": 1.4631848407087988, "learning_rate": 1.0291712231506352e-06, "loss": 0.7402, "step": 3284 }, { "epoch": 0.30307922961596123, "grad_norm": 2.023432144881425, "learning_rate": 1.0290276930919374e-06, "loss": 0.7985, "step": 3285 }, { "epoch": 0.30307922961596123, "eval_GEN Loss": 0.4699096381664276, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3604976236820221, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8707332015037537, "eval_runtime": 56.8859, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3285 }, { "epoch": 0.3031714911774882, "grad_norm": 1.623194573926711, "learning_rate": 1.0288841264196142e-06, "loss": 0.5966, "step": 3286 }, { "epoch": 0.3032637527390151, "grad_norm": 2.5588576795049978, "learning_rate": 1.0287405231466757e-06, "loss": 0.9355, "step": 3287 }, { "epoch": 0.30335601430054204, "grad_norm": 2.076081250269867, "learning_rate": 1.0285968832861354e-06, "loss": 0.8369, "step": 3288 }, { "epoch": 0.30344827586206896, "grad_norm": 2.405456077218641, "learning_rate": 1.0284532068510103e-06, "loss": 0.8733, "step": 3289 }, { "epoch": 0.3035405374235959, "grad_norm": 1.2966798455161543, "learning_rate": 1.0283094938543206e-06, "loss": 0.6689, "step": 3290 }, { "epoch": 0.3035405374235959, "eval_GEN Loss": 0.47063034772872925, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3636990785598755, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8725360631942749, "eval_runtime": 56.8365, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3290 }, { "epoch": 0.3036327989851228, "grad_norm": 2.0413652043800243, "learning_rate": 1.0281657443090897e-06, "loss": 0.8375, "step": 3291 }, { "epoch": 0.30372506054664977, "grad_norm": 1.6862004076391688, "learning_rate": 1.0280219582283446e-06, "loss": 0.7106, "step": 3292 }, { "epoch": 0.3038173221081767, "grad_norm": 1.572203241693701, "learning_rate": 1.0278781356251151e-06, "loss": 0.7421, "step": 3293 }, { "epoch": 0.3039095836697036, "grad_norm": 1.4160268666443627, "learning_rate": 1.0277342765124348e-06, "loss": 0.5468, "step": 3294 }, { "epoch": 0.3040018452312305, "grad_norm": 1.6878246187805812, "learning_rate": 1.0275903809033405e-06, "loss": 0.8052, "step": 3295 }, { "epoch": 0.3040018452312305, "eval_GEN Loss": 0.4707462191581726, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36769601702690125, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8847355842590332, "eval_runtime": 56.7304, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3295 }, { "epoch": 0.30409410679275745, "grad_norm": 1.614324008379159, "learning_rate": 1.0274464488108723e-06, "loss": 0.7218, "step": 3296 }, { "epoch": 0.3041863683542844, "grad_norm": 2.084914313864402, "learning_rate": 1.0273024802480733e-06, "loss": 0.6896, "step": 3297 }, { "epoch": 0.30427862991581134, "grad_norm": 3.964611332592801, "learning_rate": 1.0271584752279905e-06, "loss": 0.9625, "step": 3298 }, { "epoch": 0.30437089147733826, "grad_norm": 2.240553154010285, "learning_rate": 1.0270144337636733e-06, "loss": 0.9378, "step": 3299 }, { "epoch": 0.3044631530388652, "grad_norm": 1.8621243038663489, "learning_rate": 1.026870355868176e-06, "loss": 0.7919, "step": 3300 }, { "epoch": 0.3044631530388652, "eval_GEN Loss": 0.47090718150138855, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38071757555007935, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8900841474533081, "eval_runtime": 55.7203, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3300 }, { "epoch": 0.3045554146003921, "grad_norm": 1.9486981087268203, "learning_rate": 1.0267262415545536e-06, "loss": 0.6998, "step": 3301 }, { "epoch": 0.30464767616191907, "grad_norm": 2.5574249284977015, "learning_rate": 1.0265820908358677e-06, "loss": 0.6515, "step": 3302 }, { "epoch": 0.304739937723446, "grad_norm": 2.5832467387808142, "learning_rate": 1.02643790372518e-06, "loss": 0.8226, "step": 3303 }, { "epoch": 0.3048321992849729, "grad_norm": 1.937257837319866, "learning_rate": 1.026293680235558e-06, "loss": 0.7538, "step": 3304 }, { "epoch": 0.3049244608464998, "grad_norm": 1.6625397420449046, "learning_rate": 1.026149420380071e-06, "loss": 0.7756, "step": 3305 }, { "epoch": 0.3049244608464998, "eval_GEN Loss": 0.47270333766937256, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.39520299434661865, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8859975934028625, "eval_runtime": 55.7971, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3305 }, { "epoch": 0.30501672240802674, "grad_norm": 2.268252691157371, "learning_rate": 1.026005124171792e-06, "loss": 0.7261, "step": 3306 }, { "epoch": 0.30510898396955366, "grad_norm": 1.4806585163162858, "learning_rate": 1.0258607916237972e-06, "loss": 0.6518, "step": 3307 }, { "epoch": 0.30520124553108063, "grad_norm": 1.436677787171373, "learning_rate": 1.0257164227491668e-06, "loss": 0.6294, "step": 3308 }, { "epoch": 0.30529350709260755, "grad_norm": 2.2437822009554726, "learning_rate": 1.0255720175609834e-06, "loss": 0.6874, "step": 3309 }, { "epoch": 0.30538576865413447, "grad_norm": 1.8269910046246456, "learning_rate": 1.0254275760723335e-06, "loss": 0.5265, "step": 3310 }, { "epoch": 0.30538576865413447, "eval_GEN Loss": 0.4729827046394348, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4143664538860321, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8935697078704834, "eval_runtime": 55.8389, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3310 }, { "epoch": 0.3054780302156614, "grad_norm": 2.395724923886861, "learning_rate": 1.025283098296306e-06, "loss": 0.7263, "step": 3311 }, { "epoch": 0.3055702917771883, "grad_norm": 2.230094583216984, "learning_rate": 1.0251385842459942e-06, "loss": 0.7754, "step": 3312 }, { "epoch": 0.3056625533387153, "grad_norm": 1.868791460671676, "learning_rate": 1.0249940339344942e-06, "loss": 0.7799, "step": 3313 }, { "epoch": 0.3057548149002422, "grad_norm": 2.468894125372381, "learning_rate": 1.024849447374905e-06, "loss": 0.8185, "step": 3314 }, { "epoch": 0.3058470764617691, "grad_norm": 2.0452050694746498, "learning_rate": 1.0247048245803296e-06, "loss": 0.7051, "step": 3315 }, { "epoch": 0.3058470764617691, "eval_GEN Loss": 0.4728299081325531, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.4197731018066406, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9040865302085876, "eval_runtime": 55.8304, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3315 }, { "epoch": 0.30593933802329604, "grad_norm": 1.805030598113026, "learning_rate": 1.024560165563874e-06, "loss": 0.6042, "step": 3316 }, { "epoch": 0.30603159958482296, "grad_norm": 1.829706059984909, "learning_rate": 1.024415470338647e-06, "loss": 0.6795, "step": 3317 }, { "epoch": 0.30612386114634993, "grad_norm": 2.9942106735190213, "learning_rate": 1.0242707389177615e-06, "loss": 1.025, "step": 3318 }, { "epoch": 0.30621612270787685, "grad_norm": 1.8334212605152038, "learning_rate": 1.0241259713143334e-06, "loss": 0.7262, "step": 3319 }, { "epoch": 0.30630838426940377, "grad_norm": 1.6526923793308834, "learning_rate": 1.0239811675414813e-06, "loss": 0.4432, "step": 3320 }, { "epoch": 0.30630838426940377, "eval_GEN Loss": 0.4724779427051544, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.42770978808403015, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9074519276618958, "eval_runtime": 56.6413, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 3320 }, { "epoch": 0.3064006458309307, "grad_norm": 2.137500298581433, "learning_rate": 1.0238363276123277e-06, "loss": 0.7667, "step": 3321 }, { "epoch": 0.3064929073924576, "grad_norm": 1.8812189534134063, "learning_rate": 1.0236914515399988e-06, "loss": 0.6562, "step": 3322 }, { "epoch": 0.3065851689539845, "grad_norm": 2.006870280497996, "learning_rate": 1.0235465393376226e-06, "loss": 0.9133, "step": 3323 }, { "epoch": 0.3066774305155115, "grad_norm": 1.8062423441610895, "learning_rate": 1.0234015910183317e-06, "loss": 0.7146, "step": 3324 }, { "epoch": 0.3067696920770384, "grad_norm": 2.2441966271930838, "learning_rate": 1.0232566065952619e-06, "loss": 0.7222, "step": 3325 }, { "epoch": 0.3067696920770384, "eval_GEN Loss": 0.47074562311172485, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.41788098216056824, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9084134697914124, "eval_runtime": 55.8037, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3325 }, { "epoch": 0.30686195363856533, "grad_norm": 2.6136074390789745, "learning_rate": 1.023111586081551e-06, "loss": 0.8835, "step": 3326 }, { "epoch": 0.30695421520009225, "grad_norm": 1.8722610066994665, "learning_rate": 1.0229665294903419e-06, "loss": 0.7502, "step": 3327 }, { "epoch": 0.30704647676161917, "grad_norm": 1.6319415044337886, "learning_rate": 1.0228214368347794e-06, "loss": 0.5874, "step": 3328 }, { "epoch": 0.30713873832314614, "grad_norm": 2.8342384197846364, "learning_rate": 1.0226763081280119e-06, "loss": 1.125, "step": 3329 }, { "epoch": 0.30723099988467306, "grad_norm": 1.9241778615562308, "learning_rate": 1.0225311433831917e-06, "loss": 0.6292, "step": 3330 }, { "epoch": 0.30723099988467306, "eval_GEN Loss": 0.47109854221343994, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.4101719856262207, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9084134697914124, "eval_runtime": 55.8197, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3330 }, { "epoch": 0.3073232614462, "grad_norm": 2.1434093132793293, "learning_rate": 1.0223859426134733e-06, "loss": 0.6021, "step": 3331 }, { "epoch": 0.3074155230077269, "grad_norm": 1.6934957483109931, "learning_rate": 1.0222407058320156e-06, "loss": 0.572, "step": 3332 }, { "epoch": 0.3075077845692538, "grad_norm": 1.7503604521794125, "learning_rate": 1.0220954330519796e-06, "loss": 0.8133, "step": 3333 }, { "epoch": 0.3076000461307808, "grad_norm": 1.8703807772651815, "learning_rate": 1.0219501242865307e-06, "loss": 0.7132, "step": 3334 }, { "epoch": 0.3076923076923077, "grad_norm": 1.9980591641510483, "learning_rate": 1.0218047795488365e-06, "loss": 0.8978, "step": 3335 }, { "epoch": 0.3076923076923077, "eval_GEN Loss": 0.4707014560699463, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.4088593125343323, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9044471383094788, "eval_runtime": 55.6871, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3335 }, { "epoch": 0.30778456925383463, "grad_norm": 2.07492655187952, "learning_rate": 1.0216593988520683e-06, "loss": 0.7707, "step": 3336 }, { "epoch": 0.30787683081536155, "grad_norm": 1.8991136494571181, "learning_rate": 1.0215139822094018e-06, "loss": 0.7475, "step": 3337 }, { "epoch": 0.30796909237688846, "grad_norm": 1.3872993182792597, "learning_rate": 1.0213685296340134e-06, "loss": 0.5416, "step": 3338 }, { "epoch": 0.3080613539384154, "grad_norm": 1.3707842988170422, "learning_rate": 1.0212230411390855e-06, "loss": 0.552, "step": 3339 }, { "epoch": 0.30815361549994236, "grad_norm": 2.2669664923232897, "learning_rate": 1.0210775167378015e-06, "loss": 0.6874, "step": 3340 }, { "epoch": 0.30815361549994236, "eval_GEN Loss": 0.4694972336292267, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.40061259269714355, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8984375, "eval_runtime": 56.5324, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 3340 }, { "epoch": 0.3082458770614693, "grad_norm": 2.0212913292135943, "learning_rate": 1.0209319564433499e-06, "loss": 0.8697, "step": 3341 }, { "epoch": 0.3083381386229962, "grad_norm": 2.1789344103685298, "learning_rate": 1.0207863602689208e-06, "loss": 0.8567, "step": 3342 }, { "epoch": 0.3084304001845231, "grad_norm": 1.98778489061429, "learning_rate": 1.0206407282277089e-06, "loss": 0.7202, "step": 3343 }, { "epoch": 0.30852266174605003, "grad_norm": 2.7202012428272497, "learning_rate": 1.0204950603329118e-06, "loss": 0.6787, "step": 3344 }, { "epoch": 0.308614923307577, "grad_norm": 2.1318058328549205, "learning_rate": 1.0203493565977292e-06, "loss": 0.7727, "step": 3345 }, { "epoch": 0.308614923307577, "eval_GEN Loss": 0.4690205752849579, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.387918084859848, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9064303040504456, "eval_runtime": 56.7077, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3345 }, { "epoch": 0.3087071848691039, "grad_norm": 1.890544659623137, "learning_rate": 1.020203617035366e-06, "loss": 0.7057, "step": 3346 }, { "epoch": 0.30879944643063084, "grad_norm": 1.646076173241973, "learning_rate": 1.020057841659029e-06, "loss": 0.73, "step": 3347 }, { "epoch": 0.30889170799215776, "grad_norm": 1.527831774418119, "learning_rate": 1.0199120304819285e-06, "loss": 0.7791, "step": 3348 }, { "epoch": 0.3089839695536847, "grad_norm": 1.3464500653717142, "learning_rate": 1.019766183517278e-06, "loss": 0.6014, "step": 3349 }, { "epoch": 0.30907623111521165, "grad_norm": 3.5756884753754457, "learning_rate": 1.0196203007782948e-06, "loss": 0.7607, "step": 3350 }, { "epoch": 0.30907623111521165, "eval_GEN Loss": 0.46669140458106995, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3780517876148224, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.9027042984962463, "eval_runtime": 56.5699, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 3350 }, { "epoch": 0.30916849267673857, "grad_norm": 2.7250270759632174, "learning_rate": 1.0194743822781988e-06, "loss": 1.1092, "step": 3351 }, { "epoch": 0.3092607542382655, "grad_norm": 3.136282312388678, "learning_rate": 1.0193284280302132e-06, "loss": 1.0014, "step": 3352 }, { "epoch": 0.3093530157997924, "grad_norm": 2.1291434451106217, "learning_rate": 1.0191824380475649e-06, "loss": 0.7561, "step": 3353 }, { "epoch": 0.3094452773613193, "grad_norm": 3.082858778453155, "learning_rate": 1.0190364123434834e-06, "loss": 1.0409, "step": 3354 }, { "epoch": 0.30953753892284624, "grad_norm": 2.3365254181050146, "learning_rate": 1.0188903509312022e-06, "loss": 0.6982, "step": 3355 }, { "epoch": 0.30953753892284624, "eval_GEN Loss": 0.46679937839508057, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.39128080010414124, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8769230842590332, "eval_runtime": 56.8006, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3355 }, { "epoch": 0.3096298004843732, "grad_norm": 1.9106366259885774, "learning_rate": 1.0187442538239574e-06, "loss": 0.9559, "step": 3356 }, { "epoch": 0.30972206204590014, "grad_norm": 2.0395205025758694, "learning_rate": 1.0185981210349887e-06, "loss": 0.6558, "step": 3357 }, { "epoch": 0.30981432360742706, "grad_norm": 1.7719361919041747, "learning_rate": 1.0184519525775385e-06, "loss": 0.6844, "step": 3358 }, { "epoch": 0.309906585168954, "grad_norm": 2.0228887938339666, "learning_rate": 1.0183057484648531e-06, "loss": 0.6582, "step": 3359 }, { "epoch": 0.3099988467304809, "grad_norm": 1.9374935217996054, "learning_rate": 1.0181595087101818e-06, "loss": 0.7496, "step": 3360 }, { "epoch": 0.3099988467304809, "eval_GEN Loss": 0.4677060544490814, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4080377221107483, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8750600814819336, "eval_runtime": 56.7766, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3360 }, { "epoch": 0.31009110829200787, "grad_norm": 1.6071211254353064, "learning_rate": 1.018013233326777e-06, "loss": 0.7742, "step": 3361 }, { "epoch": 0.3101833698535348, "grad_norm": 2.0562964741189953, "learning_rate": 1.0178669223278942e-06, "loss": 0.7995, "step": 3362 }, { "epoch": 0.3102756314150617, "grad_norm": 1.7809982036684668, "learning_rate": 1.0177205757267926e-06, "loss": 0.7282, "step": 3363 }, { "epoch": 0.3103678929765886, "grad_norm": 1.5973330668416594, "learning_rate": 1.0175741935367344e-06, "loss": 0.7552, "step": 3364 }, { "epoch": 0.31046015453811554, "grad_norm": 1.8496922122601893, "learning_rate": 1.0174277757709847e-06, "loss": 0.7035, "step": 3365 }, { "epoch": 0.31046015453811554, "eval_GEN Loss": 0.4686073362827301, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4041784107685089, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.868870198726654, "eval_runtime": 56.9633, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3365 }, { "epoch": 0.31055241609964246, "grad_norm": 2.0865713160728694, "learning_rate": 1.0172813224428123e-06, "loss": 0.9894, "step": 3366 }, { "epoch": 0.31064467766116943, "grad_norm": 1.8065729357525429, "learning_rate": 1.017134833565489e-06, "loss": 0.8664, "step": 3367 }, { "epoch": 0.31073693922269635, "grad_norm": 2.4333008525534088, "learning_rate": 1.0169883091522898e-06, "loss": 0.8904, "step": 3368 }, { "epoch": 0.31082920078422327, "grad_norm": 1.8428756429351756, "learning_rate": 1.016841749216493e-06, "loss": 0.9325, "step": 3369 }, { "epoch": 0.3109214623457502, "grad_norm": 1.3092401645417482, "learning_rate": 1.0166951537713804e-06, "loss": 0.7078, "step": 3370 }, { "epoch": 0.3109214623457502, "eval_GEN Loss": 0.4676709473133087, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3755190968513489, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8591946959495544, "eval_runtime": 56.7841, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3370 }, { "epoch": 0.3110137239072771, "grad_norm": 1.7672206805137922, "learning_rate": 1.0165485228302362e-06, "loss": 0.7657, "step": 3371 }, { "epoch": 0.3111059854688041, "grad_norm": 1.6200604261966551, "learning_rate": 1.0164018564063485e-06, "loss": 0.6887, "step": 3372 }, { "epoch": 0.311198247030331, "grad_norm": 2.204190312458895, "learning_rate": 1.0162551545130088e-06, "loss": 0.637, "step": 3373 }, { "epoch": 0.3112905085918579, "grad_norm": 2.870443599677136, "learning_rate": 1.0161084171635109e-06, "loss": 0.836, "step": 3374 }, { "epoch": 0.31138277015338484, "grad_norm": 1.7490066154481514, "learning_rate": 1.0159616443711526e-06, "loss": 0.7755, "step": 3375 }, { "epoch": 0.31138277015338484, "eval_GEN Loss": 0.4669856131076813, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3453295826911926, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8633413314819336, "eval_runtime": 56.7946, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3375 }, { "epoch": 0.31147503171491175, "grad_norm": 2.0361920885017017, "learning_rate": 1.0158148361492348e-06, "loss": 0.7277, "step": 3376 }, { "epoch": 0.31156729327643873, "grad_norm": 1.4250053539163856, "learning_rate": 1.0156679925110614e-06, "loss": 0.6848, "step": 3377 }, { "epoch": 0.31165955483796565, "grad_norm": 1.5666054968783123, "learning_rate": 1.0155211134699395e-06, "loss": 0.6273, "step": 3378 }, { "epoch": 0.31175181639949257, "grad_norm": 2.3737875587370185, "learning_rate": 1.0153741990391797e-06, "loss": 0.7456, "step": 3379 }, { "epoch": 0.3118440779610195, "grad_norm": 1.853789005686633, "learning_rate": 1.0152272492320956e-06, "loss": 0.6138, "step": 3380 }, { "epoch": 0.3118440779610195, "eval_GEN Loss": 0.46676862239837646, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.33773162961006165, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8675480484962463, "eval_runtime": 56.6869, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3380 }, { "epoch": 0.3119363395225464, "grad_norm": 1.7541052082128803, "learning_rate": 1.0150802640620037e-06, "loss": 0.7671, "step": 3381 }, { "epoch": 0.3120286010840733, "grad_norm": 1.8550924751502285, "learning_rate": 1.0149332435422245e-06, "loss": 0.7803, "step": 3382 }, { "epoch": 0.3121208626456003, "grad_norm": 1.5843097412727327, "learning_rate": 1.014786187686081e-06, "loss": 0.6949, "step": 3383 }, { "epoch": 0.3122131242071272, "grad_norm": 1.7730409501494113, "learning_rate": 1.0146390965068994e-06, "loss": 0.6834, "step": 3384 }, { "epoch": 0.31230538576865413, "grad_norm": 2.512328584502214, "learning_rate": 1.0144919700180097e-06, "loss": 0.7811, "step": 3385 }, { "epoch": 0.31230538576865413, "eval_GEN Loss": 0.4673357307910919, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM Loss": 0.334909588098526, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8689903616905212, "eval_runtime": 56.8249, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3385 }, { "epoch": 0.31239764733018105, "grad_norm": 2.6287097619865736, "learning_rate": 1.0143448082327448e-06, "loss": 0.7828, "step": 3386 }, { "epoch": 0.31248990889170797, "grad_norm": 1.8687824661604415, "learning_rate": 1.0141976111644403e-06, "loss": 0.5685, "step": 3387 }, { "epoch": 0.31258217045323494, "grad_norm": 1.9189808352920166, "learning_rate": 1.0140503788264358e-06, "loss": 0.6937, "step": 3388 }, { "epoch": 0.31267443201476186, "grad_norm": 1.9459741266297461, "learning_rate": 1.0139031112320736e-06, "loss": 0.8864, "step": 3389 }, { "epoch": 0.3127666935762888, "grad_norm": 2.6156046369506694, "learning_rate": 1.013755808394699e-06, "loss": 0.7837, "step": 3390 }, { "epoch": 0.3127666935762888, "eval_GEN Loss": 0.4673900902271271, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.34583035111427307, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8541466593742371, "eval_runtime": 56.8622, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3390 }, { "epoch": 0.3128589551378157, "grad_norm": 2.354927366443173, "learning_rate": 1.0136084703276617e-06, "loss": 0.7306, "step": 3391 }, { "epoch": 0.3129512166993426, "grad_norm": 2.255573155195867, "learning_rate": 1.0134610970443127e-06, "loss": 0.6164, "step": 3392 }, { "epoch": 0.3130434782608696, "grad_norm": 2.8555387428391694, "learning_rate": 1.0133136885580077e-06, "loss": 0.6752, "step": 3393 }, { "epoch": 0.3131357398223965, "grad_norm": 2.1770738403624286, "learning_rate": 1.0131662448821052e-06, "loss": 0.723, "step": 3394 }, { "epoch": 0.3132280013839234, "grad_norm": 2.0981190343643608, "learning_rate": 1.0130187660299665e-06, "loss": 0.7703, "step": 3395 }, { "epoch": 0.3132280013839234, "eval_GEN Loss": 0.4663728177547455, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3642297089099884, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8474158644676208, "eval_runtime": 57.0, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 3395 }, { "epoch": 0.31332026294545035, "grad_norm": 3.527970621621397, "learning_rate": 1.0128712520149567e-06, "loss": 0.8934, "step": 3396 }, { "epoch": 0.31341252450697726, "grad_norm": 3.170039347899062, "learning_rate": 1.0127237028504432e-06, "loss": 0.8189, "step": 3397 }, { "epoch": 0.3135047860685042, "grad_norm": 2.0768709791999744, "learning_rate": 1.0125761185497977e-06, "loss": 0.5339, "step": 3398 }, { "epoch": 0.31359704763003116, "grad_norm": 1.8826166264845288, "learning_rate": 1.012428499126394e-06, "loss": 0.6593, "step": 3399 }, { "epoch": 0.3136893091915581, "grad_norm": 1.9129527924954723, "learning_rate": 1.01228084459361e-06, "loss": 0.7743, "step": 3400 }, { "epoch": 0.3136893091915581, "eval_GEN Loss": 0.4669395387172699, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.38741618394851685, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8521634340286255, "eval_runtime": 56.8911, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3400 }, { "epoch": 0.313781570753085, "grad_norm": 2.502354480838246, "learning_rate": 1.0121331549648264e-06, "loss": 0.8719, "step": 3401 }, { "epoch": 0.3138738323146119, "grad_norm": 1.4679716181941183, "learning_rate": 1.0119854302534268e-06, "loss": 0.5931, "step": 3402 }, { "epoch": 0.31396609387613883, "grad_norm": 2.656745236494864, "learning_rate": 1.0118376704727984e-06, "loss": 0.6946, "step": 3403 }, { "epoch": 0.3140583554376658, "grad_norm": 1.5085630730545219, "learning_rate": 1.0116898756363316e-06, "loss": 0.6718, "step": 3404 }, { "epoch": 0.3141506169991927, "grad_norm": 2.0771395260898204, "learning_rate": 1.0115420457574195e-06, "loss": 0.6816, "step": 3405 }, { "epoch": 0.3141506169991927, "eval_GEN Loss": 0.4653070867061615, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3639722764492035, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8503605723381042, "eval_runtime": 56.9927, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 3405 }, { "epoch": 0.31424287856071964, "grad_norm": 1.333892759760426, "learning_rate": 1.0113941808494587e-06, "loss": 0.5261, "step": 3406 }, { "epoch": 0.31433514012224656, "grad_norm": 2.4276151214316184, "learning_rate": 1.011246280925849e-06, "loss": 0.8444, "step": 3407 }, { "epoch": 0.3144274016837735, "grad_norm": 2.210272519313882, "learning_rate": 1.0110983459999935e-06, "loss": 0.7401, "step": 3408 }, { "epoch": 0.31451966324530045, "grad_norm": 2.2593652637655706, "learning_rate": 1.0109503760852983e-06, "loss": 0.8228, "step": 3409 }, { "epoch": 0.31461192480682737, "grad_norm": 1.7818353199493056, "learning_rate": 1.0108023711951722e-06, "loss": 0.8208, "step": 3410 }, { "epoch": 0.31461192480682737, "eval_GEN Loss": 0.4647001624107361, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3483923077583313, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8742788434028625, "eval_runtime": 55.6935, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3410 }, { "epoch": 0.3147041863683543, "grad_norm": 2.012667795539502, "learning_rate": 1.0106543313430282e-06, "loss": 0.6787, "step": 3411 }, { "epoch": 0.3147964479298812, "grad_norm": 1.3123381621678762, "learning_rate": 1.0105062565422814e-06, "loss": 0.5917, "step": 3412 }, { "epoch": 0.3148887094914081, "grad_norm": 2.2622176665884255, "learning_rate": 1.010358146806351e-06, "loss": 0.806, "step": 3413 }, { "epoch": 0.31498097105293504, "grad_norm": 1.527314938773981, "learning_rate": 1.0102100021486589e-06, "loss": 0.4999, "step": 3414 }, { "epoch": 0.315073232614462, "grad_norm": 1.916729805183037, "learning_rate": 1.0100618225826298e-06, "loss": 0.5403, "step": 3415 }, { "epoch": 0.315073232614462, "eval_GEN Loss": 0.465240478515625, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.35986462235450745, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8895432949066162, "eval_runtime": 55.815, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3415 }, { "epoch": 0.31516549417598894, "grad_norm": 1.716122950973823, "learning_rate": 1.0099136081216923e-06, "loss": 0.6357, "step": 3416 }, { "epoch": 0.31525775573751585, "grad_norm": 2.1558103027639692, "learning_rate": 1.009765358779278e-06, "loss": 0.6351, "step": 3417 }, { "epoch": 0.3153500172990428, "grad_norm": 1.8971406082319706, "learning_rate": 1.009617074568821e-06, "loss": 0.6116, "step": 3418 }, { "epoch": 0.3154422788605697, "grad_norm": 2.920437480370756, "learning_rate": 1.0094687555037596e-06, "loss": 0.7252, "step": 3419 }, { "epoch": 0.31553454042209667, "grad_norm": 2.8320797851427493, "learning_rate": 1.0093204015975341e-06, "loss": 0.9, "step": 3420 }, { "epoch": 0.31553454042209667, "eval_GEN Loss": 0.4643435776233673, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37148717045783997, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8838341236114502, "eval_runtime": 55.7998, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3420 }, { "epoch": 0.3156268019836236, "grad_norm": 1.51356421307728, "learning_rate": 1.009172012863589e-06, "loss": 0.4982, "step": 3421 }, { "epoch": 0.3157190635451505, "grad_norm": 1.534661922114155, "learning_rate": 1.0090235893153717e-06, "loss": 0.6358, "step": 3422 }, { "epoch": 0.3158113251066774, "grad_norm": 1.8494959772780213, "learning_rate": 1.0088751309663316e-06, "loss": 0.6841, "step": 3423 }, { "epoch": 0.31590358666820434, "grad_norm": 1.6758762109155423, "learning_rate": 1.0087266378299234e-06, "loss": 0.7718, "step": 3424 }, { "epoch": 0.3159958482297313, "grad_norm": 2.1952365542300885, "learning_rate": 1.0085781099196032e-06, "loss": 0.7814, "step": 3425 }, { "epoch": 0.3159958482297313, "eval_GEN Loss": 0.46513885259628296, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.39377743005752563, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8839543461799622, "eval_runtime": 56.4961, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 3425 }, { "epoch": 0.31608810979125823, "grad_norm": 3.3753403499604553, "learning_rate": 1.0084295472488308e-06, "loss": 1.0128, "step": 3426 }, { "epoch": 0.31618037135278515, "grad_norm": 2.0482485230569725, "learning_rate": 1.0082809498310695e-06, "loss": 0.7715, "step": 3427 }, { "epoch": 0.31627263291431207, "grad_norm": 2.360636547456829, "learning_rate": 1.0081323176797852e-06, "loss": 0.7996, "step": 3428 }, { "epoch": 0.316364894475839, "grad_norm": 2.053635802687062, "learning_rate": 1.0079836508084471e-06, "loss": 0.9527, "step": 3429 }, { "epoch": 0.3164571560373659, "grad_norm": 1.9656706975676381, "learning_rate": 1.0078349492305278e-06, "loss": 0.7118, "step": 3430 }, { "epoch": 0.3164571560373659, "eval_GEN Loss": 0.4659498631954193, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.43402910232543945, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8809494972229004, "eval_runtime": 56.7131, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3430 }, { "epoch": 0.3165494175988929, "grad_norm": 1.9034363516133948, "learning_rate": 1.0076862129595027e-06, "loss": 0.6944, "step": 3431 }, { "epoch": 0.3166416791604198, "grad_norm": 2.5491627377452257, "learning_rate": 1.0075374420088508e-06, "loss": 0.6056, "step": 3432 }, { "epoch": 0.3167339407219467, "grad_norm": 2.6899026807620006, "learning_rate": 1.0073886363920538e-06, "loss": 0.8779, "step": 3433 }, { "epoch": 0.31682620228347363, "grad_norm": 1.481629692279984, "learning_rate": 1.0072397961225964e-06, "loss": 0.7051, "step": 3434 }, { "epoch": 0.31691846384500055, "grad_norm": 2.977962078464129, "learning_rate": 1.0070909212139674e-06, "loss": 0.8423, "step": 3435 }, { "epoch": 0.31691846384500055, "eval_GEN Loss": 0.46746936440467834, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8496732026143791, "eval_PRM F1 AUC": 0.782870612886328, "eval_PRM F1 Neg": 0.6101694915254238, "eval_PRM Loss": 0.450547456741333, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9285714285714286, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8827524185180664, "eval_runtime": 56.8121, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3435 }, { "epoch": 0.3170107254065275, "grad_norm": 2.3996413961854057, "learning_rate": 1.0069420116796574e-06, "loss": 0.6885, "step": 3436 }, { "epoch": 0.31710298696805445, "grad_norm": 2.1142899971653937, "learning_rate": 1.0067930675331613e-06, "loss": 0.8298, "step": 3437 }, { "epoch": 0.31719524852958136, "grad_norm": 1.8630473519628383, "learning_rate": 1.0066440887879762e-06, "loss": 0.7965, "step": 3438 }, { "epoch": 0.3172875100911083, "grad_norm": 2.6474044745535057, "learning_rate": 1.0064950754576032e-06, "loss": 0.8672, "step": 3439 }, { "epoch": 0.3173797716526352, "grad_norm": 2.046198469978302, "learning_rate": 1.0063460275555462e-06, "loss": 0.6864, "step": 3440 }, { "epoch": 0.3173797716526352, "eval_GEN Loss": 0.4668099284172058, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8535031847133758, "eval_PRM F1 AUC": 0.751440544787847, "eval_PRM F1 Neg": 0.5818181818181818, "eval_PRM Loss": 0.4373442232608795, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9054054054054054, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8778245449066162, "eval_runtime": 56.7758, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3440 }, { "epoch": 0.3174720332141622, "grad_norm": 2.091925694187833, "learning_rate": 1.0061969450953116e-06, "loss": 0.8362, "step": 3441 }, { "epoch": 0.3175642947756891, "grad_norm": 1.8035522488555062, "learning_rate": 1.0060478280904102e-06, "loss": 0.7548, "step": 3442 }, { "epoch": 0.317656556337216, "grad_norm": 1.8014604359281734, "learning_rate": 1.0058986765543543e-06, "loss": 0.7336, "step": 3443 }, { "epoch": 0.31774881789874293, "grad_norm": 1.6621129855361083, "learning_rate": 1.0057494905006612e-06, "loss": 0.7264, "step": 3444 }, { "epoch": 0.31784107946026985, "grad_norm": 1.9453823959241852, "learning_rate": 1.00560026994285e-06, "loss": 0.7352, "step": 3445 }, { "epoch": 0.31784107946026985, "eval_GEN Loss": 0.46572715044021606, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8589743589743589, "eval_PRM F1 AUC": 0.7731796752226295, "eval_PRM F1 Neg": 0.6071428571428571, "eval_PRM Loss": 0.4288994073867798, "eval_PRM NPV": 0.5151515151515151, "eval_PRM Precision": 0.9178082191780822, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.872776448726654, "eval_runtime": 56.7986, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3445 }, { "epoch": 0.31793334102179677, "grad_norm": 2.276878407395933, "learning_rate": 1.0054510148944432e-06, "loss": 0.8751, "step": 3446 }, { "epoch": 0.31802560258332374, "grad_norm": 2.2816585194345493, "learning_rate": 1.0053017253689664e-06, "loss": 0.8072, "step": 3447 }, { "epoch": 0.31811786414485066, "grad_norm": 2.775210014993187, "learning_rate": 1.0051524013799489e-06, "loss": 0.7209, "step": 3448 }, { "epoch": 0.3182101257063776, "grad_norm": 2.021413380796253, "learning_rate": 1.0050030429409222e-06, "loss": 0.6319, "step": 3449 }, { "epoch": 0.3183023872679045, "grad_norm": 1.798017525701329, "learning_rate": 1.0048536500654215e-06, "loss": 0.993, "step": 3450 }, { "epoch": 0.3183023872679045, "eval_GEN Loss": 0.46543627977371216, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.40401512384414673, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8692307472229004, "eval_runtime": 56.8161, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3450 }, { "epoch": 0.3183946488294314, "grad_norm": 1.629701791307313, "learning_rate": 1.0047042227669855e-06, "loss": 0.6564, "step": 3451 }, { "epoch": 0.3184869103909584, "grad_norm": 2.318404719343471, "learning_rate": 1.0045547610591549e-06, "loss": 0.7442, "step": 3452 }, { "epoch": 0.3185791719524853, "grad_norm": 1.7955599986456374, "learning_rate": 1.0044052649554747e-06, "loss": 0.7654, "step": 3453 }, { "epoch": 0.3186714335140122, "grad_norm": 1.972705877313899, "learning_rate": 1.004255734469492e-06, "loss": 0.7959, "step": 3454 }, { "epoch": 0.31876369507553914, "grad_norm": 1.2881381625310782, "learning_rate": 1.0041061696147578e-06, "loss": 0.5447, "step": 3455 }, { "epoch": 0.31876369507553914, "eval_GEN Loss": 0.46501624584198, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM Loss": 0.37184834480285645, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8751201629638672, "eval_runtime": 56.8625, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3455 }, { "epoch": 0.31885595663706606, "grad_norm": 2.7123745967657538, "learning_rate": 1.0039565704048255e-06, "loss": 0.7356, "step": 3456 }, { "epoch": 0.31894821819859304, "grad_norm": 1.858272651565408, "learning_rate": 1.0038069368532525e-06, "loss": 0.6798, "step": 3457 }, { "epoch": 0.31904047976011995, "grad_norm": 1.5476194325166135, "learning_rate": 1.0036572689735987e-06, "loss": 0.7346, "step": 3458 }, { "epoch": 0.3191327413216469, "grad_norm": 2.0370774214217233, "learning_rate": 1.003507566779427e-06, "loss": 0.7689, "step": 3459 }, { "epoch": 0.3192250028831738, "grad_norm": 2.663822577447917, "learning_rate": 1.003357830284304e-06, "loss": 0.9592, "step": 3460 }, { "epoch": 0.3192250028831738, "eval_GEN Loss": 0.46541598439216614, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.36349013447761536, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8764423131942749, "eval_runtime": 55.832, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3460 }, { "epoch": 0.3193172644447007, "grad_norm": 1.5500941830841264, "learning_rate": 1.0032080595017987e-06, "loss": 0.8309, "step": 3461 }, { "epoch": 0.31940952600622763, "grad_norm": 2.4884640035515204, "learning_rate": 1.003058254445484e-06, "loss": 0.8815, "step": 3462 }, { "epoch": 0.3195017875677546, "grad_norm": 1.5222473484521577, "learning_rate": 1.002908415128935e-06, "loss": 0.6373, "step": 3463 }, { "epoch": 0.3195940491292815, "grad_norm": 1.7115155752891467, "learning_rate": 1.0027585415657306e-06, "loss": 0.6498, "step": 3464 }, { "epoch": 0.31968631069080844, "grad_norm": 1.7464842802665954, "learning_rate": 1.0026086337694526e-06, "loss": 0.7887, "step": 3465 }, { "epoch": 0.31968631069080844, "eval_GEN Loss": 0.46864184737205505, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.369650274515152, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8722355961799622, "eval_runtime": 56.7646, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3465 }, { "epoch": 0.31977857225233536, "grad_norm": 1.7329564540020683, "learning_rate": 1.0024586917536858e-06, "loss": 0.7487, "step": 3466 }, { "epoch": 0.3198708338138623, "grad_norm": 3.370463703304283, "learning_rate": 1.0023087155320183e-06, "loss": 0.7237, "step": 3467 }, { "epoch": 0.31996309537538925, "grad_norm": 1.8017335990526395, "learning_rate": 1.002158705118041e-06, "loss": 0.8718, "step": 3468 }, { "epoch": 0.32005535693691617, "grad_norm": 2.1581579821709336, "learning_rate": 1.0020086605253482e-06, "loss": 0.6968, "step": 3469 }, { "epoch": 0.3201476184984431, "grad_norm": 1.867968093790674, "learning_rate": 1.0018585817675373e-06, "loss": 0.8581, "step": 3470 }, { "epoch": 0.3201476184984431, "eval_GEN Loss": 0.4694361984729767, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3823939859867096, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8747596144676208, "eval_runtime": 56.912, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3470 }, { "epoch": 0.32023988005997, "grad_norm": 2.755711413920739, "learning_rate": 1.0017084688582086e-06, "loss": 0.8308, "step": 3471 }, { "epoch": 0.3203321416214969, "grad_norm": 1.8441340179149308, "learning_rate": 1.0015583218109652e-06, "loss": 0.8914, "step": 3472 }, { "epoch": 0.3204244031830239, "grad_norm": 2.2674160438948654, "learning_rate": 1.001408140639414e-06, "loss": 0.6273, "step": 3473 }, { "epoch": 0.3205166647445508, "grad_norm": 1.7966698742268874, "learning_rate": 1.0012579253571648e-06, "loss": 0.6454, "step": 3474 }, { "epoch": 0.32060892630607774, "grad_norm": 2.2228832871488713, "learning_rate": 1.0011076759778301e-06, "loss": 0.7326, "step": 3475 }, { "epoch": 0.32060892630607774, "eval_GEN Loss": 0.46892285346984863, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38079655170440674, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8813701868057251, "eval_runtime": 55.8428, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3475 }, { "epoch": 0.32070118786760465, "grad_norm": 2.4632508087198017, "learning_rate": 1.000957392515026e-06, "loss": 0.8512, "step": 3476 }, { "epoch": 0.32079344942913157, "grad_norm": 1.8050158259780842, "learning_rate": 1.0008070749823709e-06, "loss": 0.5992, "step": 3477 }, { "epoch": 0.3208857109906585, "grad_norm": 2.481792641995227, "learning_rate": 1.0006567233934873e-06, "loss": 0.8449, "step": 3478 }, { "epoch": 0.32097797255218546, "grad_norm": 2.5834799184142945, "learning_rate": 1.000506337762e-06, "loss": 0.7446, "step": 3479 }, { "epoch": 0.3210702341137124, "grad_norm": 1.488416660909454, "learning_rate": 1.0003559181015374e-06, "loss": 0.6129, "step": 3480 }, { "epoch": 0.3210702341137124, "eval_GEN Loss": 0.4685995578765869, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.37271106243133545, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.885036051273346, "eval_runtime": 56.9734, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3480 }, { "epoch": 0.3211624956752393, "grad_norm": 1.6589345037028045, "learning_rate": 1.000205464425731e-06, "loss": 0.5114, "step": 3481 }, { "epoch": 0.3212547572367662, "grad_norm": 1.4823346507551198, "learning_rate": 1.0000549767482142e-06, "loss": 0.6256, "step": 3482 }, { "epoch": 0.32134701879829314, "grad_norm": 2.1792902858080847, "learning_rate": 9.999044550826256e-07, "loss": 0.8143, "step": 3483 }, { "epoch": 0.3214392803598201, "grad_norm": 1.9011944299609913, "learning_rate": 9.997538994426049e-07, "loss": 0.755, "step": 3484 }, { "epoch": 0.32153154192134703, "grad_norm": 1.4360295660088076, "learning_rate": 9.99603309841796e-07, "loss": 0.6985, "step": 3485 }, { "epoch": 0.32153154192134703, "eval_GEN Loss": 0.4663397967815399, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3620414733886719, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9073317050933838, "eval_runtime": 57.0555, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 3485 }, { "epoch": 0.32162380348287395, "grad_norm": 1.4470063670363587, "learning_rate": 9.994526862938455e-07, "loss": 0.574, "step": 3486 }, { "epoch": 0.32171606504440087, "grad_norm": 2.356573665782338, "learning_rate": 9.993020288124033e-07, "loss": 0.5472, "step": 3487 }, { "epoch": 0.3218083266059278, "grad_norm": 1.380305689048948, "learning_rate": 9.99151337411122e-07, "loss": 0.6889, "step": 3488 }, { "epoch": 0.32190058816745476, "grad_norm": 5.131841186139524, "learning_rate": 9.990006121036575e-07, "loss": 1.1968, "step": 3489 }, { "epoch": 0.3219928497289817, "grad_norm": 1.48050417658812, "learning_rate": 9.98849852903669e-07, "loss": 0.7084, "step": 3490 }, { "epoch": 0.3219928497289817, "eval_GEN Loss": 0.4651165306568146, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3570702373981476, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9067908525466919, "eval_runtime": 56.7204, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3490 }, { "epoch": 0.3220851112905086, "grad_norm": 1.8579928368458347, "learning_rate": 9.986990598248184e-07, "loss": 0.7977, "step": 3491 }, { "epoch": 0.3221773728520355, "grad_norm": 2.893219702474659, "learning_rate": 9.985482328807706e-07, "loss": 0.8473, "step": 3492 }, { "epoch": 0.32226963441356243, "grad_norm": 1.6827002563814335, "learning_rate": 9.983973720851942e-07, "loss": 0.6579, "step": 3493 }, { "epoch": 0.32236189597508935, "grad_norm": 1.989817046564749, "learning_rate": 9.982464774517601e-07, "loss": 0.6656, "step": 3494 }, { "epoch": 0.3224541575366163, "grad_norm": 2.4968862552563533, "learning_rate": 9.980955489941426e-07, "loss": 0.6077, "step": 3495 }, { "epoch": 0.3224541575366163, "eval_GEN Loss": 0.4649212956428528, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3645148277282715, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8651442527770996, "eval_runtime": 56.6942, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3495 }, { "epoch": 0.32254641909814324, "grad_norm": 1.9968034514774233, "learning_rate": 9.979445867260192e-07, "loss": 0.7793, "step": 3496 }, { "epoch": 0.32263868065967016, "grad_norm": 1.8670585681050127, "learning_rate": 9.977935906610705e-07, "loss": 0.6814, "step": 3497 }, { "epoch": 0.3227309422211971, "grad_norm": 2.5632636171198646, "learning_rate": 9.976425608129797e-07, "loss": 0.5964, "step": 3498 }, { "epoch": 0.322823203782724, "grad_norm": 3.296842722098701, "learning_rate": 9.974914971954335e-07, "loss": 0.8559, "step": 3499 }, { "epoch": 0.322915465344251, "grad_norm": 2.117938633792717, "learning_rate": 9.973403998221216e-07, "loss": 0.8139, "step": 3500 }, { "epoch": 0.322915465344251, "eval_GEN Loss": 0.4646627604961395, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3864864408969879, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.851832926273346, "eval_runtime": 56.6424, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 3500 }, { "epoch": 0.3230077269057779, "grad_norm": 1.7625420107198013, "learning_rate": 9.971892687067365e-07, "loss": 0.7544, "step": 3501 }, { "epoch": 0.3230999884673048, "grad_norm": 1.543818768500952, "learning_rate": 9.970381038629739e-07, "loss": 0.6944, "step": 3502 }, { "epoch": 0.32319225002883173, "grad_norm": 1.7411614102137767, "learning_rate": 9.96886905304533e-07, "loss": 0.7008, "step": 3503 }, { "epoch": 0.32328451159035865, "grad_norm": 2.4201877683372226, "learning_rate": 9.967356730451153e-07, "loss": 0.6991, "step": 3504 }, { "epoch": 0.3233767731518856, "grad_norm": 1.5902999389333115, "learning_rate": 9.965844070984259e-07, "loss": 0.5897, "step": 3505 }, { "epoch": 0.3233767731518856, "eval_GEN Loss": 0.4636280834674835, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3915148973464966, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8522836565971375, "eval_runtime": 56.9852, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3505 }, { "epoch": 0.32346903471341254, "grad_norm": 1.8223841583214533, "learning_rate": 9.964331074781724e-07, "loss": 0.7535, "step": 3506 }, { "epoch": 0.32356129627493946, "grad_norm": 1.8371545605290758, "learning_rate": 9.962817741980662e-07, "loss": 0.753, "step": 3507 }, { "epoch": 0.3236535578364664, "grad_norm": 1.706081604023497, "learning_rate": 9.96130407271821e-07, "loss": 0.5756, "step": 3508 }, { "epoch": 0.3237458193979933, "grad_norm": 1.5201240848822422, "learning_rate": 9.959790067131545e-07, "loss": 0.5854, "step": 3509 }, { "epoch": 0.3238380809595202, "grad_norm": 1.5433507169008192, "learning_rate": 9.958275725357864e-07, "loss": 0.7748, "step": 3510 }, { "epoch": 0.3238380809595202, "eval_GEN Loss": 0.4637582302093506, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37704744935035706, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8530648946762085, "eval_runtime": 56.2812, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 3510 }, { "epoch": 0.3239303425210472, "grad_norm": 1.9682506816690448, "learning_rate": 9.956761047534398e-07, "loss": 0.6819, "step": 3511 }, { "epoch": 0.3240226040825741, "grad_norm": 2.234304513029621, "learning_rate": 9.955246033798412e-07, "loss": 0.8584, "step": 3512 }, { "epoch": 0.324114865644101, "grad_norm": 2.273810968616627, "learning_rate": 9.9537306842872e-07, "loss": 0.7094, "step": 3513 }, { "epoch": 0.32420712720562794, "grad_norm": 1.7473241154353563, "learning_rate": 9.95221499913808e-07, "loss": 0.6667, "step": 3514 }, { "epoch": 0.32429938876715486, "grad_norm": 2.204837392640544, "learning_rate": 9.950698978488413e-07, "loss": 0.7814, "step": 3515 }, { "epoch": 0.32429938876715486, "eval_GEN Loss": 0.46310362219810486, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36104968190193176, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8682692050933838, "eval_runtime": 56.0223, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 3515 }, { "epoch": 0.32439165032868184, "grad_norm": 3.279985801957001, "learning_rate": 9.949182622475578e-07, "loss": 0.754, "step": 3516 }, { "epoch": 0.32448391189020875, "grad_norm": 1.6149360580825767, "learning_rate": 9.94766593123699e-07, "loss": 0.7358, "step": 3517 }, { "epoch": 0.3245761734517357, "grad_norm": 2.603168287879418, "learning_rate": 9.946148904910097e-07, "loss": 0.6986, "step": 3518 }, { "epoch": 0.3246684350132626, "grad_norm": 1.5952717176591018, "learning_rate": 9.94463154363237e-07, "loss": 0.7918, "step": 3519 }, { "epoch": 0.3247606965747895, "grad_norm": 3.494653024342418, "learning_rate": 9.94311384754132e-07, "loss": 0.8076, "step": 3520 }, { "epoch": 0.3247606965747895, "eval_GEN Loss": 0.46455931663513184, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36879345774650574, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8652644157409668, "eval_runtime": 55.8298, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3520 }, { "epoch": 0.3248529581363165, "grad_norm": 1.6094419502732449, "learning_rate": 9.94159581677448e-07, "loss": 0.6275, "step": 3521 }, { "epoch": 0.3249452196978434, "grad_norm": 2.2631956566098324, "learning_rate": 9.940077451469415e-07, "loss": 0.7404, "step": 3522 }, { "epoch": 0.3250374812593703, "grad_norm": 1.967997279588366, "learning_rate": 9.938558751763722e-07, "loss": 0.7002, "step": 3523 }, { "epoch": 0.32512974282089724, "grad_norm": 1.4462636431295166, "learning_rate": 9.937039717795033e-07, "loss": 0.6084, "step": 3524 }, { "epoch": 0.32522200438242416, "grad_norm": 3.3220946326326035, "learning_rate": 9.935520349700998e-07, "loss": 1.0089, "step": 3525 }, { "epoch": 0.32522200438242416, "eval_GEN Loss": 0.46530255675315857, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38551005721092224, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8630408644676208, "eval_runtime": 55.9978, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3525 }, { "epoch": 0.3253142659439511, "grad_norm": 1.2702398349924198, "learning_rate": 9.934000647619308e-07, "loss": 0.6857, "step": 3526 }, { "epoch": 0.32540652750547805, "grad_norm": 1.4903996596380185, "learning_rate": 9.932480611687682e-07, "loss": 0.5613, "step": 3527 }, { "epoch": 0.32549878906700497, "grad_norm": 1.615800743168112, "learning_rate": 9.930960242043866e-07, "loss": 0.7292, "step": 3528 }, { "epoch": 0.3255910506285319, "grad_norm": 1.754218562582439, "learning_rate": 9.929439538825638e-07, "loss": 0.7225, "step": 3529 }, { "epoch": 0.3256833121900588, "grad_norm": 1.47978871431795, "learning_rate": 9.927918502170807e-07, "loss": 0.5319, "step": 3530 }, { "epoch": 0.3256833121900588, "eval_GEN Loss": 0.46523532271385193, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.39558637142181396, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8748798370361328, "eval_runtime": 55.8385, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3530 }, { "epoch": 0.3257755737515857, "grad_norm": 1.44946982046061, "learning_rate": 9.926397132217215e-07, "loss": 0.7779, "step": 3531 }, { "epoch": 0.3258678353131127, "grad_norm": 1.3606095037000285, "learning_rate": 9.924875429102726e-07, "loss": 0.5909, "step": 3532 }, { "epoch": 0.3259600968746396, "grad_norm": 1.8284814268112917, "learning_rate": 9.923353392965242e-07, "loss": 0.5984, "step": 3533 }, { "epoch": 0.32605235843616653, "grad_norm": 2.3443389162735913, "learning_rate": 9.92183102394269e-07, "loss": 0.747, "step": 3534 }, { "epoch": 0.32614461999769345, "grad_norm": 1.8918598611991704, "learning_rate": 9.920308322173034e-07, "loss": 0.7048, "step": 3535 }, { "epoch": 0.32614461999769345, "eval_GEN Loss": 0.46586254239082336, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.40054383873939514, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8873196840286255, "eval_runtime": 56.3702, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 3535 }, { "epoch": 0.32623688155922037, "grad_norm": 2.1254200252964237, "learning_rate": 9.918785287794258e-07, "loss": 0.6929, "step": 3536 }, { "epoch": 0.32632914312074734, "grad_norm": 2.922619342579277, "learning_rate": 9.917261920944386e-07, "loss": 0.8515, "step": 3537 }, { "epoch": 0.32642140468227426, "grad_norm": 1.6413771771773444, "learning_rate": 9.915738221761467e-07, "loss": 0.62, "step": 3538 }, { "epoch": 0.3265136662438012, "grad_norm": 2.4277621445063735, "learning_rate": 9.91421419038358e-07, "loss": 0.6826, "step": 3539 }, { "epoch": 0.3266059278053281, "grad_norm": 1.8688089590377583, "learning_rate": 9.912689826948835e-07, "loss": 0.6656, "step": 3540 }, { "epoch": 0.3266059278053281, "eval_GEN Loss": 0.46760138869285583, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.41551968455314636, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8883413672447205, "eval_runtime": 55.8784, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3540 }, { "epoch": 0.326698189366855, "grad_norm": 2.3097141831984227, "learning_rate": 9.911165131595372e-07, "loss": 0.8522, "step": 3541 }, { "epoch": 0.32679045092838194, "grad_norm": 2.0738725418081287, "learning_rate": 9.909640104461363e-07, "loss": 0.8364, "step": 3542 }, { "epoch": 0.3268827124899089, "grad_norm": 2.6397397055896996, "learning_rate": 9.908114745685006e-07, "loss": 0.8954, "step": 3543 }, { "epoch": 0.32697497405143583, "grad_norm": 2.4376903133080288, "learning_rate": 9.906589055404534e-07, "loss": 0.8489, "step": 3544 }, { "epoch": 0.32706723561296275, "grad_norm": 1.9557592094536642, "learning_rate": 9.905063033758204e-07, "loss": 0.7317, "step": 3545 }, { "epoch": 0.32706723561296275, "eval_GEN Loss": 0.46769118309020996, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.43777814507484436, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8790565133094788, "eval_runtime": 55.8401, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3545 }, { "epoch": 0.32715949717448967, "grad_norm": 2.887833227549036, "learning_rate": 9.903536680884312e-07, "loss": 0.7556, "step": 3546 }, { "epoch": 0.3272517587360166, "grad_norm": 2.0135855167794174, "learning_rate": 9.902009996921174e-07, "loss": 0.8285, "step": 3547 }, { "epoch": 0.32734402029754356, "grad_norm": 1.6496526739939865, "learning_rate": 9.900482982007143e-07, "loss": 0.7358, "step": 3548 }, { "epoch": 0.3274362818590705, "grad_norm": 1.8934874830584503, "learning_rate": 9.898955636280596e-07, "loss": 0.7606, "step": 3549 }, { "epoch": 0.3275285434205974, "grad_norm": 1.6708224328009713, "learning_rate": 9.897427959879946e-07, "loss": 0.6658, "step": 3550 }, { "epoch": 0.3275285434205974, "eval_GEN Loss": 0.470447838306427, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8441558441558441, "eval_PRM F1 AUC": 0.7611314824515453, "eval_PRM F1 Neg": 0.5862068965517241, "eval_PRM Loss": 0.46784281730651855, "eval_PRM NPV": 0.4857142857142857, "eval_PRM Precision": 0.9154929577464789, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8864783644676208, "eval_runtime": 55.7936, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3550 }, { "epoch": 0.3276208049821243, "grad_norm": 1.9864574515885203, "learning_rate": 9.895899952943635e-07, "loss": 0.9907, "step": 3551 }, { "epoch": 0.32771306654365123, "grad_norm": 2.0995437303723774, "learning_rate": 9.89437161561013e-07, "loss": 0.7183, "step": 3552 }, { "epoch": 0.3278053281051782, "grad_norm": 2.986297370252215, "learning_rate": 9.892842948017933e-07, "loss": 0.7068, "step": 3553 }, { "epoch": 0.3278975896667051, "grad_norm": 2.518680116744529, "learning_rate": 9.891313950305576e-07, "loss": 0.7512, "step": 3554 }, { "epoch": 0.32798985122823204, "grad_norm": 2.800470026143454, "learning_rate": 9.889784622611614e-07, "loss": 0.6876, "step": 3555 }, { "epoch": 0.32798985122823204, "eval_GEN Loss": 0.4716262221336365, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8516129032258064, "eval_PRM F1 AUC": 0.7671555788370874, "eval_PRM F1 Neg": 0.5964912280701754, "eval_PRM Loss": 0.4461728632450104, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8704928159713745, "eval_runtime": 55.986, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3555 }, { "epoch": 0.32808211278975896, "grad_norm": 1.7422711145725653, "learning_rate": 9.888254965074643e-07, "loss": 0.6865, "step": 3556 }, { "epoch": 0.3281743743512859, "grad_norm": 2.3397409083732446, "learning_rate": 9.886724977833278e-07, "loss": 0.7051, "step": 3557 }, { "epoch": 0.3282666359128128, "grad_norm": 1.9108475400470184, "learning_rate": 9.885194661026174e-07, "loss": 0.6331, "step": 3558 }, { "epoch": 0.3283588974743398, "grad_norm": 1.5522411601505866, "learning_rate": 9.883664014792005e-07, "loss": 0.6853, "step": 3559 }, { "epoch": 0.3284511590358667, "grad_norm": 2.229268100481141, "learning_rate": 9.882133039269486e-07, "loss": 0.7715, "step": 3560 }, { "epoch": 0.3284511590358667, "eval_GEN Loss": 0.46998584270477295, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3751089572906494, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8559495210647583, "eval_runtime": 55.8954, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3560 }, { "epoch": 0.3285434205973936, "grad_norm": 2.098409479358096, "learning_rate": 9.880601734597354e-07, "loss": 0.648, "step": 3561 }, { "epoch": 0.32863568215892053, "grad_norm": 1.5486454764490598, "learning_rate": 9.879070100914375e-07, "loss": 0.7608, "step": 3562 }, { "epoch": 0.32872794372044745, "grad_norm": 1.4930135376285247, "learning_rate": 9.877538138359355e-07, "loss": 0.6318, "step": 3563 }, { "epoch": 0.3288202052819744, "grad_norm": 3.033861758280288, "learning_rate": 9.876005847071117e-07, "loss": 0.8673, "step": 3564 }, { "epoch": 0.32891246684350134, "grad_norm": 1.8478406721587446, "learning_rate": 9.874473227188523e-07, "loss": 0.6408, "step": 3565 }, { "epoch": 0.32891246684350134, "eval_GEN Loss": 0.4700247645378113, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35278984904289246, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8729567527770996, "eval_runtime": 56.8694, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3565 }, { "epoch": 0.32900472840502826, "grad_norm": 1.721789085268667, "learning_rate": 9.87294027885046e-07, "loss": 0.6808, "step": 3566 }, { "epoch": 0.3290969899665552, "grad_norm": 1.929773975651704, "learning_rate": 9.871407002195845e-07, "loss": 0.6625, "step": 3567 }, { "epoch": 0.3291892515280821, "grad_norm": 2.4115324080600087, "learning_rate": 9.869873397363628e-07, "loss": 0.7695, "step": 3568 }, { "epoch": 0.32928151308960907, "grad_norm": 2.0794827013150656, "learning_rate": 9.868339464492785e-07, "loss": 0.7534, "step": 3569 }, { "epoch": 0.329373774651136, "grad_norm": 2.420888531379509, "learning_rate": 9.866805203722327e-07, "loss": 0.9365, "step": 3570 }, { "epoch": 0.329373774651136, "eval_GEN Loss": 0.467998743057251, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3475819230079651, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8640024065971375, "eval_runtime": 56.7779, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3570 }, { "epoch": 0.3294660362126629, "grad_norm": 2.0227342219705027, "learning_rate": 9.865270615191285e-07, "loss": 0.6998, "step": 3571 }, { "epoch": 0.3295582977741898, "grad_norm": 1.6543561218331455, "learning_rate": 9.863735699038732e-07, "loss": 0.6135, "step": 3572 }, { "epoch": 0.32965055933571674, "grad_norm": 2.194018305326554, "learning_rate": 9.86220045540376e-07, "loss": 0.9116, "step": 3573 }, { "epoch": 0.32974282089724366, "grad_norm": 1.8454937454144151, "learning_rate": 9.860664884425499e-07, "loss": 0.7856, "step": 3574 }, { "epoch": 0.32983508245877063, "grad_norm": 1.634498692436031, "learning_rate": 9.859128986243102e-07, "loss": 0.7193, "step": 3575 }, { "epoch": 0.32983508245877063, "eval_GEN Loss": 0.46865424513816833, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34768542647361755, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8395432829856873, "eval_runtime": 56.7471, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3575 }, { "epoch": 0.32992734402029755, "grad_norm": 1.357543461498226, "learning_rate": 9.857592760995755e-07, "loss": 0.6006, "step": 3576 }, { "epoch": 0.33001960558182447, "grad_norm": 2.224208403060692, "learning_rate": 9.856056208822674e-07, "loss": 0.8296, "step": 3577 }, { "epoch": 0.3301118671433514, "grad_norm": 1.8696798446162632, "learning_rate": 9.854519329863102e-07, "loss": 0.6758, "step": 3578 }, { "epoch": 0.3302041287048783, "grad_norm": 2.034689805212518, "learning_rate": 9.852982124256317e-07, "loss": 0.6788, "step": 3579 }, { "epoch": 0.3302963902664053, "grad_norm": 1.4513004451549032, "learning_rate": 9.85144459214162e-07, "loss": 0.7563, "step": 3580 }, { "epoch": 0.3302963902664053, "eval_GEN Loss": 0.46821364760398865, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3536064326763153, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8288461565971375, "eval_runtime": 55.7502, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 3580 }, { "epoch": 0.3303886518279322, "grad_norm": 2.093938427424334, "learning_rate": 9.849906733658344e-07, "loss": 0.8765, "step": 3581 }, { "epoch": 0.3304809133894591, "grad_norm": 1.5655414643833065, "learning_rate": 9.848368548945855e-07, "loss": 0.7538, "step": 3582 }, { "epoch": 0.33057317495098604, "grad_norm": 1.5621782867141305, "learning_rate": 9.846830038143544e-07, "loss": 0.677, "step": 3583 }, { "epoch": 0.33066543651251296, "grad_norm": 1.7419478060144966, "learning_rate": 9.845291201390833e-07, "loss": 0.7433, "step": 3584 }, { "epoch": 0.33075769807403993, "grad_norm": 1.4566245925145112, "learning_rate": 9.843752038827174e-07, "loss": 0.6689, "step": 3585 }, { "epoch": 0.33075769807403993, "eval_GEN Loss": 0.467538058757782, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.3611035943031311, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8266226053237915, "eval_runtime": 55.9986, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3585 }, { "epoch": 0.33084995963556685, "grad_norm": 1.7653443118561036, "learning_rate": 9.842212550592048e-07, "loss": 0.5293, "step": 3586 }, { "epoch": 0.33094222119709377, "grad_norm": 1.9766834292208788, "learning_rate": 9.840672736824968e-07, "loss": 0.6617, "step": 3587 }, { "epoch": 0.3310344827586207, "grad_norm": 2.154507425593431, "learning_rate": 9.839132597665472e-07, "loss": 0.7231, "step": 3588 }, { "epoch": 0.3311267443201476, "grad_norm": 1.9482214572827599, "learning_rate": 9.837592133253131e-07, "loss": 0.827, "step": 3589 }, { "epoch": 0.3312190058816745, "grad_norm": 1.5324463255142962, "learning_rate": 9.836051343727542e-07, "loss": 0.6762, "step": 3590 }, { "epoch": 0.3312190058816745, "eval_GEN Loss": 0.4666840732097626, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3566901385784149, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8296874761581421, "eval_runtime": 55.9346, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3590 }, { "epoch": 0.3313112674432015, "grad_norm": 2.1318209293480193, "learning_rate": 9.83451022922834e-07, "loss": 0.7061, "step": 3591 }, { "epoch": 0.3314035290047284, "grad_norm": 2.0365177450658285, "learning_rate": 9.832968789895175e-07, "loss": 0.616, "step": 3592 }, { "epoch": 0.33149579056625533, "grad_norm": 1.8458554826737847, "learning_rate": 9.83142702586774e-07, "loss": 0.7136, "step": 3593 }, { "epoch": 0.33158805212778225, "grad_norm": 1.8249708828529854, "learning_rate": 9.82988493728575e-07, "loss": 0.6292, "step": 3594 }, { "epoch": 0.33168031368930917, "grad_norm": 1.4049328479545602, "learning_rate": 9.828342524288952e-07, "loss": 0.6941, "step": 3595 }, { "epoch": 0.33168031368930917, "eval_GEN Loss": 0.4676535129547119, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35014253854751587, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8380408883094788, "eval_runtime": 55.8272, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3595 }, { "epoch": 0.33177257525083614, "grad_norm": 1.918620717524742, "learning_rate": 9.826799787017125e-07, "loss": 0.6852, "step": 3596 }, { "epoch": 0.33186483681236306, "grad_norm": 2.7821418769492015, "learning_rate": 9.82525672561007e-07, "loss": 0.7714, "step": 3597 }, { "epoch": 0.33195709837389, "grad_norm": 2.7324268536076075, "learning_rate": 9.82371334020762e-07, "loss": 0.6198, "step": 3598 }, { "epoch": 0.3320493599354169, "grad_norm": 1.7560132191259046, "learning_rate": 9.822169630949646e-07, "loss": 0.7944, "step": 3599 }, { "epoch": 0.3321416214969438, "grad_norm": 1.9811400790997766, "learning_rate": 9.820625597976034e-07, "loss": 0.757, "step": 3600 }, { "epoch": 0.3321416214969438, "eval_GEN Loss": 0.46804919838905334, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.35448625683784485, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8407752513885498, "eval_runtime": 56.8251, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3600 }, { "epoch": 0.3322338830584708, "grad_norm": 2.317114525595054, "learning_rate": 9.819081241426712e-07, "loss": 0.8489, "step": 3601 }, { "epoch": 0.3323261446199977, "grad_norm": 2.3501109658797543, "learning_rate": 9.81753656144163e-07, "loss": 0.9152, "step": 3602 }, { "epoch": 0.33241840618152463, "grad_norm": 2.659171281274666, "learning_rate": 9.815991558160767e-07, "loss": 0.7636, "step": 3603 }, { "epoch": 0.33251066774305155, "grad_norm": 1.5818614548927388, "learning_rate": 9.81444623172414e-07, "loss": 0.7166, "step": 3604 }, { "epoch": 0.33260292930457847, "grad_norm": 1.9309032159798014, "learning_rate": 9.812900582271782e-07, "loss": 0.7325, "step": 3605 }, { "epoch": 0.33260292930457847, "eval_GEN Loss": 0.47041070461273193, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3725634813308716, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8425480723381042, "eval_runtime": 56.7459, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3605 }, { "epoch": 0.3326951908661054, "grad_norm": 1.997389389637752, "learning_rate": 9.811354609943768e-07, "loss": 0.8185, "step": 3606 }, { "epoch": 0.33278745242763236, "grad_norm": 2.4516550611031187, "learning_rate": 9.80980831488019e-07, "loss": 0.8558, "step": 3607 }, { "epoch": 0.3328797139891593, "grad_norm": 3.098445188537611, "learning_rate": 9.808261697221182e-07, "loss": 0.821, "step": 3608 }, { "epoch": 0.3329719755506862, "grad_norm": 3.3512603523443776, "learning_rate": 9.806714757106896e-07, "loss": 0.7201, "step": 3609 }, { "epoch": 0.3330642371122131, "grad_norm": 1.7652329363446022, "learning_rate": 9.805167494677522e-07, "loss": 0.6832, "step": 3610 }, { "epoch": 0.3330642371122131, "eval_GEN Loss": 0.471610963344574, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.39141222834587097, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8512319922447205, "eval_runtime": 56.7684, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3610 }, { "epoch": 0.33315649867374003, "grad_norm": 1.725382749587872, "learning_rate": 9.803619910073273e-07, "loss": 0.6388, "step": 3611 }, { "epoch": 0.333248760235267, "grad_norm": 1.3562386428929896, "learning_rate": 9.802072003434395e-07, "loss": 0.4694, "step": 3612 }, { "epoch": 0.3333410217967939, "grad_norm": 2.178595676424367, "learning_rate": 9.80052377490116e-07, "loss": 0.9785, "step": 3613 }, { "epoch": 0.33343328335832084, "grad_norm": 1.9166366676661377, "learning_rate": 9.798975224613874e-07, "loss": 0.7763, "step": 3614 }, { "epoch": 0.33352554491984776, "grad_norm": 2.886258933560402, "learning_rate": 9.797426352712865e-07, "loss": 0.9123, "step": 3615 }, { "epoch": 0.33352554491984776, "eval_GEN Loss": 0.474600613117218, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8496732026143791, "eval_PRM F1 AUC": 0.782870612886328, "eval_PRM F1 Neg": 0.6101694915254238, "eval_PRM Loss": 0.4381133019924164, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9285714285714286, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8804687261581421, "eval_runtime": 55.5869, "eval_samples_per_second": 1.169, "eval_steps_per_second": 0.09, "step": 3615 }, { "epoch": 0.3336178064813747, "grad_norm": 2.193058438376044, "learning_rate": 9.795877159338495e-07, "loss": 0.8594, "step": 3616 }, { "epoch": 0.33371006804290165, "grad_norm": 2.1883940438320395, "learning_rate": 9.794327644631158e-07, "loss": 0.8318, "step": 3617 }, { "epoch": 0.33380232960442857, "grad_norm": 1.6312277262767367, "learning_rate": 9.792777808731272e-07, "loss": 0.8312, "step": 3618 }, { "epoch": 0.3338945911659555, "grad_norm": 2.1066961426840316, "learning_rate": 9.791227651779281e-07, "loss": 0.5322, "step": 3619 }, { "epoch": 0.3339868527274824, "grad_norm": 1.4272026742780817, "learning_rate": 9.789677173915668e-07, "loss": 0.6554, "step": 3620 }, { "epoch": 0.3339868527274824, "eval_GEN Loss": 0.4727225601673126, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.42424073815345764, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8775841593742371, "eval_runtime": 55.7186, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3620 }, { "epoch": 0.3340791142890093, "grad_norm": 2.145798214258014, "learning_rate": 9.788126375280938e-07, "loss": 0.8423, "step": 3621 }, { "epoch": 0.33417137585053625, "grad_norm": 2.9563684798156435, "learning_rate": 9.786575256015626e-07, "loss": 0.8395, "step": 3622 }, { "epoch": 0.3342636374120632, "grad_norm": 1.7965145492137091, "learning_rate": 9.7850238162603e-07, "loss": 0.7023, "step": 3623 }, { "epoch": 0.33435589897359014, "grad_norm": 1.7984494777458995, "learning_rate": 9.78347205615555e-07, "loss": 0.5726, "step": 3624 }, { "epoch": 0.33444816053511706, "grad_norm": 1.406845092088345, "learning_rate": 9.781919975842e-07, "loss": 0.7181, "step": 3625 }, { "epoch": 0.33444816053511706, "eval_GEN Loss": 0.47157713770866394, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.39016249775886536, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8611177802085876, "eval_runtime": 56.817, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3625 }, { "epoch": 0.334540422096644, "grad_norm": 1.5375369962792949, "learning_rate": 9.780367575460303e-07, "loss": 0.7015, "step": 3626 }, { "epoch": 0.3346326836581709, "grad_norm": 2.5355376845655746, "learning_rate": 9.778814855151138e-07, "loss": 0.8713, "step": 3627 }, { "epoch": 0.33472494521969787, "grad_norm": 1.564816302027679, "learning_rate": 9.77726181505522e-07, "loss": 0.8189, "step": 3628 }, { "epoch": 0.3348172067812248, "grad_norm": 2.1185382668919535, "learning_rate": 9.775708455313283e-07, "loss": 0.9248, "step": 3629 }, { "epoch": 0.3349094683427517, "grad_norm": 2.394410579705335, "learning_rate": 9.774154776066093e-07, "loss": 0.8632, "step": 3630 }, { "epoch": 0.3349094683427517, "eval_GEN Loss": 0.4705427289009094, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.35791870951652527, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8482271432876587, "eval_runtime": 56.6399, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 3630 }, { "epoch": 0.3350017299042786, "grad_norm": 2.375203554586488, "learning_rate": 9.772600777454452e-07, "loss": 0.7267, "step": 3631 }, { "epoch": 0.33509399146580554, "grad_norm": 1.5536616085963402, "learning_rate": 9.771046459619185e-07, "loss": 0.7144, "step": 3632 }, { "epoch": 0.3351862530273325, "grad_norm": 2.492059887652298, "learning_rate": 9.769491822701144e-07, "loss": 0.8739, "step": 3633 }, { "epoch": 0.33527851458885943, "grad_norm": 1.7183116395532245, "learning_rate": 9.767936866841215e-07, "loss": 0.6874, "step": 3634 }, { "epoch": 0.33537077615038635, "grad_norm": 1.7403832046999108, "learning_rate": 9.76638159218031e-07, "loss": 0.7693, "step": 3635 }, { "epoch": 0.33537077615038635, "eval_GEN Loss": 0.4694426655769348, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3402249217033386, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8430889248847961, "eval_runtime": 56.7164, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3635 }, { "epoch": 0.33546303771191327, "grad_norm": 1.259890347045147, "learning_rate": 9.76482599885937e-07, "loss": 0.5989, "step": 3636 }, { "epoch": 0.3355552992734402, "grad_norm": 1.5214473482294408, "learning_rate": 9.763270087019366e-07, "loss": 0.5695, "step": 3637 }, { "epoch": 0.3356475608349671, "grad_norm": 2.1584421759239234, "learning_rate": 9.761713856801297e-07, "loss": 0.8237, "step": 3638 }, { "epoch": 0.3357398223964941, "grad_norm": 2.7809056361146203, "learning_rate": 9.76015730834619e-07, "loss": 0.8319, "step": 3639 }, { "epoch": 0.335832083958021, "grad_norm": 2.4080382572933536, "learning_rate": 9.758600441795104e-07, "loss": 0.7404, "step": 3640 }, { "epoch": 0.335832083958021, "eval_GEN Loss": 0.4696483612060547, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32540377974510193, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8377704620361328, "eval_runtime": 56.5814, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 3640 }, { "epoch": 0.3359243455195479, "grad_norm": 2.0434367395612214, "learning_rate": 9.75704325728912e-07, "loss": 0.727, "step": 3641 }, { "epoch": 0.33601660708107484, "grad_norm": 2.4873363449877135, "learning_rate": 9.75548575496936e-07, "loss": 0.6249, "step": 3642 }, { "epoch": 0.33610886864260175, "grad_norm": 1.7978561149299006, "learning_rate": 9.753927934976963e-07, "loss": 0.6698, "step": 3643 }, { "epoch": 0.33620113020412873, "grad_norm": 1.6167632990347218, "learning_rate": 9.752369797453098e-07, "loss": 0.625, "step": 3644 }, { "epoch": 0.33629339176565565, "grad_norm": 1.5494300264674061, "learning_rate": 9.75081134253897e-07, "loss": 0.6728, "step": 3645 }, { "epoch": 0.33629339176565565, "eval_GEN Loss": 0.46915918588638306, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.32989072799682617, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8176382184028625, "eval_runtime": 56.6609, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3645 }, { "epoch": 0.33638565332718257, "grad_norm": 1.8593922337502635, "learning_rate": 9.749252570375807e-07, "loss": 0.6463, "step": 3646 }, { "epoch": 0.3364779148887095, "grad_norm": 2.1989756024765894, "learning_rate": 9.747693481104871e-07, "loss": 0.7323, "step": 3647 }, { "epoch": 0.3365701764502364, "grad_norm": 1.6801286671949187, "learning_rate": 9.746134074867445e-07, "loss": 0.7104, "step": 3648 }, { "epoch": 0.3366624380117634, "grad_norm": 2.827493765635504, "learning_rate": 9.744574351804847e-07, "loss": 0.8494, "step": 3649 }, { "epoch": 0.3367546995732903, "grad_norm": 2.021652059715509, "learning_rate": 9.743014312058419e-07, "loss": 0.7701, "step": 3650 }, { "epoch": 0.3367546995732903, "eval_GEN Loss": 0.46834027767181396, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.35319727659225464, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8159555196762085, "eval_runtime": 55.7016, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3650 }, { "epoch": 0.3368469611348172, "grad_norm": 1.5189083616034036, "learning_rate": 9.741453955769537e-07, "loss": 0.5413, "step": 3651 }, { "epoch": 0.33693922269634413, "grad_norm": 2.198977083488279, "learning_rate": 9.739893283079602e-07, "loss": 0.5491, "step": 3652 }, { "epoch": 0.33703148425787105, "grad_norm": 2.098928406083978, "learning_rate": 9.738332294130042e-07, "loss": 0.8467, "step": 3653 }, { "epoch": 0.33712374581939797, "grad_norm": 2.177492651983075, "learning_rate": 9.736770989062323e-07, "loss": 0.6042, "step": 3654 }, { "epoch": 0.33721600738092494, "grad_norm": 1.915251927667097, "learning_rate": 9.735209368017925e-07, "loss": 0.8345, "step": 3655 }, { "epoch": 0.33721600738092494, "eval_GEN Loss": 0.46902939677238464, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.89171974522293, "eval_PRM F1 AUC": 0.8347302252488213, "eval_PRM F1 Neg": 0.6909090909090909, "eval_PRM Loss": 0.3785856068134308, "eval_PRM NPV": 0.59375, "eval_PRM Precision": 0.9459459459459459, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 0.828906238079071, "eval_runtime": 56.2284, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 3655 }, { "epoch": 0.33730826894245186, "grad_norm": 2.489470358440496, "learning_rate": 9.733647431138372e-07, "loss": 0.7829, "step": 3656 }, { "epoch": 0.3374005305039788, "grad_norm": 2.248705874883505, "learning_rate": 9.732085178565203e-07, "loss": 0.7285, "step": 3657 }, { "epoch": 0.3374927920655057, "grad_norm": 2.1206303218948874, "learning_rate": 9.730522610439993e-07, "loss": 0.7276, "step": 3658 }, { "epoch": 0.3375850536270326, "grad_norm": 1.904699035757697, "learning_rate": 9.72895972690435e-07, "loss": 0.5263, "step": 3659 }, { "epoch": 0.3376773151885596, "grad_norm": 1.7465993965482869, "learning_rate": 9.727396528099895e-07, "loss": 0.6408, "step": 3660 }, { "epoch": 0.3376773151885596, "eval_GEN Loss": 0.468569815158844, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8903225806451613, "eval_PRM F1 AUC": 0.8504452592980618, "eval_PRM F1 Neg": 0.7017543859649122, "eval_PRM Loss": 0.38954806327819824, "eval_PRM NPV": 0.5882352941176471, "eval_PRM Precision": 0.9583333333333334, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.8695652173913043, "eval_loss": 0.8366886973381042, "eval_runtime": 55.7754, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3660 }, { "epoch": 0.3377695767500865, "grad_norm": 1.7376465982070755, "learning_rate": 9.725833014168299e-07, "loss": 0.7115, "step": 3661 }, { "epoch": 0.3378618383116134, "grad_norm": 2.417376726737251, "learning_rate": 9.72426918525124e-07, "loss": 1.0539, "step": 3662 }, { "epoch": 0.33795409987314035, "grad_norm": 1.7637093071233916, "learning_rate": 9.72270504149044e-07, "loss": 0.6651, "step": 3663 }, { "epoch": 0.33804636143466726, "grad_norm": 1.565703912701807, "learning_rate": 9.721140583027642e-07, "loss": 0.7624, "step": 3664 }, { "epoch": 0.33813862299619424, "grad_norm": 2.122687048201629, "learning_rate": 9.719575810004622e-07, "loss": 0.9355, "step": 3665 }, { "epoch": 0.33813862299619424, "eval_GEN Loss": 0.46805840730667114, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.8974358974358975, "eval_PRM F1 AUC": 0.8564693556836039, "eval_PRM F1 Neg": 0.7142857142857143, "eval_PRM Loss": 0.3779523968696594, "eval_PRM NPV": 0.6060606060606061, "eval_PRM Precision": 0.958904109589041, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.8695652173913043, "eval_loss": 0.8263221383094788, "eval_runtime": 55.6559, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 3665 }, { "epoch": 0.33823088455772116, "grad_norm": 4.193905375584633, "learning_rate": 9.718010722563181e-07, "loss": 1.0032, "step": 3666 }, { "epoch": 0.3383231461192481, "grad_norm": 2.1995600724755193, "learning_rate": 9.716445320845147e-07, "loss": 0.7828, "step": 3667 }, { "epoch": 0.338415407680775, "grad_norm": 1.7227909694563461, "learning_rate": 9.714879604992386e-07, "loss": 0.73, "step": 3668 }, { "epoch": 0.3385076692423019, "grad_norm": 3.2031034818587494, "learning_rate": 9.71331357514678e-07, "loss": 0.8766, "step": 3669 }, { "epoch": 0.33859993080382883, "grad_norm": 2.2793518104362716, "learning_rate": 9.711747231450245e-07, "loss": 0.6005, "step": 3670 }, { "epoch": 0.33859993080382883, "eval_GEN Loss": 0.46660399436950684, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.35452428460121155, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8137319684028625, "eval_runtime": 55.8921, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3670 }, { "epoch": 0.3386921923653558, "grad_norm": 2.450212002364278, "learning_rate": 9.710180574044727e-07, "loss": 0.9707, "step": 3671 }, { "epoch": 0.3387844539268827, "grad_norm": 1.9184393432890179, "learning_rate": 9.7086136030722e-07, "loss": 0.7585, "step": 3672 }, { "epoch": 0.33887671548840964, "grad_norm": 1.5332319234122729, "learning_rate": 9.707046318674664e-07, "loss": 0.681, "step": 3673 }, { "epoch": 0.33896897704993656, "grad_norm": 1.7981134862562713, "learning_rate": 9.70547872099415e-07, "loss": 0.6154, "step": 3674 }, { "epoch": 0.3390612386114635, "grad_norm": 1.3864572001784805, "learning_rate": 9.703910810172714e-07, "loss": 0.6337, "step": 3675 }, { "epoch": 0.3390612386114635, "eval_GEN Loss": 0.4660557210445404, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3518015444278717, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8154447078704834, "eval_runtime": 56.1294, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 3675 }, { "epoch": 0.33915350017299045, "grad_norm": 1.8251635328400626, "learning_rate": 9.702342586352444e-07, "loss": 0.7104, "step": 3676 }, { "epoch": 0.33924576173451737, "grad_norm": 1.7706215082444872, "learning_rate": 9.700774049675456e-07, "loss": 0.7321, "step": 3677 }, { "epoch": 0.3393380232960443, "grad_norm": 1.363043612442319, "learning_rate": 9.699205200283893e-07, "loss": 0.658, "step": 3678 }, { "epoch": 0.3394302848575712, "grad_norm": 1.395396675215874, "learning_rate": 9.697636038319924e-07, "loss": 0.5778, "step": 3679 }, { "epoch": 0.3395225464190981, "grad_norm": 1.2753565109487026, "learning_rate": 9.69606656392575e-07, "loss": 0.5915, "step": 3680 }, { "epoch": 0.3395225464190981, "eval_GEN Loss": 0.46370846033096313, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3440261483192444, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8190504908561707, "eval_runtime": 56.0384, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 3680 }, { "epoch": 0.3396148079806251, "grad_norm": 1.5388305527427382, "learning_rate": 9.6944967772436e-07, "loss": 0.6732, "step": 3681 }, { "epoch": 0.339707069542152, "grad_norm": 2.5860578343426774, "learning_rate": 9.69292667841573e-07, "loss": 0.7758, "step": 3682 }, { "epoch": 0.33979933110367894, "grad_norm": 2.217120260060514, "learning_rate": 9.691356267584426e-07, "loss": 0.7643, "step": 3683 }, { "epoch": 0.33989159266520586, "grad_norm": 1.6719881907051264, "learning_rate": 9.689785544892e-07, "loss": 0.6452, "step": 3684 }, { "epoch": 0.3399838542267328, "grad_norm": 2.2701623261076125, "learning_rate": 9.688214510480792e-07, "loss": 0.9379, "step": 3685 }, { "epoch": 0.3399838542267328, "eval_GEN Loss": 0.4624996781349182, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3344188332557678, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8329927921295166, "eval_runtime": 55.8232, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3685 }, { "epoch": 0.3400761157882597, "grad_norm": 2.1755879254878963, "learning_rate": 9.686643164493176e-07, "loss": 0.8055, "step": 3686 }, { "epoch": 0.34016837734978667, "grad_norm": 2.186986244273936, "learning_rate": 9.685071507071546e-07, "loss": 0.7312, "step": 3687 }, { "epoch": 0.3402606389113136, "grad_norm": 2.4219525196443996, "learning_rate": 9.68349953835833e-07, "loss": 0.8389, "step": 3688 }, { "epoch": 0.3403529004728405, "grad_norm": 1.811163087316862, "learning_rate": 9.681927258495978e-07, "loss": 0.6604, "step": 3689 }, { "epoch": 0.3404451620343674, "grad_norm": 2.2280629579605535, "learning_rate": 9.68035466762698e-07, "loss": 0.7746, "step": 3690 }, { "epoch": 0.3404451620343674, "eval_GEN Loss": 0.4619635045528412, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3435130715370178, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8375601172447205, "eval_runtime": 55.8567, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3690 }, { "epoch": 0.34053742359589434, "grad_norm": 1.486801093589663, "learning_rate": 9.67878176589384e-07, "loss": 0.6528, "step": 3691 }, { "epoch": 0.3406296851574213, "grad_norm": 2.02550157026884, "learning_rate": 9.677208553439102e-07, "loss": 0.8417, "step": 3692 }, { "epoch": 0.34072194671894823, "grad_norm": 1.7136683126158871, "learning_rate": 9.675635030405328e-07, "loss": 0.6631, "step": 3693 }, { "epoch": 0.34081420828047515, "grad_norm": 1.8907001519565731, "learning_rate": 9.674061196935117e-07, "loss": 0.6518, "step": 3694 }, { "epoch": 0.34090646984200207, "grad_norm": 1.6914300147416752, "learning_rate": 9.67248705317109e-07, "loss": 0.6074, "step": 3695 }, { "epoch": 0.34090646984200207, "eval_GEN Loss": 0.46258804202079773, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3438650965690613, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8478966355323792, "eval_runtime": 56.0644, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 3695 }, { "epoch": 0.340998731403529, "grad_norm": 1.5959064666900813, "learning_rate": 9.670912599255897e-07, "loss": 0.6259, "step": 3696 }, { "epoch": 0.3410909929650559, "grad_norm": 2.026588840209758, "learning_rate": 9.669337835332223e-07, "loss": 0.5374, "step": 3697 }, { "epoch": 0.3411832545265829, "grad_norm": 2.0114116905077544, "learning_rate": 9.66776276154277e-07, "loss": 0.6961, "step": 3698 }, { "epoch": 0.3412755160881098, "grad_norm": 2.0283224825638366, "learning_rate": 9.666187378030278e-07, "loss": 0.5546, "step": 3699 }, { "epoch": 0.3413677776496367, "grad_norm": 2.928884210405768, "learning_rate": 9.66461168493751e-07, "loss": 0.9221, "step": 3700 }, { "epoch": 0.3413677776496367, "eval_GEN Loss": 0.46336492896080017, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33952993154525757, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8602163195610046, "eval_runtime": 55.9332, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3700 }, { "epoch": 0.34146003921116364, "grad_norm": 2.471443110899123, "learning_rate": 9.66303568240725e-07, "loss": 0.8619, "step": 3701 }, { "epoch": 0.34155230077269055, "grad_norm": 1.1715910962923328, "learning_rate": 9.66145937058233e-07, "loss": 0.553, "step": 3702 }, { "epoch": 0.3416445623342175, "grad_norm": 1.501347001425055, "learning_rate": 9.65988274960559e-07, "loss": 0.5746, "step": 3703 }, { "epoch": 0.34173682389574445, "grad_norm": 1.464144404758925, "learning_rate": 9.65830581961991e-07, "loss": 0.4682, "step": 3704 }, { "epoch": 0.34182908545727136, "grad_norm": 2.9602733712186162, "learning_rate": 9.656728580768188e-07, "loss": 0.9073, "step": 3705 }, { "epoch": 0.34182908545727136, "eval_GEN Loss": 0.4640003442764282, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3416084349155426, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8563100695610046, "eval_runtime": 55.9781, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3705 }, { "epoch": 0.3419213470187983, "grad_norm": 1.39742700047925, "learning_rate": 9.655151033193362e-07, "loss": 0.5994, "step": 3706 }, { "epoch": 0.3420136085803252, "grad_norm": 1.3997881250587596, "learning_rate": 9.653573177038392e-07, "loss": 0.5794, "step": 3707 }, { "epoch": 0.3421058701418522, "grad_norm": 1.9537256665259948, "learning_rate": 9.65199501244626e-07, "loss": 0.7756, "step": 3708 }, { "epoch": 0.3421981317033791, "grad_norm": 2.5251039110342335, "learning_rate": 9.650416539559987e-07, "loss": 0.7615, "step": 3709 }, { "epoch": 0.342290393264906, "grad_norm": 1.9751014507249347, "learning_rate": 9.648837758522614e-07, "loss": 0.5872, "step": 3710 }, { "epoch": 0.342290393264906, "eval_GEN Loss": 0.46506547927856445, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36560991406440735, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8573317527770996, "eval_runtime": 56.0097, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3710 }, { "epoch": 0.34238265482643293, "grad_norm": 2.274600642817432, "learning_rate": 9.647258669477213e-07, "loss": 0.8695, "step": 3711 }, { "epoch": 0.34247491638795985, "grad_norm": 1.91019450167604, "learning_rate": 9.645679272566883e-07, "loss": 0.7842, "step": 3712 }, { "epoch": 0.34256717794948677, "grad_norm": 1.5952385364835358, "learning_rate": 9.644099567934756e-07, "loss": 0.8352, "step": 3713 }, { "epoch": 0.34265943951101374, "grad_norm": 2.710953429833622, "learning_rate": 9.64251955572398e-07, "loss": 0.6237, "step": 3714 }, { "epoch": 0.34275170107254066, "grad_norm": 1.366794952745796, "learning_rate": 9.640939236077742e-07, "loss": 0.7175, "step": 3715 }, { "epoch": 0.34275170107254066, "eval_GEN Loss": 0.46673673391342163, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3873176872730255, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8762019276618958, "eval_runtime": 56.7214, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3715 }, { "epoch": 0.3428439626340676, "grad_norm": 3.2775756515553356, "learning_rate": 9.639358609139257e-07, "loss": 0.8002, "step": 3716 }, { "epoch": 0.3429362241955945, "grad_norm": 2.67874937881373, "learning_rate": 9.637777675051757e-07, "loss": 0.9112, "step": 3717 }, { "epoch": 0.3430284857571214, "grad_norm": 2.214272219994824, "learning_rate": 9.636196433958515e-07, "loss": 0.7867, "step": 3718 }, { "epoch": 0.3431207473186484, "grad_norm": 1.9175322900304457, "learning_rate": 9.634614886002817e-07, "loss": 0.8526, "step": 3719 }, { "epoch": 0.3432130088801753, "grad_norm": 1.9718312198041474, "learning_rate": 9.633033031327993e-07, "loss": 0.7541, "step": 3720 }, { "epoch": 0.3432130088801753, "eval_GEN Loss": 0.46820056438446045, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.4053679406642914, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.885817289352417, "eval_runtime": 55.9795, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3720 }, { "epoch": 0.3433052704417022, "grad_norm": 1.6607748272890903, "learning_rate": 9.63145087007739e-07, "loss": 0.6884, "step": 3721 }, { "epoch": 0.34339753200322914, "grad_norm": 1.8858171279161577, "learning_rate": 9.629868402394387e-07, "loss": 0.7745, "step": 3722 }, { "epoch": 0.34348979356475606, "grad_norm": 1.7962143787665013, "learning_rate": 9.62828562842239e-07, "loss": 0.9024, "step": 3723 }, { "epoch": 0.34358205512628304, "grad_norm": 2.544460439921917, "learning_rate": 9.626702548304832e-07, "loss": 0.7605, "step": 3724 }, { "epoch": 0.34367431668780996, "grad_norm": 2.881148068779642, "learning_rate": 9.625119162185173e-07, "loss": 0.7746, "step": 3725 }, { "epoch": 0.34367431668780996, "eval_GEN Loss": 0.4682743549346924, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.41063398122787476, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8886418342590332, "eval_runtime": 55.8897, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3725 }, { "epoch": 0.3437665782493369, "grad_norm": 2.211281306245446, "learning_rate": 9.623535470206905e-07, "loss": 0.905, "step": 3726 }, { "epoch": 0.3438588398108638, "grad_norm": 1.6261235331180999, "learning_rate": 9.62195147251354e-07, "loss": 0.658, "step": 3727 }, { "epoch": 0.3439511013723907, "grad_norm": 1.3763894325034005, "learning_rate": 9.620367169248628e-07, "loss": 0.5018, "step": 3728 }, { "epoch": 0.34404336293391763, "grad_norm": 1.6154059462172627, "learning_rate": 9.618782560555736e-07, "loss": 0.6924, "step": 3729 }, { "epoch": 0.3441356244954446, "grad_norm": 2.6467165804514696, "learning_rate": 9.617197646578466e-07, "loss": 0.7522, "step": 3730 }, { "epoch": 0.3441356244954446, "eval_GEN Loss": 0.468242347240448, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.4047353267669678, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8870792984962463, "eval_runtime": 55.8541, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3730 }, { "epoch": 0.3442278860569715, "grad_norm": 1.593684201672445, "learning_rate": 9.615612427460444e-07, "loss": 0.5861, "step": 3731 }, { "epoch": 0.34432014761849844, "grad_norm": 2.1543309100245502, "learning_rate": 9.61402690334533e-07, "loss": 0.7387, "step": 3732 }, { "epoch": 0.34441240918002536, "grad_norm": 1.4882698916355077, "learning_rate": 9.6124410743768e-07, "loss": 0.6851, "step": 3733 }, { "epoch": 0.3445046707415523, "grad_norm": 1.8572118230979693, "learning_rate": 9.610854940698568e-07, "loss": 0.5976, "step": 3734 }, { "epoch": 0.34459693230307925, "grad_norm": 1.6671442899708826, "learning_rate": 9.609268502454373e-07, "loss": 0.6387, "step": 3735 }, { "epoch": 0.34459693230307925, "eval_GEN Loss": 0.46616464853286743, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3937951624393463, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8822716474533081, "eval_runtime": 55.7213, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 3735 }, { "epoch": 0.34468919386460617, "grad_norm": 2.0680544806719037, "learning_rate": 9.607681759787976e-07, "loss": 0.5404, "step": 3736 }, { "epoch": 0.3447814554261331, "grad_norm": 1.772288908488974, "learning_rate": 9.606094712843173e-07, "loss": 0.7036, "step": 3737 }, { "epoch": 0.34487371698766, "grad_norm": 1.9102702479273743, "learning_rate": 9.604507361763787e-07, "loss": 0.6893, "step": 3738 }, { "epoch": 0.3449659785491869, "grad_norm": 1.7583148862631657, "learning_rate": 9.602919706693661e-07, "loss": 0.6487, "step": 3739 }, { "epoch": 0.3450582401107139, "grad_norm": 1.2407806825683938, "learning_rate": 9.601331747776673e-07, "loss": 0.5756, "step": 3740 }, { "epoch": 0.3450582401107139, "eval_GEN Loss": 0.4655279517173767, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3840682804584503, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8846153616905212, "eval_runtime": 55.8923, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3740 }, { "epoch": 0.3451505016722408, "grad_norm": 1.845289086473611, "learning_rate": 9.599743485156733e-07, "loss": 0.7607, "step": 3741 }, { "epoch": 0.34524276323376774, "grad_norm": 1.974588145971051, "learning_rate": 9.598154918977758e-07, "loss": 0.6877, "step": 3742 }, { "epoch": 0.34533502479529465, "grad_norm": 2.734223985194787, "learning_rate": 9.59656604938372e-07, "loss": 0.7999, "step": 3743 }, { "epoch": 0.3454272863568216, "grad_norm": 1.2711755505902111, "learning_rate": 9.594976876518595e-07, "loss": 0.661, "step": 3744 }, { "epoch": 0.3455195479183485, "grad_norm": 1.3860884880801732, "learning_rate": 9.593387400526401e-07, "loss": 0.5841, "step": 3745 }, { "epoch": 0.3455195479183485, "eval_GEN Loss": 0.46540525555610657, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3680097758769989, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8952524065971375, "eval_runtime": 55.8634, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3745 }, { "epoch": 0.34561180947987546, "grad_norm": 2.0360075972208596, "learning_rate": 9.59179762155118e-07, "loss": 0.9218, "step": 3746 }, { "epoch": 0.3457040710414024, "grad_norm": 1.9912416761743457, "learning_rate": 9.590207539736998e-07, "loss": 0.6224, "step": 3747 }, { "epoch": 0.3457963326029293, "grad_norm": 1.410263018673505, "learning_rate": 9.58861715522795e-07, "loss": 0.6918, "step": 3748 }, { "epoch": 0.3458885941644562, "grad_norm": 3.480801931827441, "learning_rate": 9.587026468168164e-07, "loss": 0.8224, "step": 3749 }, { "epoch": 0.34598085572598314, "grad_norm": 3.476373522330977, "learning_rate": 9.585435478701784e-07, "loss": 0.8239, "step": 3750 }, { "epoch": 0.34598085572598314, "eval_GEN Loss": 0.4648699164390564, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3654617369174957, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9065504670143127, "eval_runtime": 55.9693, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3750 }, { "epoch": 0.3460731172875101, "grad_norm": 2.2131471786098253, "learning_rate": 9.58384418697299e-07, "loss": 0.5293, "step": 3751 }, { "epoch": 0.34616537884903703, "grad_norm": 2.211190767403979, "learning_rate": 9.58225259312599e-07, "loss": 0.8615, "step": 3752 }, { "epoch": 0.34625764041056395, "grad_norm": 2.277051565992359, "learning_rate": 9.580660697305014e-07, "loss": 0.6596, "step": 3753 }, { "epoch": 0.34634990197209087, "grad_norm": 1.7825016885152825, "learning_rate": 9.579068499654324e-07, "loss": 0.6554, "step": 3754 }, { "epoch": 0.3464421635336178, "grad_norm": 1.5833402800799643, "learning_rate": 9.577476000318205e-07, "loss": 0.4765, "step": 3755 }, { "epoch": 0.3464421635336178, "eval_GEN Loss": 0.46510693430900574, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3725627660751343, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8920673131942749, "eval_runtime": 55.8662, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3755 }, { "epoch": 0.34653442509514476, "grad_norm": 1.7563207722624166, "learning_rate": 9.575883199440972e-07, "loss": 0.4881, "step": 3756 }, { "epoch": 0.3466266866566717, "grad_norm": 2.880408204576627, "learning_rate": 9.574290097166973e-07, "loss": 0.8167, "step": 3757 }, { "epoch": 0.3467189482181986, "grad_norm": 1.4951138351055484, "learning_rate": 9.57269669364057e-07, "loss": 0.7277, "step": 3758 }, { "epoch": 0.3468112097797255, "grad_norm": 2.755994265752733, "learning_rate": 9.571102989006162e-07, "loss": 0.8306, "step": 3759 }, { "epoch": 0.34690347134125243, "grad_norm": 3.5789846195289416, "learning_rate": 9.569508983408176e-07, "loss": 0.9367, "step": 3760 }, { "epoch": 0.34690347134125243, "eval_GEN Loss": 0.46539977192878723, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.39090612530708313, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8852163553237915, "eval_runtime": 55.9406, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3760 }, { "epoch": 0.34699573290277935, "grad_norm": 2.4155404325311904, "learning_rate": 9.56791467699106e-07, "loss": 0.6552, "step": 3761 }, { "epoch": 0.3470879944643063, "grad_norm": 1.5826400078873153, "learning_rate": 9.566320069899292e-07, "loss": 0.6167, "step": 3762 }, { "epoch": 0.34718025602583324, "grad_norm": 2.280185495672841, "learning_rate": 9.56472516227738e-07, "loss": 0.7432, "step": 3763 }, { "epoch": 0.34727251758736016, "grad_norm": 2.279201341934873, "learning_rate": 9.56312995426986e-07, "loss": 0.7819, "step": 3764 }, { "epoch": 0.3473647791488871, "grad_norm": 2.6630987225038747, "learning_rate": 9.561534446021283e-07, "loss": 0.9754, "step": 3765 }, { "epoch": 0.3473647791488871, "eval_GEN Loss": 0.4660956561565399, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.40761876106262207, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8894831538200378, "eval_runtime": 55.9735, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3765 }, { "epoch": 0.347457040710414, "grad_norm": 1.993435733786602, "learning_rate": 9.559938637676246e-07, "loss": 0.6586, "step": 3766 }, { "epoch": 0.347549302271941, "grad_norm": 2.533630176587448, "learning_rate": 9.558342529379359e-07, "loss": 0.8528, "step": 3767 }, { "epoch": 0.3476415638334679, "grad_norm": 2.5306174761243816, "learning_rate": 9.556746121275261e-07, "loss": 0.5803, "step": 3768 }, { "epoch": 0.3477338253949948, "grad_norm": 1.3563241511337962, "learning_rate": 9.555149413508627e-07, "loss": 0.6045, "step": 3769 }, { "epoch": 0.34782608695652173, "grad_norm": 1.3482186086924404, "learning_rate": 9.553552406224153e-07, "loss": 0.6691, "step": 3770 }, { "epoch": 0.34782608695652173, "eval_GEN Loss": 0.4648943245410919, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.41272056102752686, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8916466236114502, "eval_runtime": 56.9343, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3770 }, { "epoch": 0.34791834851804865, "grad_norm": 2.0529576917360686, "learning_rate": 9.551955099566558e-07, "loss": 0.7308, "step": 3771 }, { "epoch": 0.3480106100795756, "grad_norm": 2.4063712600360883, "learning_rate": 9.550357493680595e-07, "loss": 0.6653, "step": 3772 }, { "epoch": 0.34810287164110254, "grad_norm": 2.5305538893807475, "learning_rate": 9.548759588711041e-07, "loss": 0.7102, "step": 3773 }, { "epoch": 0.34819513320262946, "grad_norm": 2.1691344668854846, "learning_rate": 9.5471613848027e-07, "loss": 0.6277, "step": 3774 }, { "epoch": 0.3482873947641564, "grad_norm": 1.6769005741622578, "learning_rate": 9.545562882100406e-07, "loss": 0.7539, "step": 3775 }, { "epoch": 0.3482873947641564, "eval_GEN Loss": 0.46490785479545593, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3942284882068634, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8865384459495544, "eval_runtime": 55.8577, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3775 }, { "epoch": 0.3483796563256833, "grad_norm": 2.0073840928156366, "learning_rate": 9.543964080749017e-07, "loss": 0.7097, "step": 3776 }, { "epoch": 0.3484719178872102, "grad_norm": 2.1929671167175124, "learning_rate": 9.542364980893414e-07, "loss": 0.6984, "step": 3777 }, { "epoch": 0.3485641794487372, "grad_norm": 3.6134093049420746, "learning_rate": 9.54076558267852e-07, "loss": 0.9162, "step": 3778 }, { "epoch": 0.3486564410102641, "grad_norm": 2.037670869481623, "learning_rate": 9.539165886249262e-07, "loss": 0.7101, "step": 3779 }, { "epoch": 0.348748702571791, "grad_norm": 2.2242157983921924, "learning_rate": 9.537565891750619e-07, "loss": 0.6847, "step": 3780 }, { "epoch": 0.348748702571791, "eval_GEN Loss": 0.46401163935661316, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.39052385091781616, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8843749761581421, "eval_runtime": 55.8697, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3780 }, { "epoch": 0.34884096413331794, "grad_norm": 1.9904305979917003, "learning_rate": 9.53596559932758e-07, "loss": 0.7894, "step": 3781 }, { "epoch": 0.34893322569484486, "grad_norm": 1.9684031179267463, "learning_rate": 9.534365009125165e-07, "loss": 0.4988, "step": 3782 }, { "epoch": 0.34902548725637184, "grad_norm": 2.3661066800252395, "learning_rate": 9.532764121288423e-07, "loss": 0.6426, "step": 3783 }, { "epoch": 0.34911774881789875, "grad_norm": 1.990318659947277, "learning_rate": 9.531162935962432e-07, "loss": 0.7695, "step": 3784 }, { "epoch": 0.3492100103794257, "grad_norm": 1.9400922917227312, "learning_rate": 9.529561453292288e-07, "loss": 0.712, "step": 3785 }, { "epoch": 0.3492100103794257, "eval_GEN Loss": 0.4638323485851288, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3923055827617645, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8871995210647583, "eval_runtime": 55.7818, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 3785 }, { "epoch": 0.3493022719409526, "grad_norm": 1.6983564404606992, "learning_rate": 9.527959673423126e-07, "loss": 0.7138, "step": 3786 }, { "epoch": 0.3493945335024795, "grad_norm": 1.7608052182230653, "learning_rate": 9.526357596500097e-07, "loss": 0.8493, "step": 3787 }, { "epoch": 0.3494867950640065, "grad_norm": 2.095177570576328, "learning_rate": 9.524755222668383e-07, "loss": 0.5445, "step": 3788 }, { "epoch": 0.3495790566255334, "grad_norm": 2.1300396783995064, "learning_rate": 9.5231525520732e-07, "loss": 0.7375, "step": 3789 }, { "epoch": 0.3496713181870603, "grad_norm": 2.076996752497041, "learning_rate": 9.521549584859779e-07, "loss": 0.7043, "step": 3790 }, { "epoch": 0.3496713181870603, "eval_GEN Loss": 0.46403998136520386, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.40035301446914673, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8885817527770996, "eval_runtime": 55.9117, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3790 }, { "epoch": 0.34976357974858724, "grad_norm": 2.721758709724885, "learning_rate": 9.519946321173385e-07, "loss": 0.9223, "step": 3791 }, { "epoch": 0.34985584131011416, "grad_norm": 1.5456915103968132, "learning_rate": 9.518342761159307e-07, "loss": 0.6306, "step": 3792 }, { "epoch": 0.3499481028716411, "grad_norm": 1.9476559346686992, "learning_rate": 9.516738904962867e-07, "loss": 0.622, "step": 3793 }, { "epoch": 0.35004036443316805, "grad_norm": 1.8450391455544923, "learning_rate": 9.515134752729405e-07, "loss": 0.8644, "step": 3794 }, { "epoch": 0.35013262599469497, "grad_norm": 2.0371267793957806, "learning_rate": 9.51353030460429e-07, "loss": 0.7757, "step": 3795 }, { "epoch": 0.35013262599469497, "eval_GEN Loss": 0.46473821997642517, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.39523544907569885, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8787259459495544, "eval_runtime": 56.8412, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3795 }, { "epoch": 0.3502248875562219, "grad_norm": 2.100192006301843, "learning_rate": 9.511925560732924e-07, "loss": 0.6447, "step": 3796 }, { "epoch": 0.3503171491177488, "grad_norm": 1.4656661365226142, "learning_rate": 9.510320521260728e-07, "loss": 0.6536, "step": 3797 }, { "epoch": 0.3504094106792757, "grad_norm": 1.9324349060004573, "learning_rate": 9.508715186333156e-07, "loss": 0.8792, "step": 3798 }, { "epoch": 0.3505016722408027, "grad_norm": 1.9929081691027095, "learning_rate": 9.507109556095682e-07, "loss": 0.7737, "step": 3799 }, { "epoch": 0.3505939338023296, "grad_norm": 2.4839335273626837, "learning_rate": 9.505503630693816e-07, "loss": 0.9378, "step": 3800 }, { "epoch": 0.3505939338023296, "eval_GEN Loss": 0.4664175510406494, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.4022744596004486, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8781850934028625, "eval_runtime": 56.1148, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 3800 }, { "epoch": 0.35068619536385653, "grad_norm": 2.151126844136183, "learning_rate": 9.503897410273085e-07, "loss": 0.7538, "step": 3801 }, { "epoch": 0.35077845692538345, "grad_norm": 1.7029214297304305, "learning_rate": 9.502290894979049e-07, "loss": 0.7354, "step": 3802 }, { "epoch": 0.35087071848691037, "grad_norm": 3.72531159054256, "learning_rate": 9.500684084957293e-07, "loss": 0.8023, "step": 3803 }, { "epoch": 0.35096298004843735, "grad_norm": 2.883998651974907, "learning_rate": 9.49907698035343e-07, "loss": 0.8637, "step": 3804 }, { "epoch": 0.35105524160996426, "grad_norm": 2.5533777808372102, "learning_rate": 9.497469581313096e-07, "loss": 0.6717, "step": 3805 }, { "epoch": 0.35105524160996426, "eval_GEN Loss": 0.4656904339790344, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8535031847133758, "eval_PRM F1 AUC": 0.751440544787847, "eval_PRM F1 Neg": 0.5818181818181818, "eval_PRM Loss": 0.410686194896698, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9054054054054054, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8751803040504456, "eval_runtime": 55.9079, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3805 }, { "epoch": 0.3511475031714912, "grad_norm": 1.6926813226920387, "learning_rate": 9.495861887981955e-07, "loss": 0.8087, "step": 3806 }, { "epoch": 0.3512397647330181, "grad_norm": 1.2478912525061865, "learning_rate": 9.494253900505704e-07, "loss": 0.5283, "step": 3807 }, { "epoch": 0.351332026294545, "grad_norm": 1.8740959615924406, "learning_rate": 9.492645619030057e-07, "loss": 0.642, "step": 3808 }, { "epoch": 0.35142428785607194, "grad_norm": 2.04318850754419, "learning_rate": 9.491037043700759e-07, "loss": 0.5957, "step": 3809 }, { "epoch": 0.3515165494175989, "grad_norm": 1.899982599882739, "learning_rate": 9.489428174663584e-07, "loss": 0.7386, "step": 3810 }, { "epoch": 0.3515165494175989, "eval_GEN Loss": 0.4658967852592468, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4093562066555023, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8658654093742371, "eval_runtime": 56.707, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3810 }, { "epoch": 0.35160881097912583, "grad_norm": 2.5564895762346453, "learning_rate": 9.487819012064326e-07, "loss": 0.9171, "step": 3811 }, { "epoch": 0.35170107254065275, "grad_norm": 2.1461505395937053, "learning_rate": 9.486209556048816e-07, "loss": 0.6051, "step": 3812 }, { "epoch": 0.35179333410217967, "grad_norm": 1.9175809793688028, "learning_rate": 9.4845998067629e-07, "loss": 0.7453, "step": 3813 }, { "epoch": 0.3518855956637066, "grad_norm": 1.7937262195464165, "learning_rate": 9.48298976435246e-07, "loss": 0.7153, "step": 3814 }, { "epoch": 0.35197785722523356, "grad_norm": 1.6516314850301779, "learning_rate": 9.481379428963397e-07, "loss": 0.7662, "step": 3815 }, { "epoch": 0.35197785722523356, "eval_GEN Loss": 0.463291198015213, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38919463753700256, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8502404093742371, "eval_runtime": 56.6495, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3815 }, { "epoch": 0.3520701187867605, "grad_norm": 1.6259084608320094, "learning_rate": 9.479768800741646e-07, "loss": 0.84, "step": 3816 }, { "epoch": 0.3521623803482874, "grad_norm": 2.452537410992221, "learning_rate": 9.47815787983316e-07, "loss": 0.8509, "step": 3817 }, { "epoch": 0.3522546419098143, "grad_norm": 2.069276426972907, "learning_rate": 9.476546666383928e-07, "loss": 0.6947, "step": 3818 }, { "epoch": 0.35234690347134123, "grad_norm": 2.4313907613121177, "learning_rate": 9.474935160539955e-07, "loss": 0.9207, "step": 3819 }, { "epoch": 0.3524391650328682, "grad_norm": 2.635050207075767, "learning_rate": 9.473323362447286e-07, "loss": 0.7986, "step": 3820 }, { "epoch": 0.3524391650328682, "eval_GEN Loss": 0.46222686767578125, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.37923020124435425, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8461538553237915, "eval_runtime": 55.8756, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3820 }, { "epoch": 0.3525314265943951, "grad_norm": 1.8978964523398498, "learning_rate": 9.47171127225198e-07, "loss": 0.8523, "step": 3821 }, { "epoch": 0.35262368815592204, "grad_norm": 1.614683666230754, "learning_rate": 9.470098890100124e-07, "loss": 0.6918, "step": 3822 }, { "epoch": 0.35271594971744896, "grad_norm": 1.6858822643243787, "learning_rate": 9.46848621613784e-07, "loss": 0.8118, "step": 3823 }, { "epoch": 0.3528082112789759, "grad_norm": 1.3720323494444129, "learning_rate": 9.466873250511269e-07, "loss": 0.5211, "step": 3824 }, { "epoch": 0.3529004728405028, "grad_norm": 3.001293814190167, "learning_rate": 9.46525999336658e-07, "loss": 0.8726, "step": 3825 }, { "epoch": 0.3529004728405028, "eval_GEN Loss": 0.4613455533981323, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3843279182910919, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8443509340286255, "eval_runtime": 55.8878, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3825 }, { "epoch": 0.3529927344020298, "grad_norm": 1.6061883282502658, "learning_rate": 9.463646444849971e-07, "loss": 0.6558, "step": 3826 }, { "epoch": 0.3530849959635567, "grad_norm": 2.499435859612238, "learning_rate": 9.46203260510766e-07, "loss": 0.6363, "step": 3827 }, { "epoch": 0.3531772575250836, "grad_norm": 2.466810532714648, "learning_rate": 9.460418474285901e-07, "loss": 0.7952, "step": 3828 }, { "epoch": 0.35326951908661053, "grad_norm": 1.7470667316172535, "learning_rate": 9.458804052530966e-07, "loss": 0.7722, "step": 3829 }, { "epoch": 0.35336178064813745, "grad_norm": 1.4695160320235972, "learning_rate": 9.457189339989158e-07, "loss": 0.6944, "step": 3830 }, { "epoch": 0.35336178064813745, "eval_GEN Loss": 0.461611270904541, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.39079543948173523, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8508413434028625, "eval_runtime": 56.066, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 3830 }, { "epoch": 0.3534540422096644, "grad_norm": 1.5954380009008133, "learning_rate": 9.455574336806803e-07, "loss": 0.7239, "step": 3831 }, { "epoch": 0.35354630377119134, "grad_norm": 2.5123736388523277, "learning_rate": 9.453959043130255e-07, "loss": 0.7351, "step": 3832 }, { "epoch": 0.35363856533271826, "grad_norm": 1.332911708200968, "learning_rate": 9.452343459105898e-07, "loss": 0.5641, "step": 3833 }, { "epoch": 0.3537308268942452, "grad_norm": 1.4504415008958897, "learning_rate": 9.450727584880134e-07, "loss": 0.7043, "step": 3834 }, { "epoch": 0.3538230884557721, "grad_norm": 1.3033330344002674, "learning_rate": 9.449111420599398e-07, "loss": 0.6206, "step": 3835 }, { "epoch": 0.3538230884557721, "eval_GEN Loss": 0.4629392623901367, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.38266974687576294, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8508413434028625, "eval_runtime": 55.9445, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3835 }, { "epoch": 0.35391535001729907, "grad_norm": 2.173836572408765, "learning_rate": 9.447494966410151e-07, "loss": 0.7043, "step": 3836 }, { "epoch": 0.354007611578826, "grad_norm": 1.9238904080345363, "learning_rate": 9.445878222458876e-07, "loss": 0.5655, "step": 3837 }, { "epoch": 0.3540998731403529, "grad_norm": 2.7406387439384097, "learning_rate": 9.444261188892086e-07, "loss": 0.7306, "step": 3838 }, { "epoch": 0.3541921347018798, "grad_norm": 1.7635468735584554, "learning_rate": 9.44264386585632e-07, "loss": 0.7511, "step": 3839 }, { "epoch": 0.35428439626340674, "grad_norm": 1.9160124904326394, "learning_rate": 9.44102625349814e-07, "loss": 0.7338, "step": 3840 }, { "epoch": 0.35428439626340674, "eval_GEN Loss": 0.461733341217041, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36684173345565796, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8509014248847961, "eval_runtime": 56.9064, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3840 }, { "epoch": 0.35437665782493366, "grad_norm": 1.8609823494273454, "learning_rate": 9.439408351964141e-07, "loss": 0.8417, "step": 3841 }, { "epoch": 0.35446891938646063, "grad_norm": 1.815245733887611, "learning_rate": 9.437790161400934e-07, "loss": 0.6562, "step": 3842 }, { "epoch": 0.35456118094798755, "grad_norm": 2.025458500947324, "learning_rate": 9.436171681955167e-07, "loss": 0.674, "step": 3843 }, { "epoch": 0.35465344250951447, "grad_norm": 2.2212581093030765, "learning_rate": 9.434552913773506e-07, "loss": 0.784, "step": 3844 }, { "epoch": 0.3547457040710414, "grad_norm": 2.529955778467214, "learning_rate": 9.432933857002649e-07, "loss": 0.8232, "step": 3845 }, { "epoch": 0.3547457040710414, "eval_GEN Loss": 0.46213412284851074, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3619709312915802, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8529447317123413, "eval_runtime": 56.8045, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3845 }, { "epoch": 0.3548379656325683, "grad_norm": 2.8878755615180696, "learning_rate": 9.431314511789314e-07, "loss": 0.7746, "step": 3846 }, { "epoch": 0.3549302271940953, "grad_norm": 1.9593453625378463, "learning_rate": 9.429694878280252e-07, "loss": 0.7861, "step": 3847 }, { "epoch": 0.3550224887556222, "grad_norm": 1.7402377194876628, "learning_rate": 9.428074956622234e-07, "loss": 0.7562, "step": 3848 }, { "epoch": 0.3551147503171491, "grad_norm": 2.8108155560139965, "learning_rate": 9.42645474696206e-07, "loss": 0.7331, "step": 3849 }, { "epoch": 0.35520701187867604, "grad_norm": 1.953666290338613, "learning_rate": 9.42483424944656e-07, "loss": 0.6774, "step": 3850 }, { "epoch": 0.35520701187867604, "eval_GEN Loss": 0.46292129158973694, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3741525709629059, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8564302921295166, "eval_runtime": 55.8635, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3850 }, { "epoch": 0.35529927344020296, "grad_norm": 3.6255077078826496, "learning_rate": 9.42321346422258e-07, "loss": 0.8206, "step": 3851 }, { "epoch": 0.35539153500172993, "grad_norm": 1.6079824700403849, "learning_rate": 9.421592391437002e-07, "loss": 0.6385, "step": 3852 }, { "epoch": 0.35548379656325685, "grad_norm": 2.1655772457246814, "learning_rate": 9.419971031236731e-07, "loss": 0.9775, "step": 3853 }, { "epoch": 0.35557605812478377, "grad_norm": 1.8286955908035634, "learning_rate": 9.418349383768693e-07, "loss": 0.8645, "step": 3854 }, { "epoch": 0.3556683196863107, "grad_norm": 1.6657469796828948, "learning_rate": 9.416727449179849e-07, "loss": 0.5622, "step": 3855 }, { "epoch": 0.3556683196863107, "eval_GEN Loss": 0.4636772572994232, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3858485221862793, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8675480484962463, "eval_runtime": 55.8769, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3855 }, { "epoch": 0.3557605812478376, "grad_norm": 2.1092599758930834, "learning_rate": 9.41510522761718e-07, "loss": 0.9397, "step": 3856 }, { "epoch": 0.3558528428093645, "grad_norm": 1.6385850685683812, "learning_rate": 9.413482719227693e-07, "loss": 0.7014, "step": 3857 }, { "epoch": 0.3559451043708915, "grad_norm": 2.1391797324635426, "learning_rate": 9.41185992415842e-07, "loss": 0.7022, "step": 3858 }, { "epoch": 0.3560373659324184, "grad_norm": 1.6717476091751462, "learning_rate": 9.410236842556425e-07, "loss": 0.6209, "step": 3859 }, { "epoch": 0.35612962749394533, "grad_norm": 1.737214758222355, "learning_rate": 9.408613474568792e-07, "loss": 0.6674, "step": 3860 }, { "epoch": 0.35612962749394533, "eval_GEN Loss": 0.46808555722236633, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.39053481817245483, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8746995329856873, "eval_runtime": 55.8204, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 3860 }, { "epoch": 0.35622188905547225, "grad_norm": 1.634835933116288, "learning_rate": 9.406989820342635e-07, "loss": 0.7859, "step": 3861 }, { "epoch": 0.35631415061699917, "grad_norm": 2.1055771986113143, "learning_rate": 9.405365880025094e-07, "loss": 0.6726, "step": 3862 }, { "epoch": 0.35640641217852614, "grad_norm": 2.431314053750086, "learning_rate": 9.403741653763326e-07, "loss": 0.7384, "step": 3863 }, { "epoch": 0.35649867374005306, "grad_norm": 3.055052876372201, "learning_rate": 9.402117141704528e-07, "loss": 0.882, "step": 3864 }, { "epoch": 0.35659093530158, "grad_norm": 2.2987037223477986, "learning_rate": 9.400492343995913e-07, "loss": 0.6937, "step": 3865 }, { "epoch": 0.35659093530158, "eval_GEN Loss": 0.46811652183532715, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3976913392543793, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8783053159713745, "eval_runtime": 55.9134, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3865 }, { "epoch": 0.3566831968631069, "grad_norm": 1.88775680309827, "learning_rate": 9.398867260784722e-07, "loss": 0.7951, "step": 3866 }, { "epoch": 0.3567754584246338, "grad_norm": 2.757702026301362, "learning_rate": 9.397241892218224e-07, "loss": 0.7589, "step": 3867 }, { "epoch": 0.3568677199861608, "grad_norm": 1.4183440981857498, "learning_rate": 9.395616238443711e-07, "loss": 0.6209, "step": 3868 }, { "epoch": 0.3569599815476877, "grad_norm": 2.116785998997551, "learning_rate": 9.393990299608505e-07, "loss": 0.4923, "step": 3869 }, { "epoch": 0.35705224310921463, "grad_norm": 2.0178708897587248, "learning_rate": 9.392364075859947e-07, "loss": 0.8115, "step": 3870 }, { "epoch": 0.35705224310921463, "eval_GEN Loss": 0.46893763542175293, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38415005803108215, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8784855604171753, "eval_runtime": 56.6675, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 3870 }, { "epoch": 0.35714450467074155, "grad_norm": 1.9452389432296426, "learning_rate": 9.390737567345412e-07, "loss": 0.6038, "step": 3871 }, { "epoch": 0.35723676623226847, "grad_norm": 2.6029200983402556, "learning_rate": 9.389110774212292e-07, "loss": 0.8236, "step": 3872 }, { "epoch": 0.3573290277937954, "grad_norm": 2.134219518901736, "learning_rate": 9.387483696608017e-07, "loss": 0.6429, "step": 3873 }, { "epoch": 0.35742128935532236, "grad_norm": 1.2882575551910274, "learning_rate": 9.385856334680028e-07, "loss": 0.5704, "step": 3874 }, { "epoch": 0.3575135509168493, "grad_norm": 2.2756337927689088, "learning_rate": 9.384228688575804e-07, "loss": 0.7023, "step": 3875 }, { "epoch": 0.3575135509168493, "eval_GEN Loss": 0.4678434431552887, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3739252984523773, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8676081895828247, "eval_runtime": 56.8406, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3875 }, { "epoch": 0.3576058124783762, "grad_norm": 3.145844345187359, "learning_rate": 9.382600758442842e-07, "loss": 0.8728, "step": 3876 }, { "epoch": 0.3576980740399031, "grad_norm": 2.7632525316118164, "learning_rate": 9.380972544428668e-07, "loss": 0.8656, "step": 3877 }, { "epoch": 0.35779033560143003, "grad_norm": 1.8978531612523957, "learning_rate": 9.379344046680834e-07, "loss": 0.5401, "step": 3878 }, { "epoch": 0.357882597162957, "grad_norm": 2.388514387758438, "learning_rate": 9.377715265346918e-07, "loss": 0.6398, "step": 3879 }, { "epoch": 0.3579748587244839, "grad_norm": 1.8780245639190891, "learning_rate": 9.376086200574521e-07, "loss": 0.6647, "step": 3880 }, { "epoch": 0.3579748587244839, "eval_GEN Loss": 0.46916478872299194, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3886345326900482, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8644831776618958, "eval_runtime": 56.9015, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3880 }, { "epoch": 0.35806712028601084, "grad_norm": 2.009493156742869, "learning_rate": 9.374456852511271e-07, "loss": 0.6761, "step": 3881 }, { "epoch": 0.35815938184753776, "grad_norm": 1.7169391858657355, "learning_rate": 9.372827221304824e-07, "loss": 0.7489, "step": 3882 }, { "epoch": 0.3582516434090647, "grad_norm": 1.477651972755526, "learning_rate": 9.371197307102858e-07, "loss": 0.7054, "step": 3883 }, { "epoch": 0.35834390497059165, "grad_norm": 1.4775545777510137, "learning_rate": 9.369567110053079e-07, "loss": 0.659, "step": 3884 }, { "epoch": 0.35843616653211857, "grad_norm": 2.361819598256709, "learning_rate": 9.367936630303219e-07, "loss": 0.6494, "step": 3885 }, { "epoch": 0.35843616653211857, "eval_GEN Loss": 0.4692051410675049, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.3907117545604706, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8585336804389954, "eval_runtime": 56.947, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3885 }, { "epoch": 0.3585284280936455, "grad_norm": 2.1015243521485867, "learning_rate": 9.366305868001032e-07, "loss": 0.6841, "step": 3886 }, { "epoch": 0.3586206896551724, "grad_norm": 1.5275645613236177, "learning_rate": 9.364674823294305e-07, "loss": 0.7102, "step": 3887 }, { "epoch": 0.3587129512166993, "grad_norm": 1.694547908499395, "learning_rate": 9.363043496330841e-07, "loss": 0.6289, "step": 3888 }, { "epoch": 0.35880521277822625, "grad_norm": 2.6472250028389914, "learning_rate": 9.361411887258478e-07, "loss": 0.7378, "step": 3889 }, { "epoch": 0.3588974743397532, "grad_norm": 2.0570534130896982, "learning_rate": 9.359779996225069e-07, "loss": 0.849, "step": 3890 }, { "epoch": 0.3588974743397532, "eval_GEN Loss": 0.4700799286365509, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3856019377708435, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8542067408561707, "eval_runtime": 55.9946, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3890 }, { "epoch": 0.35898973590128014, "grad_norm": 2.4627103209735792, "learning_rate": 9.358147823378504e-07, "loss": 0.7538, "step": 3891 }, { "epoch": 0.35908199746280706, "grad_norm": 1.889462017915708, "learning_rate": 9.356515368866691e-07, "loss": 0.7394, "step": 3892 }, { "epoch": 0.359174259024334, "grad_norm": 1.5176644901269198, "learning_rate": 9.354882632837564e-07, "loss": 0.6269, "step": 3893 }, { "epoch": 0.3592665205858609, "grad_norm": 2.443968729888847, "learning_rate": 9.353249615439086e-07, "loss": 0.8084, "step": 3894 }, { "epoch": 0.35935878214738787, "grad_norm": 1.6250856842066927, "learning_rate": 9.351616316819244e-07, "loss": 0.6622, "step": 3895 }, { "epoch": 0.35935878214738787, "eval_GEN Loss": 0.4713021218776703, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.389230340719223, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8591646552085876, "eval_runtime": 56.9, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3895 }, { "epoch": 0.3594510437089148, "grad_norm": 2.135737398545149, "learning_rate": 9.349982737126049e-07, "loss": 0.8483, "step": 3896 }, { "epoch": 0.3595433052704417, "grad_norm": 3.0544410601012912, "learning_rate": 9.348348876507539e-07, "loss": 0.997, "step": 3897 }, { "epoch": 0.3596355668319686, "grad_norm": 1.7750545970717169, "learning_rate": 9.346714735111777e-07, "loss": 0.7438, "step": 3898 }, { "epoch": 0.35972782839349554, "grad_norm": 2.354262303495788, "learning_rate": 9.345080313086852e-07, "loss": 0.9604, "step": 3899 }, { "epoch": 0.3598200899550225, "grad_norm": 1.5586055281824707, "learning_rate": 9.343445610580876e-07, "loss": 0.5026, "step": 3900 }, { "epoch": 0.3598200899550225, "eval_GEN Loss": 0.4718244969844818, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3874286711215973, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8618389368057251, "eval_runtime": 55.9624, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 3900 }, { "epoch": 0.35991235151654943, "grad_norm": 2.532291224005924, "learning_rate": 9.34181062774199e-07, "loss": 0.8086, "step": 3901 }, { "epoch": 0.36000461307807635, "grad_norm": 1.4441988268323078, "learning_rate": 9.34017536471836e-07, "loss": 0.769, "step": 3902 }, { "epoch": 0.36009687463960327, "grad_norm": 1.5550775104131975, "learning_rate": 9.338539821658173e-07, "loss": 0.6358, "step": 3903 }, { "epoch": 0.3601891362011302, "grad_norm": 2.1635188110029695, "learning_rate": 9.336903998709645e-07, "loss": 0.8817, "step": 3904 }, { "epoch": 0.3602813977626571, "grad_norm": 2.2757405363598853, "learning_rate": 9.33526789602102e-07, "loss": 0.8107, "step": 3905 }, { "epoch": 0.3602813977626571, "eval_GEN Loss": 0.47220349311828613, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3897966742515564, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8663762211799622, "eval_runtime": 55.8937, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3905 }, { "epoch": 0.3603736593241841, "grad_norm": 2.2308007808204837, "learning_rate": 9.33363151374056e-07, "loss": 0.8066, "step": 3906 }, { "epoch": 0.360465920885711, "grad_norm": 1.3362641067355674, "learning_rate": 9.331994852016558e-07, "loss": 0.4111, "step": 3907 }, { "epoch": 0.3605581824472379, "grad_norm": 2.5460885774899906, "learning_rate": 9.330357910997333e-07, "loss": 0.6938, "step": 3908 }, { "epoch": 0.36065044400876484, "grad_norm": 2.2605960671612153, "learning_rate": 9.328720690831225e-07, "loss": 0.772, "step": 3909 }, { "epoch": 0.36074270557029176, "grad_norm": 1.792022086468857, "learning_rate": 9.327083191666603e-07, "loss": 0.8155, "step": 3910 }, { "epoch": 0.36074270557029176, "eval_GEN Loss": 0.4752283990383148, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.39145511388778687, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8692908883094788, "eval_runtime": 55.8883, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 3910 }, { "epoch": 0.36083496713181873, "grad_norm": 1.9763901690157581, "learning_rate": 9.325445413651857e-07, "loss": 0.7397, "step": 3911 }, { "epoch": 0.36092722869334565, "grad_norm": 2.225812758965922, "learning_rate": 9.323807356935408e-07, "loss": 0.7975, "step": 3912 }, { "epoch": 0.36101949025487257, "grad_norm": 1.4682897173636202, "learning_rate": 9.322169021665697e-07, "loss": 0.6978, "step": 3913 }, { "epoch": 0.3611117518163995, "grad_norm": 1.9344383215245098, "learning_rate": 9.320530407991195e-07, "loss": 0.7764, "step": 3914 }, { "epoch": 0.3612040133779264, "grad_norm": 1.2722725998123767, "learning_rate": 9.318891516060394e-07, "loss": 0.5773, "step": 3915 }, { "epoch": 0.3612040133779264, "eval_GEN Loss": 0.4741431474685669, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.38687625527381897, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8719651699066162, "eval_runtime": 55.7692, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 3915 }, { "epoch": 0.3612962749394534, "grad_norm": 1.8212294838929985, "learning_rate": 9.317252346021813e-07, "loss": 0.5912, "step": 3916 }, { "epoch": 0.3613885365009803, "grad_norm": 1.7452254458039675, "learning_rate": 9.315612898023996e-07, "loss": 0.6987, "step": 3917 }, { "epoch": 0.3614807980625072, "grad_norm": 1.31477492305167, "learning_rate": 9.313973172215512e-07, "loss": 0.6211, "step": 3918 }, { "epoch": 0.36157305962403413, "grad_norm": 2.0074989374716616, "learning_rate": 9.31233316874496e-07, "loss": 0.8034, "step": 3919 }, { "epoch": 0.36166532118556105, "grad_norm": 1.6624007379242667, "learning_rate": 9.310692887760953e-07, "loss": 0.6212, "step": 3920 }, { "epoch": 0.36166532118556105, "eval_GEN Loss": 0.4754544496536255, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.38960573077201843, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8695312738418579, "eval_runtime": 55.9215, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3920 }, { "epoch": 0.36175758274708797, "grad_norm": 2.9188768585500684, "learning_rate": 9.30905232941214e-07, "loss": 0.6554, "step": 3921 }, { "epoch": 0.36184984430861494, "grad_norm": 2.8486299249502864, "learning_rate": 9.307411493847189e-07, "loss": 0.7328, "step": 3922 }, { "epoch": 0.36194210587014186, "grad_norm": 3.0359147936149955, "learning_rate": 9.305770381214797e-07, "loss": 0.9836, "step": 3923 }, { "epoch": 0.3620343674316688, "grad_norm": 2.232953980129854, "learning_rate": 9.304128991663682e-07, "loss": 0.7897, "step": 3924 }, { "epoch": 0.3621266289931957, "grad_norm": 2.5579285213508447, "learning_rate": 9.302487325342592e-07, "loss": 0.8184, "step": 3925 }, { "epoch": 0.3621266289931957, "eval_GEN Loss": 0.4731970429420471, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3874712586402893, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8670673370361328, "eval_runtime": 55.9538, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3925 }, { "epoch": 0.3622188905547226, "grad_norm": 1.544779658763646, "learning_rate": 9.300845382400295e-07, "loss": 0.6434, "step": 3926 }, { "epoch": 0.3623111521162496, "grad_norm": 2.533379720921697, "learning_rate": 9.299203162985588e-07, "loss": 0.814, "step": 3927 }, { "epoch": 0.3624034136777765, "grad_norm": 2.0187043322722165, "learning_rate": 9.297560667247291e-07, "loss": 0.6568, "step": 3928 }, { "epoch": 0.3624956752393034, "grad_norm": 2.1658462527501814, "learning_rate": 9.295917895334247e-07, "loss": 0.8179, "step": 3929 }, { "epoch": 0.36258793680083035, "grad_norm": 1.8097854359582977, "learning_rate": 9.294274847395333e-07, "loss": 0.6307, "step": 3930 }, { "epoch": 0.36258793680083035, "eval_GEN Loss": 0.47248291969299316, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3808736503124237, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8524940013885498, "eval_runtime": 55.9452, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3930 }, { "epoch": 0.36268019836235726, "grad_norm": 3.1236716350800844, "learning_rate": 9.292631523579436e-07, "loss": 0.8585, "step": 3931 }, { "epoch": 0.36277245992388424, "grad_norm": 1.7941913378758887, "learning_rate": 9.290987924035483e-07, "loss": 0.7959, "step": 3932 }, { "epoch": 0.36286472148541116, "grad_norm": 1.5539593321714393, "learning_rate": 9.289344048912419e-07, "loss": 0.5842, "step": 3933 }, { "epoch": 0.3629569830469381, "grad_norm": 1.6377698814107418, "learning_rate": 9.287699898359212e-07, "loss": 0.5516, "step": 3934 }, { "epoch": 0.363049244608465, "grad_norm": 1.5011577632910293, "learning_rate": 9.28605547252486e-07, "loss": 0.493, "step": 3935 }, { "epoch": 0.363049244608465, "eval_GEN Loss": 0.4696495532989502, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3636634349822998, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8429387211799622, "eval_runtime": 55.9414, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 3935 }, { "epoch": 0.3631415061699919, "grad_norm": 2.185620317280508, "learning_rate": 9.284410771558381e-07, "loss": 0.64, "step": 3936 }, { "epoch": 0.36323376773151883, "grad_norm": 1.1611957577343748, "learning_rate": 9.282765795608823e-07, "loss": 0.5867, "step": 3937 }, { "epoch": 0.3633260292930458, "grad_norm": 2.29939808391568, "learning_rate": 9.281120544825253e-07, "loss": 0.7806, "step": 3938 }, { "epoch": 0.3634182908545727, "grad_norm": 1.7476494741268465, "learning_rate": 9.27947501935677e-07, "loss": 0.6418, "step": 3939 }, { "epoch": 0.36351055241609964, "grad_norm": 1.832308747311918, "learning_rate": 9.277829219352492e-07, "loss": 0.7227, "step": 3940 }, { "epoch": 0.36351055241609964, "eval_GEN Loss": 0.4686095714569092, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.35803502798080444, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8316105604171753, "eval_runtime": 56.9301, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3940 }, { "epoch": 0.36360281397762656, "grad_norm": 1.756504456086922, "learning_rate": 9.276183144961563e-07, "loss": 0.5178, "step": 3941 }, { "epoch": 0.3636950755391535, "grad_norm": 1.539716152384563, "learning_rate": 9.274536796333155e-07, "loss": 0.6088, "step": 3942 }, { "epoch": 0.36378733710068045, "grad_norm": 2.2323749504744295, "learning_rate": 9.272890173616461e-07, "loss": 0.6462, "step": 3943 }, { "epoch": 0.36387959866220737, "grad_norm": 2.7944215350707444, "learning_rate": 9.271243276960703e-07, "loss": 0.9325, "step": 3944 }, { "epoch": 0.3639718602237343, "grad_norm": 2.2827568375840417, "learning_rate": 9.269596106515123e-07, "loss": 0.7828, "step": 3945 }, { "epoch": 0.3639718602237343, "eval_GEN Loss": 0.46773645281791687, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3533172607421875, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8210036158561707, "eval_runtime": 56.8395, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3945 }, { "epoch": 0.3640641217852612, "grad_norm": 1.2240595302825128, "learning_rate": 9.267948662428991e-07, "loss": 0.5274, "step": 3946 }, { "epoch": 0.3641563833467881, "grad_norm": 3.213220609306924, "learning_rate": 9.2663009448516e-07, "loss": 0.8502, "step": 3947 }, { "epoch": 0.3642486449083151, "grad_norm": 2.392812082105232, "learning_rate": 9.264652953932269e-07, "loss": 0.63, "step": 3948 }, { "epoch": 0.364340906469842, "grad_norm": 1.5045056292338777, "learning_rate": 9.263004689820346e-07, "loss": 0.5596, "step": 3949 }, { "epoch": 0.36443316803136894, "grad_norm": 2.274918683669336, "learning_rate": 9.261356152665194e-07, "loss": 0.6024, "step": 3950 }, { "epoch": 0.36443316803136894, "eval_GEN Loss": 0.4670032262802124, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9221556886227545, "eval_PRM F1 AUC": 0.8116815086432687, "eval_PRM F1 Neg": 0.7111111111111111, "eval_PRM Loss": 0.3519865870475769, "eval_PRM NPV": 0.7272727272727273, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8191105723381042, "eval_runtime": 56.9892, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3950 }, { "epoch": 0.36452542959289586, "grad_norm": 1.9811678560162718, "learning_rate": 9.259707342616206e-07, "loss": 0.6069, "step": 3951 }, { "epoch": 0.3646176911544228, "grad_norm": 1.4454342477217352, "learning_rate": 9.258058259822801e-07, "loss": 0.5096, "step": 3952 }, { "epoch": 0.3647099527159497, "grad_norm": 2.3156618693135798, "learning_rate": 9.256408904434424e-07, "loss": 0.6777, "step": 3953 }, { "epoch": 0.36480221427747667, "grad_norm": 1.740709241229069, "learning_rate": 9.254759276600536e-07, "loss": 0.706, "step": 3954 }, { "epoch": 0.3648944758390036, "grad_norm": 2.606479521447348, "learning_rate": 9.253109376470637e-07, "loss": 0.8412, "step": 3955 }, { "epoch": 0.3648944758390036, "eval_GEN Loss": 0.468524694442749, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3395959734916687, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8205228447914124, "eval_runtime": 56.8418, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3955 }, { "epoch": 0.3649867374005305, "grad_norm": 2.7606277682607976, "learning_rate": 9.251459204194237e-07, "loss": 0.8132, "step": 3956 }, { "epoch": 0.3650789989620574, "grad_norm": 3.0246155566793966, "learning_rate": 9.24980875992088e-07, "loss": 0.5843, "step": 3957 }, { "epoch": 0.36517126052358434, "grad_norm": 2.1177339370604957, "learning_rate": 9.248158043800131e-07, "loss": 0.7132, "step": 3958 }, { "epoch": 0.3652635220851113, "grad_norm": 2.0518771132659035, "learning_rate": 9.246507055981581e-07, "loss": 0.7696, "step": 3959 }, { "epoch": 0.36535578364663823, "grad_norm": 2.0204041923069322, "learning_rate": 9.244855796614847e-07, "loss": 0.6573, "step": 3960 }, { "epoch": 0.36535578364663823, "eval_GEN Loss": 0.4692714214324951, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.34468531608581543, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8237680196762085, "eval_runtime": 56.9049, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 3960 }, { "epoch": 0.36544804520816515, "grad_norm": 2.3531646256363543, "learning_rate": 9.243204265849565e-07, "loss": 0.7047, "step": 3961 }, { "epoch": 0.36554030676969207, "grad_norm": 2.190645571443471, "learning_rate": 9.241552463835401e-07, "loss": 0.7353, "step": 3962 }, { "epoch": 0.365632568331219, "grad_norm": 1.836449679894377, "learning_rate": 9.239900390722044e-07, "loss": 0.6638, "step": 3963 }, { "epoch": 0.36572482989274596, "grad_norm": 1.8075356136350886, "learning_rate": 9.238248046659208e-07, "loss": 0.8139, "step": 3964 }, { "epoch": 0.3658170914542729, "grad_norm": 2.071607684536743, "learning_rate": 9.23659543179663e-07, "loss": 0.8313, "step": 3965 }, { "epoch": 0.3658170914542729, "eval_GEN Loss": 0.4681418836116791, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.34498780965805054, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8307992815971375, "eval_runtime": 56.9457, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 3965 }, { "epoch": 0.3659093530157998, "grad_norm": 1.6615308373019935, "learning_rate": 9.234942546284073e-07, "loss": 0.6671, "step": 3966 }, { "epoch": 0.3660016145773267, "grad_norm": 2.407311589772096, "learning_rate": 9.233289390271324e-07, "loss": 0.7313, "step": 3967 }, { "epoch": 0.36609387613885364, "grad_norm": 1.78091081399118, "learning_rate": 9.231635963908195e-07, "loss": 0.7081, "step": 3968 }, { "epoch": 0.36618613770038055, "grad_norm": 1.3524491992351055, "learning_rate": 9.229982267344521e-07, "loss": 0.4901, "step": 3969 }, { "epoch": 0.36627839926190753, "grad_norm": 2.4125619013458626, "learning_rate": 9.228328300730163e-07, "loss": 0.7864, "step": 3970 }, { "epoch": 0.36627839926190753, "eval_GEN Loss": 0.46698760986328125, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.34183862805366516, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8408052921295166, "eval_runtime": 56.717, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 3970 }, { "epoch": 0.36637066082343445, "grad_norm": 2.0102619639630483, "learning_rate": 9.226674064215009e-07, "loss": 0.6951, "step": 3971 }, { "epoch": 0.36646292238496136, "grad_norm": 2.1899655139354675, "learning_rate": 9.225019557948963e-07, "loss": 0.879, "step": 3972 }, { "epoch": 0.3665551839464883, "grad_norm": 2.9473848516990353, "learning_rate": 9.223364782081965e-07, "loss": 1.1008, "step": 3973 }, { "epoch": 0.3666474455080152, "grad_norm": 1.734542962304058, "learning_rate": 9.221709736763969e-07, "loss": 0.571, "step": 3974 }, { "epoch": 0.3667397070695422, "grad_norm": 2.087318540950687, "learning_rate": 9.220054422144958e-07, "loss": 0.7517, "step": 3975 }, { "epoch": 0.3667397070695422, "eval_GEN Loss": 0.4662870168685913, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9221556886227545, "eval_PRM F1 AUC": 0.8116815086432687, "eval_PRM F1 Neg": 0.7111111111111111, "eval_PRM Loss": 0.3461471498012543, "eval_PRM NPV": 0.7272727272727273, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8326321840286255, "eval_runtime": 56.8207, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3975 }, { "epoch": 0.3668319686310691, "grad_norm": 4.192616207272796, "learning_rate": 9.218398838374941e-07, "loss": 1.0464, "step": 3976 }, { "epoch": 0.366924230192596, "grad_norm": 1.3163866020779345, "learning_rate": 9.216742985603949e-07, "loss": 0.7344, "step": 3977 }, { "epoch": 0.36701649175412293, "grad_norm": 1.7421045252575347, "learning_rate": 9.215086863982038e-07, "loss": 0.7164, "step": 3978 }, { "epoch": 0.36710875331564985, "grad_norm": 1.9426012337940428, "learning_rate": 9.213430473659288e-07, "loss": 0.7645, "step": 3979 }, { "epoch": 0.3672010148771768, "grad_norm": 2.078511095833166, "learning_rate": 9.211773814785805e-07, "loss": 0.7956, "step": 3980 }, { "epoch": 0.3672010148771768, "eval_GEN Loss": 0.4650685787200928, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9146341463414634, "eval_PRM F1 AUC": 0.8213724463069669, "eval_PRM F1 Neg": 0.7083333333333334, "eval_PRM Loss": 0.354384183883667, "eval_PRM NPV": 0.68, "eval_PRM Precision": 0.9259259259259259, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8284855484962463, "eval_runtime": 56.7813, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 3980 }, { "epoch": 0.36729327643870374, "grad_norm": 1.4226300487337655, "learning_rate": 9.210116887511715e-07, "loss": 0.6856, "step": 3981 }, { "epoch": 0.36738553800023066, "grad_norm": 1.5802065341474425, "learning_rate": 9.208459691987173e-07, "loss": 0.7379, "step": 3982 }, { "epoch": 0.3674777995617576, "grad_norm": 2.931374876411286, "learning_rate": 9.20680222836236e-07, "loss": 0.8796, "step": 3983 }, { "epoch": 0.3675700611232845, "grad_norm": 1.664174322429993, "learning_rate": 9.205144496787473e-07, "loss": 0.5219, "step": 3984 }, { "epoch": 0.3676623226848114, "grad_norm": 2.3045945175787406, "learning_rate": 9.203486497412741e-07, "loss": 0.6681, "step": 3985 }, { "epoch": 0.3676623226848114, "eval_GEN Loss": 0.4651217758655548, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.360866516828537, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8353966474533081, "eval_runtime": 56.5806, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 3985 }, { "epoch": 0.3677545842463384, "grad_norm": 1.437534499562714, "learning_rate": 9.201828230388414e-07, "loss": 0.5612, "step": 3986 }, { "epoch": 0.3678468458078653, "grad_norm": 2.0339165764923592, "learning_rate": 9.200169695864766e-07, "loss": 0.7082, "step": 3987 }, { "epoch": 0.3679391073693922, "grad_norm": 2.4339029712856015, "learning_rate": 9.198510893992096e-07, "loss": 0.9734, "step": 3988 }, { "epoch": 0.36803136893091914, "grad_norm": 1.8425620431468062, "learning_rate": 9.196851824920728e-07, "loss": 0.7213, "step": 3989 }, { "epoch": 0.36812363049244606, "grad_norm": 2.0436216851794606, "learning_rate": 9.195192488801009e-07, "loss": 0.6996, "step": 3990 }, { "epoch": 0.36812363049244606, "eval_GEN Loss": 0.46527743339538574, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.36600261926651, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8408653736114502, "eval_runtime": 56.7965, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 3990 }, { "epoch": 0.36821589205397304, "grad_norm": 2.8902439169409244, "learning_rate": 9.193532885783311e-07, "loss": 0.9879, "step": 3991 }, { "epoch": 0.36830815361549996, "grad_norm": 1.6074402482743189, "learning_rate": 9.191873016018032e-07, "loss": 0.755, "step": 3992 }, { "epoch": 0.3684004151770269, "grad_norm": 2.707070551204786, "learning_rate": 9.190212879655585e-07, "loss": 0.8225, "step": 3993 }, { "epoch": 0.3684926767385538, "grad_norm": 2.0578697298196187, "learning_rate": 9.188552476846424e-07, "loss": 0.6969, "step": 3994 }, { "epoch": 0.3685849383000807, "grad_norm": 1.2209581399760836, "learning_rate": 9.186891807741008e-07, "loss": 0.6195, "step": 3995 }, { "epoch": 0.3685849383000807, "eval_GEN Loss": 0.4651360511779785, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.3803725242614746, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8537259697914124, "eval_runtime": 56.8539, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 3995 }, { "epoch": 0.3686771998616077, "grad_norm": 1.9462806070740368, "learning_rate": 9.185230872489836e-07, "loss": 0.6783, "step": 3996 }, { "epoch": 0.3687694614231346, "grad_norm": 1.515197633726276, "learning_rate": 9.183569671243422e-07, "loss": 0.7117, "step": 3997 }, { "epoch": 0.3688617229846615, "grad_norm": 2.8910756193567004, "learning_rate": 9.181908204152307e-07, "loss": 1.06, "step": 3998 }, { "epoch": 0.36895398454618844, "grad_norm": 1.6565018381522563, "learning_rate": 9.180246471367056e-07, "loss": 0.7391, "step": 3999 }, { "epoch": 0.36904624610771536, "grad_norm": 1.8025853766831315, "learning_rate": 9.178584473038256e-07, "loss": 0.7724, "step": 4000 }, { "epoch": 0.36904624610771536, "eval_GEN Loss": 0.46650370955467224, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3997230529785156, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8706430196762085, "eval_runtime": 56.8088, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4000 }, { "epoch": 0.3691385076692423, "grad_norm": 2.682410159310335, "learning_rate": 9.176922209316523e-07, "loss": 0.8458, "step": 4001 }, { "epoch": 0.36923076923076925, "grad_norm": 1.8513303134741645, "learning_rate": 9.175259680352491e-07, "loss": 0.8483, "step": 4002 }, { "epoch": 0.36932303079229617, "grad_norm": 2.0211716726128124, "learning_rate": 9.173596886296824e-07, "loss": 0.7502, "step": 4003 }, { "epoch": 0.3694152923538231, "grad_norm": 1.6796074854229206, "learning_rate": 9.171933827300203e-07, "loss": 0.7305, "step": 4004 }, { "epoch": 0.36950755391535, "grad_norm": 2.065852070488085, "learning_rate": 9.17027050351334e-07, "loss": 0.6767, "step": 4005 }, { "epoch": 0.36950755391535, "eval_GEN Loss": 0.4657479524612427, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.39866435527801514, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8692307472229004, "eval_runtime": 56.9144, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 4005 }, { "epoch": 0.3695998154768769, "grad_norm": 1.7698874648907141, "learning_rate": 9.168606915086968e-07, "loss": 0.7763, "step": 4006 }, { "epoch": 0.3696920770384039, "grad_norm": 3.00804928931779, "learning_rate": 9.166943062171843e-07, "loss": 0.8135, "step": 4007 }, { "epoch": 0.3697843385999308, "grad_norm": 2.1118877457957024, "learning_rate": 9.165278944918747e-07, "loss": 0.8485, "step": 4008 }, { "epoch": 0.36987660016145774, "grad_norm": 2.0106584675711883, "learning_rate": 9.163614563478484e-07, "loss": 0.9577, "step": 4009 }, { "epoch": 0.36996886172298465, "grad_norm": 1.728129128202833, "learning_rate": 9.161949918001884e-07, "loss": 0.7102, "step": 4010 }, { "epoch": 0.36996886172298465, "eval_GEN Loss": 0.4645037055015564, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.39239707589149475, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8724759817123413, "eval_runtime": 55.8278, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4010 }, { "epoch": 0.3700611232845116, "grad_norm": 2.035905752614218, "learning_rate": 9.160285008639798e-07, "loss": 0.8883, "step": 4011 }, { "epoch": 0.37015338484603855, "grad_norm": 1.3860527719352767, "learning_rate": 9.158619835543104e-07, "loss": 0.5338, "step": 4012 }, { "epoch": 0.37024564640756547, "grad_norm": 1.4082787162490455, "learning_rate": 9.156954398862701e-07, "loss": 0.6993, "step": 4013 }, { "epoch": 0.3703379079690924, "grad_norm": 2.892460946245489, "learning_rate": 9.155288698749514e-07, "loss": 0.9446, "step": 4014 }, { "epoch": 0.3704301695306193, "grad_norm": 1.8448389644174532, "learning_rate": 9.153622735354497e-07, "loss": 0.7462, "step": 4015 }, { "epoch": 0.3704301695306193, "eval_GEN Loss": 0.4658695459365845, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.39387214183807373, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8804687261581421, "eval_runtime": 55.7695, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4015 }, { "epoch": 0.3705224310921462, "grad_norm": 1.838572471588768, "learning_rate": 9.151956508828613e-07, "loss": 0.6251, "step": 4016 }, { "epoch": 0.37061469265367314, "grad_norm": 1.7592334646815513, "learning_rate": 9.150290019322864e-07, "loss": 0.7358, "step": 4017 }, { "epoch": 0.3707069542152001, "grad_norm": 1.6043460622418197, "learning_rate": 9.148623266988267e-07, "loss": 0.5459, "step": 4018 }, { "epoch": 0.37079921577672703, "grad_norm": 2.28665835970567, "learning_rate": 9.14695625197587e-07, "loss": 0.6591, "step": 4019 }, { "epoch": 0.37089147733825395, "grad_norm": 1.9493097046410903, "learning_rate": 9.145288974436733e-07, "loss": 0.8836, "step": 4020 }, { "epoch": 0.37089147733825395, "eval_GEN Loss": 0.4661194086074829, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3922044634819031, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8952524065971375, "eval_runtime": 55.7277, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4020 }, { "epoch": 0.37098373889978087, "grad_norm": 2.071579706138531, "learning_rate": 9.143621434521956e-07, "loss": 0.6997, "step": 4021 }, { "epoch": 0.3710760004613078, "grad_norm": 1.8797242045101994, "learning_rate": 9.14195363238265e-07, "loss": 0.7907, "step": 4022 }, { "epoch": 0.37116826202283476, "grad_norm": 1.4780756985737438, "learning_rate": 9.140285568169951e-07, "loss": 0.5715, "step": 4023 }, { "epoch": 0.3712605235843617, "grad_norm": 2.169615330791163, "learning_rate": 9.138617242035026e-07, "loss": 0.6418, "step": 4024 }, { "epoch": 0.3713527851458886, "grad_norm": 2.4617614692052947, "learning_rate": 9.136948654129058e-07, "loss": 0.8067, "step": 4025 }, { "epoch": 0.3713527851458886, "eval_GEN Loss": 0.4669303297996521, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3980518877506256, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9057692289352417, "eval_runtime": 55.7951, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4025 }, { "epoch": 0.3714450467074155, "grad_norm": 1.6853666388182196, "learning_rate": 9.135279804603262e-07, "loss": 0.5899, "step": 4026 }, { "epoch": 0.37153730826894243, "grad_norm": 1.6027268662219922, "learning_rate": 9.133610693608866e-07, "loss": 0.7735, "step": 4027 }, { "epoch": 0.3716295698304694, "grad_norm": 3.3010178510482437, "learning_rate": 9.131941321297131e-07, "loss": 0.8266, "step": 4028 }, { "epoch": 0.3717218313919963, "grad_norm": 1.6191175013110048, "learning_rate": 9.130271687819338e-07, "loss": 0.7277, "step": 4029 }, { "epoch": 0.37181409295352325, "grad_norm": 3.9012333777277113, "learning_rate": 9.12860179332679e-07, "loss": 0.711, "step": 4030 }, { "epoch": 0.37181409295352325, "eval_GEN Loss": 0.46693354845046997, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3991369307041168, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9065504670143127, "eval_runtime": 55.904, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4030 }, { "epoch": 0.37190635451505016, "grad_norm": 2.566631053448556, "learning_rate": 9.126931637970817e-07, "loss": 0.6825, "step": 4031 }, { "epoch": 0.3719986160765771, "grad_norm": 1.8342602799097993, "learning_rate": 9.12526122190277e-07, "loss": 0.5844, "step": 4032 }, { "epoch": 0.372090877638104, "grad_norm": 1.7245018786356503, "learning_rate": 9.123590545274028e-07, "loss": 0.6231, "step": 4033 }, { "epoch": 0.372183139199631, "grad_norm": 1.2882972868034825, "learning_rate": 9.121919608235984e-07, "loss": 0.6102, "step": 4034 }, { "epoch": 0.3722754007611579, "grad_norm": 2.4318892523648015, "learning_rate": 9.120248410940066e-07, "loss": 0.9743, "step": 4035 }, { "epoch": 0.3722754007611579, "eval_GEN Loss": 0.4661226272583008, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3899044096469879, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9005408883094788, "eval_runtime": 55.8406, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4035 }, { "epoch": 0.3723676623226848, "grad_norm": 1.4129661653841254, "learning_rate": 9.11857695353772e-07, "loss": 0.6628, "step": 4036 }, { "epoch": 0.37245992388421173, "grad_norm": 2.235675663639896, "learning_rate": 9.116905236180412e-07, "loss": 0.6884, "step": 4037 }, { "epoch": 0.37255218544573865, "grad_norm": 2.7216412016621345, "learning_rate": 9.115233259019643e-07, "loss": 1.123, "step": 4038 }, { "epoch": 0.3726444470072656, "grad_norm": 2.4642576140626895, "learning_rate": 9.113561022206924e-07, "loss": 0.828, "step": 4039 }, { "epoch": 0.37273670856879254, "grad_norm": 1.8259694350493174, "learning_rate": 9.111888525893799e-07, "loss": 0.6149, "step": 4040 }, { "epoch": 0.37273670856879254, "eval_GEN Loss": 0.46511706709861755, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.38533416390419006, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9043269157409668, "eval_runtime": 56.8252, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4040 }, { "epoch": 0.37282897013031946, "grad_norm": 2.4773444919848977, "learning_rate": 9.110215770231829e-07, "loss": 0.7007, "step": 4041 }, { "epoch": 0.3729212316918464, "grad_norm": 1.7804524882857788, "learning_rate": 9.108542755372607e-07, "loss": 0.6445, "step": 4042 }, { "epoch": 0.3730134932533733, "grad_norm": 2.072669769630183, "learning_rate": 9.10686948146774e-07, "loss": 0.8563, "step": 4043 }, { "epoch": 0.3731057548149002, "grad_norm": 2.693136566311807, "learning_rate": 9.105195948668863e-07, "loss": 0.8057, "step": 4044 }, { "epoch": 0.3731980163764272, "grad_norm": 1.891017567824246, "learning_rate": 9.103522157127635e-07, "loss": 0.6851, "step": 4045 }, { "epoch": 0.3731980163764272, "eval_GEN Loss": 0.4658222496509552, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3822549283504486, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.892848551273346, "eval_runtime": 56.6543, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4045 }, { "epoch": 0.3732902779379541, "grad_norm": 1.649263312835569, "learning_rate": 9.101848106995738e-07, "loss": 0.6073, "step": 4046 }, { "epoch": 0.373382539499481, "grad_norm": 2.1316612619140054, "learning_rate": 9.100173798424877e-07, "loss": 0.6932, "step": 4047 }, { "epoch": 0.37347480106100794, "grad_norm": 1.9378131597038677, "learning_rate": 9.098499231566779e-07, "loss": 0.6467, "step": 4048 }, { "epoch": 0.37356706262253486, "grad_norm": 2.0166981219815403, "learning_rate": 9.096824406573199e-07, "loss": 0.6986, "step": 4049 }, { "epoch": 0.37365932418406184, "grad_norm": 1.3359555592984909, "learning_rate": 9.095149323595908e-07, "loss": 0.6596, "step": 4050 }, { "epoch": 0.37365932418406184, "eval_GEN Loss": 0.46569550037384033, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.375729501247406, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.887499988079071, "eval_runtime": 56.7661, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4050 }, { "epoch": 0.37375158574558875, "grad_norm": 2.0655599871047152, "learning_rate": 9.093473982786708e-07, "loss": 0.8894, "step": 4051 }, { "epoch": 0.3738438473071157, "grad_norm": 2.774807538190179, "learning_rate": 9.091798384297419e-07, "loss": 0.9404, "step": 4052 }, { "epoch": 0.3739361088686426, "grad_norm": 2.466072038830056, "learning_rate": 9.090122528279888e-07, "loss": 0.7547, "step": 4053 }, { "epoch": 0.3740283704301695, "grad_norm": 2.0877020203222023, "learning_rate": 9.088446414885985e-07, "loss": 0.7237, "step": 4054 }, { "epoch": 0.3741206319916965, "grad_norm": 2.263149423748166, "learning_rate": 9.086770044267599e-07, "loss": 0.6551, "step": 4055 }, { "epoch": 0.3741206319916965, "eval_GEN Loss": 0.46623334288597107, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.37452223896980286, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8838942050933838, "eval_runtime": 56.7906, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4055 }, { "epoch": 0.3742128935532234, "grad_norm": 1.950672893187621, "learning_rate": 9.085093416576644e-07, "loss": 0.5224, "step": 4056 }, { "epoch": 0.3743051551147503, "grad_norm": 1.5851451956760336, "learning_rate": 9.083416531965064e-07, "loss": 0.7405, "step": 4057 }, { "epoch": 0.37439741667627724, "grad_norm": 1.6121406269473215, "learning_rate": 9.081739390584818e-07, "loss": 0.6958, "step": 4058 }, { "epoch": 0.37448967823780416, "grad_norm": 1.9542873854807654, "learning_rate": 9.08006199258789e-07, "loss": 0.7563, "step": 4059 }, { "epoch": 0.3745819397993311, "grad_norm": 1.659723881225212, "learning_rate": 9.078384338126289e-07, "loss": 0.6368, "step": 4060 }, { "epoch": 0.3745819397993311, "eval_GEN Loss": 0.46463996171951294, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3785744309425354, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8866586685180664, "eval_runtime": 55.9519, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4060 }, { "epoch": 0.37467420136085805, "grad_norm": 1.8295808467681853, "learning_rate": 9.076706427352048e-07, "loss": 0.5662, "step": 4061 }, { "epoch": 0.37476646292238497, "grad_norm": 3.345993918974571, "learning_rate": 9.075028260417221e-07, "loss": 0.8254, "step": 4062 }, { "epoch": 0.3748587244839119, "grad_norm": 1.5304809935686723, "learning_rate": 9.073349837473888e-07, "loss": 0.7073, "step": 4063 }, { "epoch": 0.3749509860454388, "grad_norm": 1.932737370444257, "learning_rate": 9.071671158674148e-07, "loss": 0.7327, "step": 4064 }, { "epoch": 0.3750432476069657, "grad_norm": 1.7632726646771022, "learning_rate": 9.069992224170125e-07, "loss": 0.6399, "step": 4065 }, { "epoch": 0.3750432476069657, "eval_GEN Loss": 0.46530988812446594, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.38563913106918335, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8853365182876587, "eval_runtime": 55.9535, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4065 }, { "epoch": 0.3751355091684927, "grad_norm": 2.008937633115089, "learning_rate": 9.068313034113968e-07, "loss": 0.6322, "step": 4066 }, { "epoch": 0.3752277707300196, "grad_norm": 1.5091400584678478, "learning_rate": 9.06663358865785e-07, "loss": 0.59, "step": 4067 }, { "epoch": 0.37532003229154653, "grad_norm": 1.9643058749280151, "learning_rate": 9.064953887953961e-07, "loss": 0.7106, "step": 4068 }, { "epoch": 0.37541229385307345, "grad_norm": 1.4066710687651958, "learning_rate": 9.06327393215452e-07, "loss": 0.4696, "step": 4069 }, { "epoch": 0.37550455541460037, "grad_norm": 2.515416684612912, "learning_rate": 9.061593721411767e-07, "loss": 0.7084, "step": 4070 }, { "epoch": 0.37550455541460037, "eval_GEN Loss": 0.4660487771034241, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36429563164711, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8866586685180664, "eval_runtime": 55.7371, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4070 }, { "epoch": 0.37559681697612735, "grad_norm": 7.281703882839622, "learning_rate": 9.059913255877966e-07, "loss": 0.8893, "step": 4071 }, { "epoch": 0.37568907853765426, "grad_norm": 1.9450188003044784, "learning_rate": 9.058232535705403e-07, "loss": 0.8208, "step": 4072 }, { "epoch": 0.3757813400991812, "grad_norm": 1.5293624406192017, "learning_rate": 9.056551561046387e-07, "loss": 0.7075, "step": 4073 }, { "epoch": 0.3758736016607081, "grad_norm": 2.7747055999034633, "learning_rate": 9.05487033205325e-07, "loss": 0.6516, "step": 4074 }, { "epoch": 0.375965863222235, "grad_norm": 1.841774860399856, "learning_rate": 9.05318884887835e-07, "loss": 0.6616, "step": 4075 }, { "epoch": 0.375965863222235, "eval_GEN Loss": 0.46514856815338135, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3565382659435272, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8983774185180664, "eval_runtime": 56.7211, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4075 }, { "epoch": 0.37605812478376194, "grad_norm": 2.144210112325349, "learning_rate": 9.051507111674063e-07, "loss": 0.8158, "step": 4076 }, { "epoch": 0.3761503863452889, "grad_norm": 2.20490626849351, "learning_rate": 9.049825120592792e-07, "loss": 0.8346, "step": 4077 }, { "epoch": 0.37624264790681583, "grad_norm": 1.397526771085783, "learning_rate": 9.048142875786962e-07, "loss": 0.6113, "step": 4078 }, { "epoch": 0.37633490946834275, "grad_norm": 1.6255512559752765, "learning_rate": 9.046460377409021e-07, "loss": 0.5746, "step": 4079 }, { "epoch": 0.37642717102986967, "grad_norm": 2.1719524743768552, "learning_rate": 9.04477762561144e-07, "loss": 0.7364, "step": 4080 }, { "epoch": 0.37642717102986967, "eval_GEN Loss": 0.4640125334262848, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3585696220397949, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8894230723381042, "eval_runtime": 55.8127, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4080 }, { "epoch": 0.3765194325913966, "grad_norm": 1.7551920488598083, "learning_rate": 9.04309462054671e-07, "loss": 0.6205, "step": 4081 }, { "epoch": 0.37661169415292356, "grad_norm": 1.841775913433435, "learning_rate": 9.041411362367347e-07, "loss": 0.6243, "step": 4082 }, { "epoch": 0.3767039557144505, "grad_norm": 2.609938241896056, "learning_rate": 9.039727851225896e-07, "loss": 1.1076, "step": 4083 }, { "epoch": 0.3767962172759774, "grad_norm": 2.012470815006629, "learning_rate": 9.038044087274913e-07, "loss": 0.5505, "step": 4084 }, { "epoch": 0.3768884788375043, "grad_norm": 3.057574371135215, "learning_rate": 9.036360070666988e-07, "loss": 0.8766, "step": 4085 }, { "epoch": 0.3768884788375043, "eval_GEN Loss": 0.4655226469039917, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3777284324169159, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8847355842590332, "eval_runtime": 55.8848, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4085 }, { "epoch": 0.37698074039903123, "grad_norm": 1.2289862852034075, "learning_rate": 9.034675801554728e-07, "loss": 0.5911, "step": 4086 }, { "epoch": 0.3770730019605582, "grad_norm": 2.1253223280119684, "learning_rate": 9.032991280090763e-07, "loss": 0.9118, "step": 4087 }, { "epoch": 0.3771652635220851, "grad_norm": 1.580319589302749, "learning_rate": 9.031306506427748e-07, "loss": 0.7123, "step": 4088 }, { "epoch": 0.37725752508361204, "grad_norm": 2.0879649675225225, "learning_rate": 9.029621480718359e-07, "loss": 0.7451, "step": 4089 }, { "epoch": 0.37734978664513896, "grad_norm": 1.8203296833292217, "learning_rate": 9.027936203115298e-07, "loss": 0.6666, "step": 4090 }, { "epoch": 0.37734978664513896, "eval_GEN Loss": 0.4692361354827881, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8535031847133758, "eval_PRM F1 AUC": 0.751440544787847, "eval_PRM F1 Neg": 0.5818181818181818, "eval_PRM Loss": 0.4262109398841858, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9054054054054054, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9024038314819336, "eval_runtime": 55.7702, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4090 }, { "epoch": 0.3774420482066659, "grad_norm": 1.7255796283932037, "learning_rate": 9.026250673771285e-07, "loss": 0.6584, "step": 4091 }, { "epoch": 0.3775343097681928, "grad_norm": 1.8623634582837343, "learning_rate": 9.024564892839065e-07, "loss": 0.8439, "step": 4092 }, { "epoch": 0.3776265713297198, "grad_norm": 1.4866862015032798, "learning_rate": 9.022878860471408e-07, "loss": 0.5778, "step": 4093 }, { "epoch": 0.3777188328912467, "grad_norm": 1.9813739983608938, "learning_rate": 9.021192576821103e-07, "loss": 0.6114, "step": 4094 }, { "epoch": 0.3778110944527736, "grad_norm": 3.0584135468221385, "learning_rate": 9.019506042040965e-07, "loss": 0.6117, "step": 4095 }, { "epoch": 0.3778110944527736, "eval_GEN Loss": 0.4708370268344879, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8366013071895425, "eval_PRM F1 AUC": 0.7551073860660031, "eval_PRM F1 Neg": 0.576271186440678, "eval_PRM Loss": 0.4815226197242737, "eval_PRM NPV": 0.4722222222222222, "eval_PRM Precision": 0.9142857142857143, "eval_PRM Recall": 0.7710843373493976, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9449519515037537, "eval_runtime": 55.6971, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4095 }, { "epoch": 0.37790335601430053, "grad_norm": 2.525534773816227, "learning_rate": 9.017819256283831e-07, "loss": 0.7888, "step": 4096 }, { "epoch": 0.37799561757582745, "grad_norm": 1.6094735277602292, "learning_rate": 9.01613221970256e-07, "loss": 0.6046, "step": 4097 }, { "epoch": 0.3780878791373544, "grad_norm": 1.9296375765041347, "learning_rate": 9.014444932450031e-07, "loss": 0.7918, "step": 4098 }, { "epoch": 0.37818014069888134, "grad_norm": 1.7958187386170053, "learning_rate": 9.012757394679153e-07, "loss": 0.6623, "step": 4099 }, { "epoch": 0.37827240226040826, "grad_norm": 1.8015992592485275, "learning_rate": 9.011069606542851e-07, "loss": 0.697, "step": 4100 }, { "epoch": 0.37827240226040826, "eval_GEN Loss": 0.47058019042015076, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8441558441558441, "eval_PRM F1 AUC": 0.7611314824515453, "eval_PRM F1 Neg": 0.5862068965517241, "eval_PRM Loss": 0.46750107407569885, "eval_PRM NPV": 0.4857142857142857, "eval_PRM Precision": 0.9154929577464789, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9304086565971375, "eval_runtime": 55.7299, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4100 }, { "epoch": 0.3783646638219352, "grad_norm": 1.7976359852623367, "learning_rate": 9.009381568194076e-07, "loss": 0.688, "step": 4101 }, { "epoch": 0.3784569253834621, "grad_norm": 2.14261377974147, "learning_rate": 9.007693279785798e-07, "loss": 0.6121, "step": 4102 }, { "epoch": 0.37854918694498907, "grad_norm": 2.1940832758947146, "learning_rate": 9.006004741471015e-07, "loss": 0.8052, "step": 4103 }, { "epoch": 0.378641448506516, "grad_norm": 2.102796633400336, "learning_rate": 9.004315953402746e-07, "loss": 0.8437, "step": 4104 }, { "epoch": 0.3787337100680429, "grad_norm": 1.6218420515095666, "learning_rate": 9.002626915734026e-07, "loss": 0.518, "step": 4105 }, { "epoch": 0.3787337100680429, "eval_GEN Loss": 0.47079312801361084, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8589743589743589, "eval_PRM F1 AUC": 0.7731796752226295, "eval_PRM F1 Neg": 0.6071428571428571, "eval_PRM Loss": 0.4295346140861511, "eval_PRM NPV": 0.5151515151515151, "eval_PRM Precision": 0.9178082191780822, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9019832015037537, "eval_runtime": 56.0146, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 4105 }, { "epoch": 0.3788259716295698, "grad_norm": 2.400523109204971, "learning_rate": 9.000937628617926e-07, "loss": 0.8537, "step": 4106 }, { "epoch": 0.37891823319109674, "grad_norm": 1.8319235433145722, "learning_rate": 8.999248092207526e-07, "loss": 0.7021, "step": 4107 }, { "epoch": 0.37901049475262366, "grad_norm": 1.986099336811533, "learning_rate": 8.997558306655937e-07, "loss": 0.7189, "step": 4108 }, { "epoch": 0.37910275631415064, "grad_norm": 2.403008577479829, "learning_rate": 8.99586827211629e-07, "loss": 0.9662, "step": 4109 }, { "epoch": 0.37919501787567755, "grad_norm": 1.9345838871761694, "learning_rate": 8.994177988741737e-07, "loss": 0.6802, "step": 4110 }, { "epoch": 0.37919501787567755, "eval_GEN Loss": 0.4700886607170105, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.3806597888469696, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8706730604171753, "eval_runtime": 55.8094, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4110 }, { "epoch": 0.37928727943720447, "grad_norm": 2.9720549147061597, "learning_rate": 8.992487456685458e-07, "loss": 0.9286, "step": 4111 }, { "epoch": 0.3793795409987314, "grad_norm": 1.5057151845691115, "learning_rate": 8.990796676100645e-07, "loss": 0.4774, "step": 4112 }, { "epoch": 0.3794718025602583, "grad_norm": 2.4999280095476464, "learning_rate": 8.989105647140526e-07, "loss": 0.8233, "step": 4113 }, { "epoch": 0.3795640641217853, "grad_norm": 2.237538056428383, "learning_rate": 8.98741436995834e-07, "loss": 0.7955, "step": 4114 }, { "epoch": 0.3796563256833122, "grad_norm": 2.5053640123480925, "learning_rate": 8.985722844707356e-07, "loss": 0.6693, "step": 4115 }, { "epoch": 0.3796563256833122, "eval_GEN Loss": 0.46913740038871765, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.3650398552417755, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8587139248847961, "eval_runtime": 55.7723, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4115 }, { "epoch": 0.3797485872448391, "grad_norm": 1.9776617660935796, "learning_rate": 8.984031071540864e-07, "loss": 0.7515, "step": 4116 }, { "epoch": 0.37984084880636604, "grad_norm": 2.2762681584190285, "learning_rate": 8.982339050612171e-07, "loss": 0.6703, "step": 4117 }, { "epoch": 0.37993311036789296, "grad_norm": 2.202246794691524, "learning_rate": 8.98064678207461e-07, "loss": 0.8285, "step": 4118 }, { "epoch": 0.38002537192941993, "grad_norm": 2.3502799803474153, "learning_rate": 8.978954266081541e-07, "loss": 0.6768, "step": 4119 }, { "epoch": 0.38011763349094685, "grad_norm": 3.0643027733717756, "learning_rate": 8.977261502786342e-07, "loss": 0.7997, "step": 4120 }, { "epoch": 0.38011763349094685, "eval_GEN Loss": 0.47055891156196594, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.379611611366272, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8648437261581421, "eval_runtime": 55.7657, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4120 }, { "epoch": 0.38020989505247377, "grad_norm": 2.1003669521683968, "learning_rate": 8.975568492342412e-07, "loss": 0.7221, "step": 4121 }, { "epoch": 0.3803021566140007, "grad_norm": 1.5552526360183851, "learning_rate": 8.973875234903177e-07, "loss": 0.6073, "step": 4122 }, { "epoch": 0.3803944181755276, "grad_norm": 1.7268954960628977, "learning_rate": 8.972181730622079e-07, "loss": 0.6531, "step": 4123 }, { "epoch": 0.3804866797370545, "grad_norm": 1.693727855069528, "learning_rate": 8.970487979652588e-07, "loss": 0.5369, "step": 4124 }, { "epoch": 0.3805789412985815, "grad_norm": 1.507390905963885, "learning_rate": 8.968793982148194e-07, "loss": 0.5774, "step": 4125 }, { "epoch": 0.3805789412985815, "eval_GEN Loss": 0.4713898301124573, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.3831806182861328, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8662259578704834, "eval_runtime": 55.8614, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4125 }, { "epoch": 0.3806712028601084, "grad_norm": 2.209484094137634, "learning_rate": 8.96709973826241e-07, "loss": 0.6745, "step": 4126 }, { "epoch": 0.38076346442163533, "grad_norm": 2.186873075109473, "learning_rate": 8.965405248148772e-07, "loss": 0.4689, "step": 4127 }, { "epoch": 0.38085572598316225, "grad_norm": 2.6099540206379634, "learning_rate": 8.963710511960835e-07, "loss": 0.7421, "step": 4128 }, { "epoch": 0.38094798754468917, "grad_norm": 1.9645379617710306, "learning_rate": 8.96201552985218e-07, "loss": 0.8676, "step": 4129 }, { "epoch": 0.38104024910621614, "grad_norm": 1.6447165659097023, "learning_rate": 8.96032030197641e-07, "loss": 0.5708, "step": 4130 }, { "epoch": 0.38104024910621614, "eval_GEN Loss": 0.4711868166923523, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9212121212121213, "eval_PRM F1 AUC": 0.8273965426925091, "eval_PRM F1 Neg": 0.723404255319149, "eval_PRM Loss": 0.3539343774318695, "eval_PRM NPV": 0.7083333333333334, "eval_PRM Precision": 0.926829268292683, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8549879789352417, "eval_runtime": 55.9042, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4130 }, { "epoch": 0.38113251066774306, "grad_norm": 1.520369438128281, "learning_rate": 8.958624828487148e-07, "loss": 0.7368, "step": 4131 }, { "epoch": 0.38122477222927, "grad_norm": 2.2056337831280066, "learning_rate": 8.956929109538038e-07, "loss": 0.8261, "step": 4132 }, { "epoch": 0.3813170337907969, "grad_norm": 1.4795051528939969, "learning_rate": 8.955233145282754e-07, "loss": 0.7209, "step": 4133 }, { "epoch": 0.3814092953523238, "grad_norm": 1.367917648382338, "learning_rate": 8.953536935874983e-07, "loss": 0.7128, "step": 4134 }, { "epoch": 0.3815015569138508, "grad_norm": 1.8337092081931965, "learning_rate": 8.95184048146844e-07, "loss": 0.8696, "step": 4135 }, { "epoch": 0.3815015569138508, "eval_GEN Loss": 0.47096556425094604, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3369731903076172, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.854687511920929, "eval_runtime": 55.9978, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4135 }, { "epoch": 0.3815938184753777, "grad_norm": 1.6270411670323788, "learning_rate": 8.950143782216861e-07, "loss": 0.6367, "step": 4136 }, { "epoch": 0.38168608003690463, "grad_norm": 2.613811982352718, "learning_rate": 8.948446838274e-07, "loss": 0.8066, "step": 4137 }, { "epoch": 0.38177834159843155, "grad_norm": 2.4712859869770427, "learning_rate": 8.94674964979364e-07, "loss": 0.725, "step": 4138 }, { "epoch": 0.38187060315995847, "grad_norm": 1.2268644952870233, "learning_rate": 8.945052216929584e-07, "loss": 0.5812, "step": 4139 }, { "epoch": 0.3819628647214854, "grad_norm": 2.153654454794922, "learning_rate": 8.943354539835653e-07, "loss": 0.8481, "step": 4140 }, { "epoch": 0.3819628647214854, "eval_GEN Loss": 0.4700216054916382, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3401414155960083, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8580529093742371, "eval_runtime": 56.0493, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 4140 }, { "epoch": 0.38205512628301236, "grad_norm": 2.980288290905818, "learning_rate": 8.941656618665692e-07, "loss": 0.7908, "step": 4141 }, { "epoch": 0.3821473878445393, "grad_norm": 2.176296309902741, "learning_rate": 8.939958453573573e-07, "loss": 0.7233, "step": 4142 }, { "epoch": 0.3822396494060662, "grad_norm": 1.7614135698499784, "learning_rate": 8.938260044713185e-07, "loss": 0.7508, "step": 4143 }, { "epoch": 0.3823319109675931, "grad_norm": 1.6930084883845857, "learning_rate": 8.93656139223844e-07, "loss": 0.7988, "step": 4144 }, { "epoch": 0.38242417252912003, "grad_norm": 1.6486405498598211, "learning_rate": 8.934862496303273e-07, "loss": 0.851, "step": 4145 }, { "epoch": 0.38242417252912003, "eval_GEN Loss": 0.4703010022640228, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9212121212121213, "eval_PRM F1 AUC": 0.8273965426925091, "eval_PRM F1 Neg": 0.723404255319149, "eval_PRM Loss": 0.35920852422714233, "eval_PRM NPV": 0.7083333333333334, "eval_PRM Precision": 0.926829268292683, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8649038672447205, "eval_runtime": 55.7304, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4145 }, { "epoch": 0.382516434090647, "grad_norm": 1.9797619992575017, "learning_rate": 8.933163357061641e-07, "loss": 0.7228, "step": 4146 }, { "epoch": 0.3826086956521739, "grad_norm": 2.793289457320529, "learning_rate": 8.931463974667524e-07, "loss": 0.7135, "step": 4147 }, { "epoch": 0.38270095721370084, "grad_norm": 2.006307614165737, "learning_rate": 8.929764349274917e-07, "loss": 0.6977, "step": 4148 }, { "epoch": 0.38279321877522776, "grad_norm": 1.911785679074507, "learning_rate": 8.928064481037849e-07, "loss": 0.6887, "step": 4149 }, { "epoch": 0.3828854803367547, "grad_norm": 1.516171077232002, "learning_rate": 8.926364370110361e-07, "loss": 0.6743, "step": 4150 }, { "epoch": 0.3828854803367547, "eval_GEN Loss": 0.4698607325553894, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.3694307208061218, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8732572197914124, "eval_runtime": 56.5443, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 4150 }, { "epoch": 0.38297774189828165, "grad_norm": 1.5397195893431548, "learning_rate": 8.924664016646523e-07, "loss": 0.7933, "step": 4151 }, { "epoch": 0.3830700034598086, "grad_norm": 2.1903763474763815, "learning_rate": 8.922963420800421e-07, "loss": 0.8532, "step": 4152 }, { "epoch": 0.3831622650213355, "grad_norm": 2.8023344938705628, "learning_rate": 8.921262582726166e-07, "loss": 0.8403, "step": 4153 }, { "epoch": 0.3832545265828624, "grad_norm": 2.078904830604637, "learning_rate": 8.919561502577892e-07, "loss": 0.7517, "step": 4154 }, { "epoch": 0.3833467881443893, "grad_norm": 2.189586301332461, "learning_rate": 8.917860180509752e-07, "loss": 0.8015, "step": 4155 }, { "epoch": 0.3833467881443893, "eval_GEN Loss": 0.46900999546051025, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.38497164845466614, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8823317289352417, "eval_runtime": 55.8541, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4155 }, { "epoch": 0.38343904970591625, "grad_norm": 2.0327216013773035, "learning_rate": 8.916158616675924e-07, "loss": 0.7306, "step": 4156 }, { "epoch": 0.3835313112674432, "grad_norm": 2.107789450922101, "learning_rate": 8.914456811230604e-07, "loss": 0.6397, "step": 4157 }, { "epoch": 0.38362357282897014, "grad_norm": 2.73424299657904, "learning_rate": 8.912754764328014e-07, "loss": 0.8332, "step": 4158 }, { "epoch": 0.38371583439049706, "grad_norm": 2.7737737665339637, "learning_rate": 8.911052476122398e-07, "loss": 0.8803, "step": 4159 }, { "epoch": 0.383808095952024, "grad_norm": 1.9201754705277472, "learning_rate": 8.909349946768015e-07, "loss": 0.7676, "step": 4160 }, { "epoch": 0.383808095952024, "eval_GEN Loss": 0.4681911766529083, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3734659254550934, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8832331895828247, "eval_runtime": 55.866, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4160 }, { "epoch": 0.3839003575135509, "grad_norm": 2.369577124317477, "learning_rate": 8.907647176419157e-07, "loss": 0.814, "step": 4161 }, { "epoch": 0.38399261907507787, "grad_norm": 2.2861983181404213, "learning_rate": 8.905944165230127e-07, "loss": 0.7954, "step": 4162 }, { "epoch": 0.3840848806366048, "grad_norm": 2.3950837743453772, "learning_rate": 8.904240913355259e-07, "loss": 0.7816, "step": 4163 }, { "epoch": 0.3841771421981317, "grad_norm": 2.5310327958778487, "learning_rate": 8.902537420948898e-07, "loss": 0.8308, "step": 4164 }, { "epoch": 0.3842694037596586, "grad_norm": 2.6523252994872504, "learning_rate": 8.900833688165423e-07, "loss": 0.971, "step": 4165 }, { "epoch": 0.3842694037596586, "eval_GEN Loss": 0.4663677215576172, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36391881108283997, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8916466236114502, "eval_runtime": 55.8576, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4165 }, { "epoch": 0.38436166532118554, "grad_norm": 1.724650213178172, "learning_rate": 8.899129715159225e-07, "loss": 0.7285, "step": 4166 }, { "epoch": 0.3844539268827125, "grad_norm": 1.6841176991837141, "learning_rate": 8.897425502084722e-07, "loss": 0.7494, "step": 4167 }, { "epoch": 0.38454618844423943, "grad_norm": 1.9759139217235067, "learning_rate": 8.895721049096354e-07, "loss": 0.7731, "step": 4168 }, { "epoch": 0.38463845000576635, "grad_norm": 1.7685707146533716, "learning_rate": 8.89401635634858e-07, "loss": 0.6805, "step": 4169 }, { "epoch": 0.38473071156729327, "grad_norm": 1.545108224647599, "learning_rate": 8.892311423995882e-07, "loss": 0.7398, "step": 4170 }, { "epoch": 0.38473071156729327, "eval_GEN Loss": 0.4657104015350342, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36361831426620483, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8933293223381042, "eval_runtime": 55.8136, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4170 }, { "epoch": 0.3848229731288202, "grad_norm": 1.5057504669971054, "learning_rate": 8.890606252192764e-07, "loss": 0.5024, "step": 4171 }, { "epoch": 0.3849152346903471, "grad_norm": 2.081063713196889, "learning_rate": 8.88890084109375e-07, "loss": 0.7642, "step": 4172 }, { "epoch": 0.3850074962518741, "grad_norm": 2.046901548970188, "learning_rate": 8.88719519085339e-07, "loss": 0.6805, "step": 4173 }, { "epoch": 0.385099757813401, "grad_norm": 1.7701919851806927, "learning_rate": 8.88548930162625e-07, "loss": 0.7638, "step": 4174 }, { "epoch": 0.3851920193749279, "grad_norm": 2.263116391467018, "learning_rate": 8.883783173566922e-07, "loss": 0.7666, "step": 4175 }, { "epoch": 0.3851920193749279, "eval_GEN Loss": 0.46534600853919983, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3683016896247864, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8954927921295166, "eval_runtime": 55.9185, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4175 }, { "epoch": 0.38528428093645484, "grad_norm": 2.207970619843975, "learning_rate": 8.882076806830015e-07, "loss": 0.5522, "step": 4176 }, { "epoch": 0.38537654249798176, "grad_norm": 2.4600937725481153, "learning_rate": 8.880370201570167e-07, "loss": 0.7578, "step": 4177 }, { "epoch": 0.38546880405950873, "grad_norm": 1.815296054932152, "learning_rate": 8.87866335794203e-07, "loss": 0.7262, "step": 4178 }, { "epoch": 0.38556106562103565, "grad_norm": 1.9574633905051928, "learning_rate": 8.876956276100282e-07, "loss": 0.6068, "step": 4179 }, { "epoch": 0.38565332718256257, "grad_norm": 2.4599120766660088, "learning_rate": 8.87524895619962e-07, "loss": 0.7273, "step": 4180 }, { "epoch": 0.38565332718256257, "eval_GEN Loss": 0.46767744421958923, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3833829462528229, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9011418223381042, "eval_runtime": 56.0967, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 4180 }, { "epoch": 0.3857455887440895, "grad_norm": 1.7663893952240763, "learning_rate": 8.873541398394768e-07, "loss": 0.7064, "step": 4181 }, { "epoch": 0.3858378503056164, "grad_norm": 1.7272816864428557, "learning_rate": 8.871833602840463e-07, "loss": 0.6884, "step": 4182 }, { "epoch": 0.3859301118671434, "grad_norm": 1.7081083896742395, "learning_rate": 8.870125569691471e-07, "loss": 0.6074, "step": 4183 }, { "epoch": 0.3860223734286703, "grad_norm": 1.9922988697969741, "learning_rate": 8.868417299102575e-07, "loss": 0.722, "step": 4184 }, { "epoch": 0.3861146349901972, "grad_norm": 2.414018439640081, "learning_rate": 8.866708791228583e-07, "loss": 0.8671, "step": 4185 }, { "epoch": 0.3861146349901972, "eval_GEN Loss": 0.4676385223865509, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3864862620830536, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9075120091438293, "eval_runtime": 56.0006, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4185 }, { "epoch": 0.38620689655172413, "grad_norm": 2.2164509051288137, "learning_rate": 8.86500004622432e-07, "loss": 0.5784, "step": 4186 }, { "epoch": 0.38629915811325105, "grad_norm": 1.7056810662656736, "learning_rate": 8.863291064244639e-07, "loss": 0.5829, "step": 4187 }, { "epoch": 0.38639141967477797, "grad_norm": 2.400412623022726, "learning_rate": 8.861581845444407e-07, "loss": 0.8468, "step": 4188 }, { "epoch": 0.38648368123630494, "grad_norm": 1.9693845638268446, "learning_rate": 8.859872389978518e-07, "loss": 0.7192, "step": 4189 }, { "epoch": 0.38657594279783186, "grad_norm": 1.9040475462580282, "learning_rate": 8.858162698001885e-07, "loss": 0.728, "step": 4190 }, { "epoch": 0.38657594279783186, "eval_GEN Loss": 0.4676743149757385, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38475629687309265, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9117187261581421, "eval_runtime": 55.7488, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4190 }, { "epoch": 0.3866682043593588, "grad_norm": 1.9798730968837608, "learning_rate": 8.856452769669441e-07, "loss": 0.8242, "step": 4191 }, { "epoch": 0.3867604659208857, "grad_norm": 1.77718143310619, "learning_rate": 8.854742605136147e-07, "loss": 0.878, "step": 4192 }, { "epoch": 0.3868527274824126, "grad_norm": 2.41595112775984, "learning_rate": 8.853032204556977e-07, "loss": 0.5646, "step": 4193 }, { "epoch": 0.3869449890439396, "grad_norm": 2.116837203567898, "learning_rate": 8.85132156808693e-07, "loss": 0.7877, "step": 4194 }, { "epoch": 0.3870372506054665, "grad_norm": 1.9309305362091516, "learning_rate": 8.84961069588103e-07, "loss": 0.7074, "step": 4195 }, { "epoch": 0.3870372506054665, "eval_GEN Loss": 0.4683523178100586, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.381059855222702, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9173678159713745, "eval_runtime": 55.7508, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4195 }, { "epoch": 0.38712951216699343, "grad_norm": 1.9911867343954848, "learning_rate": 8.847899588094316e-07, "loss": 0.6731, "step": 4196 }, { "epoch": 0.38722177372852035, "grad_norm": 2.8252080754802202, "learning_rate": 8.846188244881854e-07, "loss": 1.019, "step": 4197 }, { "epoch": 0.38731403529004726, "grad_norm": 1.9017921564465072, "learning_rate": 8.844476666398726e-07, "loss": 0.6573, "step": 4198 }, { "epoch": 0.38740629685157424, "grad_norm": 1.648562886711212, "learning_rate": 8.842764852800037e-07, "loss": 0.7175, "step": 4199 }, { "epoch": 0.38749855841310116, "grad_norm": 1.899182383830107, "learning_rate": 8.841052804240918e-07, "loss": 0.6292, "step": 4200 }, { "epoch": 0.38749855841310116, "eval_GEN Loss": 0.4674999713897705, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.38112860918045044, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9100961685180664, "eval_runtime": 55.9871, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4200 }, { "epoch": 0.3875908199746281, "grad_norm": 3.086778704607036, "learning_rate": 8.839340520876513e-07, "loss": 0.9341, "step": 4201 }, { "epoch": 0.387683081536155, "grad_norm": 1.420937228764487, "learning_rate": 8.837628002861998e-07, "loss": 0.6994, "step": 4202 }, { "epoch": 0.3877753430976819, "grad_norm": 1.621592627710753, "learning_rate": 8.835915250352557e-07, "loss": 0.6528, "step": 4203 }, { "epoch": 0.38786760465920883, "grad_norm": 1.815620082216712, "learning_rate": 8.834202263503409e-07, "loss": 0.7354, "step": 4204 }, { "epoch": 0.3879598662207358, "grad_norm": 2.5642367575220777, "learning_rate": 8.83248904246978e-07, "loss": 0.6432, "step": 4205 }, { "epoch": 0.3879598662207358, "eval_GEN Loss": 0.46722376346588135, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3848364055156708, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9116586446762085, "eval_runtime": 55.8921, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4205 }, { "epoch": 0.3880521277822627, "grad_norm": 2.057249050716057, "learning_rate": 8.830775587406932e-07, "loss": 0.7836, "step": 4206 }, { "epoch": 0.38814438934378964, "grad_norm": 3.066725636991236, "learning_rate": 8.829061898470137e-07, "loss": 0.9165, "step": 4207 }, { "epoch": 0.38823665090531656, "grad_norm": 2.269660349015463, "learning_rate": 8.827347975814693e-07, "loss": 0.8813, "step": 4208 }, { "epoch": 0.3883289124668435, "grad_norm": 1.8156204829884148, "learning_rate": 8.82563381959592e-07, "loss": 0.5474, "step": 4209 }, { "epoch": 0.38842117402837045, "grad_norm": 1.4701347270248641, "learning_rate": 8.823919429969156e-07, "loss": 0.7296, "step": 4210 }, { "epoch": 0.38842117402837045, "eval_GEN Loss": 0.46739426255226135, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4045126438140869, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.920192301273346, "eval_runtime": 55.82, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4210 }, { "epoch": 0.38851343558989737, "grad_norm": 2.4347157445639453, "learning_rate": 8.822204807089763e-07, "loss": 0.5665, "step": 4211 }, { "epoch": 0.3886056971514243, "grad_norm": 1.6792201907571038, "learning_rate": 8.820489951113117e-07, "loss": 0.8638, "step": 4212 }, { "epoch": 0.3886979587129512, "grad_norm": 2.130828845031335, "learning_rate": 8.81877486219463e-07, "loss": 0.6532, "step": 4213 }, { "epoch": 0.3887902202744781, "grad_norm": 1.8535774897395798, "learning_rate": 8.81705954048972e-07, "loss": 0.7654, "step": 4214 }, { "epoch": 0.3888824818360051, "grad_norm": 1.5685077404719894, "learning_rate": 8.815343986153833e-07, "loss": 0.6149, "step": 4215 }, { "epoch": 0.3888824818360051, "eval_GEN Loss": 0.46671146154403687, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.39625248312950134, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9140625, "eval_runtime": 55.6395, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 4215 }, { "epoch": 0.388974743397532, "grad_norm": 1.6526513609658287, "learning_rate": 8.813628199342438e-07, "loss": 0.6009, "step": 4216 }, { "epoch": 0.38906700495905894, "grad_norm": 1.757727787369412, "learning_rate": 8.81191218021102e-07, "loss": 0.6424, "step": 4217 }, { "epoch": 0.38915926652058586, "grad_norm": 2.169229011572423, "learning_rate": 8.810195928915087e-07, "loss": 0.6784, "step": 4218 }, { "epoch": 0.3892515280821128, "grad_norm": 1.6219806215029597, "learning_rate": 8.808479445610169e-07, "loss": 0.5808, "step": 4219 }, { "epoch": 0.3893437896436397, "grad_norm": 1.4709005221147395, "learning_rate": 8.806762730451818e-07, "loss": 0.7293, "step": 4220 }, { "epoch": 0.3893437896436397, "eval_GEN Loss": 0.46757838129997253, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.382976233959198, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9084134697914124, "eval_runtime": 55.7814, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4220 }, { "epoch": 0.38943605120516667, "grad_norm": 1.604322000558313, "learning_rate": 8.805045783595604e-07, "loss": 0.6584, "step": 4221 }, { "epoch": 0.3895283127666936, "grad_norm": 2.038467337841438, "learning_rate": 8.803328605197117e-07, "loss": 0.7671, "step": 4222 }, { "epoch": 0.3896205743282205, "grad_norm": 1.878972099042478, "learning_rate": 8.801611195411975e-07, "loss": 0.7579, "step": 4223 }, { "epoch": 0.3897128358897474, "grad_norm": 1.5431423004238445, "learning_rate": 8.799893554395808e-07, "loss": 0.7222, "step": 4224 }, { "epoch": 0.38980509745127434, "grad_norm": 2.2025219864565972, "learning_rate": 8.798175682304275e-07, "loss": 0.8172, "step": 4225 }, { "epoch": 0.38980509745127434, "eval_GEN Loss": 0.4683484733104706, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3735651969909668, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9147836565971375, "eval_runtime": 56.9154, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 4225 }, { "epoch": 0.3898973590128013, "grad_norm": 2.045514727852902, "learning_rate": 8.796457579293049e-07, "loss": 0.7462, "step": 4226 }, { "epoch": 0.38998962057432823, "grad_norm": 1.6115629716649735, "learning_rate": 8.794739245517833e-07, "loss": 0.8266, "step": 4227 }, { "epoch": 0.39008188213585515, "grad_norm": 1.7415746057289088, "learning_rate": 8.793020681134337e-07, "loss": 0.7017, "step": 4228 }, { "epoch": 0.39017414369738207, "grad_norm": 2.6234889182620753, "learning_rate": 8.791301886298306e-07, "loss": 0.6513, "step": 4229 }, { "epoch": 0.390266405258909, "grad_norm": 1.6981577867104116, "learning_rate": 8.789582861165498e-07, "loss": 0.594, "step": 4230 }, { "epoch": 0.390266405258909, "eval_GEN Loss": 0.46845388412475586, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3746455907821655, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9098557829856873, "eval_runtime": 56.7228, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4230 }, { "epoch": 0.39035866682043596, "grad_norm": 2.773731049775948, "learning_rate": 8.787863605891693e-07, "loss": 1.1777, "step": 4231 }, { "epoch": 0.3904509283819629, "grad_norm": 1.696418373981368, "learning_rate": 8.786144120632695e-07, "loss": 0.6604, "step": 4232 }, { "epoch": 0.3905431899434898, "grad_norm": 2.1182461696003143, "learning_rate": 8.784424405544323e-07, "loss": 0.8694, "step": 4233 }, { "epoch": 0.3906354515050167, "grad_norm": 1.4293058448827018, "learning_rate": 8.782704460782423e-07, "loss": 0.5743, "step": 4234 }, { "epoch": 0.39072771306654364, "grad_norm": 1.8843160214318244, "learning_rate": 8.780984286502859e-07, "loss": 0.661, "step": 4235 }, { "epoch": 0.39072771306654364, "eval_GEN Loss": 0.4686843454837799, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3805236518383026, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9052884578704834, "eval_runtime": 56.7354, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4235 }, { "epoch": 0.39081997462807055, "grad_norm": 2.3980605896043388, "learning_rate": 8.779263882861513e-07, "loss": 0.6525, "step": 4236 }, { "epoch": 0.39091223618959753, "grad_norm": 1.3055808070959023, "learning_rate": 8.777543250014295e-07, "loss": 0.6436, "step": 4237 }, { "epoch": 0.39100449775112445, "grad_norm": 2.0331653865520964, "learning_rate": 8.775822388117128e-07, "loss": 0.6717, "step": 4238 }, { "epoch": 0.39109675931265137, "grad_norm": 1.9885650635117162, "learning_rate": 8.77410129732596e-07, "loss": 0.8394, "step": 4239 }, { "epoch": 0.3911890208741783, "grad_norm": 1.6864053757155355, "learning_rate": 8.77237997779676e-07, "loss": 0.6439, "step": 4240 }, { "epoch": 0.3911890208741783, "eval_GEN Loss": 0.46901586651802063, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3903825581073761, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.900120198726654, "eval_runtime": 56.4945, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 4240 }, { "epoch": 0.3912812824357052, "grad_norm": 1.6301848760171647, "learning_rate": 8.770658429685516e-07, "loss": 0.5913, "step": 4241 }, { "epoch": 0.3913735439972322, "grad_norm": 2.0210589593852935, "learning_rate": 8.768936653148238e-07, "loss": 0.6881, "step": 4242 }, { "epoch": 0.3914658055587591, "grad_norm": 2.2252430452388317, "learning_rate": 8.767214648340956e-07, "loss": 0.6681, "step": 4243 }, { "epoch": 0.391558067120286, "grad_norm": 2.453319884352639, "learning_rate": 8.765492415419718e-07, "loss": 0.9377, "step": 4244 }, { "epoch": 0.39165032868181293, "grad_norm": 2.2995127505561657, "learning_rate": 8.763769954540602e-07, "loss": 0.6208, "step": 4245 }, { "epoch": 0.39165032868181293, "eval_GEN Loss": 0.4683094620704651, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4013063609600067, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8981971144676208, "eval_runtime": 55.9065, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4245 }, { "epoch": 0.39174259024333985, "grad_norm": 1.5032394570002048, "learning_rate": 8.762047265859694e-07, "loss": 0.6121, "step": 4246 }, { "epoch": 0.3918348518048668, "grad_norm": 1.5480770372463208, "learning_rate": 8.760324349533107e-07, "loss": 0.6737, "step": 4247 }, { "epoch": 0.39192711336639374, "grad_norm": 3.29304573792603, "learning_rate": 8.758601205716979e-07, "loss": 1.124, "step": 4248 }, { "epoch": 0.39201937492792066, "grad_norm": 2.828185598759477, "learning_rate": 8.75687783456746e-07, "loss": 0.7595, "step": 4249 }, { "epoch": 0.3921116364894476, "grad_norm": 1.9740521344126285, "learning_rate": 8.755154236240724e-07, "loss": 0.7065, "step": 4250 }, { "epoch": 0.3921116364894476, "eval_GEN Loss": 0.46747711300849915, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.40354177355766296, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.889723539352417, "eval_runtime": 55.8998, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4250 }, { "epoch": 0.3922038980509745, "grad_norm": 3.759399027897542, "learning_rate": 8.75343041089297e-07, "loss": 1.1175, "step": 4251 }, { "epoch": 0.3922961596125014, "grad_norm": 1.6637726403596287, "learning_rate": 8.751706358680412e-07, "loss": 0.8956, "step": 4252 }, { "epoch": 0.3923884211740284, "grad_norm": 1.6850903286112668, "learning_rate": 8.749982079759284e-07, "loss": 0.6962, "step": 4253 }, { "epoch": 0.3924806827355553, "grad_norm": 1.7528438887076614, "learning_rate": 8.748257574285847e-07, "loss": 0.8169, "step": 4254 }, { "epoch": 0.3925729442970822, "grad_norm": 1.5810883783134633, "learning_rate": 8.746532842416374e-07, "loss": 0.6327, "step": 4255 }, { "epoch": 0.3925729442970822, "eval_GEN Loss": 0.4670736491680145, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.41287872195243835, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8895432949066162, "eval_runtime": 56.7809, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4255 }, { "epoch": 0.39266520585860915, "grad_norm": 2.8406146197077455, "learning_rate": 8.744807884307167e-07, "loss": 0.7154, "step": 4256 }, { "epoch": 0.39275746742013606, "grad_norm": 1.2857420565541273, "learning_rate": 8.743082700114544e-07, "loss": 0.5915, "step": 4257 }, { "epoch": 0.39284972898166304, "grad_norm": 1.637782652915373, "learning_rate": 8.74135728999484e-07, "loss": 0.7289, "step": 4258 }, { "epoch": 0.39294199054318996, "grad_norm": 2.969165663626796, "learning_rate": 8.739631654104418e-07, "loss": 0.8184, "step": 4259 }, { "epoch": 0.3930342521047169, "grad_norm": 2.559728727344599, "learning_rate": 8.737905792599656e-07, "loss": 0.6754, "step": 4260 }, { "epoch": 0.3930342521047169, "eval_GEN Loss": 0.46754637360572815, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.43243032693862915, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8934495449066162, "eval_runtime": 55.7105, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4260 }, { "epoch": 0.3931265136662438, "grad_norm": 2.5493950798759752, "learning_rate": 8.736179705636956e-07, "loss": 0.7258, "step": 4261 }, { "epoch": 0.3932187752277707, "grad_norm": 2.392558144440463, "learning_rate": 8.734453393372737e-07, "loss": 0.8199, "step": 4262 }, { "epoch": 0.3933110367892977, "grad_norm": 3.0183404373499054, "learning_rate": 8.73272685596344e-07, "loss": 0.765, "step": 4263 }, { "epoch": 0.3934032983508246, "grad_norm": 2.0420228995141523, "learning_rate": 8.73100009356553e-07, "loss": 0.8191, "step": 4264 }, { "epoch": 0.3934955599123515, "grad_norm": 1.6300875443257699, "learning_rate": 8.729273106335484e-07, "loss": 0.5293, "step": 4265 }, { "epoch": 0.3934955599123515, "eval_GEN Loss": 0.4678018093109131, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.42081284523010254, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8900841474533081, "eval_runtime": 55.9135, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4265 }, { "epoch": 0.39358782147387844, "grad_norm": 2.6738385856087556, "learning_rate": 8.727545894429808e-07, "loss": 0.8442, "step": 4266 }, { "epoch": 0.39368008303540536, "grad_norm": 2.977650023710774, "learning_rate": 8.725818458005023e-07, "loss": 0.7996, "step": 4267 }, { "epoch": 0.3937723445969323, "grad_norm": 2.202312702165346, "learning_rate": 8.724090797217673e-07, "loss": 0.7535, "step": 4268 }, { "epoch": 0.39386460615845925, "grad_norm": 2.2462239745983648, "learning_rate": 8.722362912224319e-07, "loss": 0.8528, "step": 4269 }, { "epoch": 0.39395686771998617, "grad_norm": 1.4743924556776011, "learning_rate": 8.72063480318155e-07, "loss": 0.6928, "step": 4270 }, { "epoch": 0.39395686771998617, "eval_GEN Loss": 0.46791863441467285, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4018362760543823, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8888221383094788, "eval_runtime": 55.8428, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4270 }, { "epoch": 0.3940491292815131, "grad_norm": 1.6676823465996011, "learning_rate": 8.718906470245962e-07, "loss": 0.6344, "step": 4271 }, { "epoch": 0.39414139084304, "grad_norm": 1.6338925494223546, "learning_rate": 8.717177913574185e-07, "loss": 0.5008, "step": 4272 }, { "epoch": 0.3942336524045669, "grad_norm": 2.31864908227619, "learning_rate": 8.715449133322862e-07, "loss": 0.8714, "step": 4273 }, { "epoch": 0.3943259139660939, "grad_norm": 2.967127583133976, "learning_rate": 8.713720129648658e-07, "loss": 0.8467, "step": 4274 }, { "epoch": 0.3944181755276208, "grad_norm": 1.7684710300278648, "learning_rate": 8.711990902708259e-07, "loss": 0.8083, "step": 4275 }, { "epoch": 0.3944181755276208, "eval_GEN Loss": 0.46796780824661255, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3863297998905182, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8980769515037537, "eval_runtime": 55.8049, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4275 }, { "epoch": 0.39451043708914774, "grad_norm": 2.1835758697785215, "learning_rate": 8.710261452658367e-07, "loss": 0.7628, "step": 4276 }, { "epoch": 0.39460269865067465, "grad_norm": 1.616844244186754, "learning_rate": 8.708531779655712e-07, "loss": 0.656, "step": 4277 }, { "epoch": 0.3946949602122016, "grad_norm": 1.9467251957577303, "learning_rate": 8.706801883857036e-07, "loss": 0.5198, "step": 4278 }, { "epoch": 0.39478722177372855, "grad_norm": 2.0203125928456545, "learning_rate": 8.705071765419107e-07, "loss": 0.7089, "step": 4279 }, { "epoch": 0.39487948333525547, "grad_norm": 2.401128089853153, "learning_rate": 8.703341424498709e-07, "loss": 0.5473, "step": 4280 }, { "epoch": 0.39487948333525547, "eval_GEN Loss": 0.469140887260437, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.37683579325675964, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8948917984962463, "eval_runtime": 56.0903, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 4280 }, { "epoch": 0.3949717448967824, "grad_norm": 2.4335425958896266, "learning_rate": 8.701610861252651e-07, "loss": 0.6486, "step": 4281 }, { "epoch": 0.3950640064583093, "grad_norm": 1.9253960622065953, "learning_rate": 8.699880075837758e-07, "loss": 0.6372, "step": 4282 }, { "epoch": 0.3951562680198362, "grad_norm": 2.1450626740156618, "learning_rate": 8.698149068410874e-07, "loss": 0.8274, "step": 4283 }, { "epoch": 0.39524852958136314, "grad_norm": 1.8894892390947697, "learning_rate": 8.69641783912887e-07, "loss": 0.5552, "step": 4284 }, { "epoch": 0.3953407911428901, "grad_norm": 1.3202127166939235, "learning_rate": 8.694686388148629e-07, "loss": 0.5809, "step": 4285 }, { "epoch": 0.3953407911428901, "eval_GEN Loss": 0.4691178798675537, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3823791444301605, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8769831657409668, "eval_runtime": 55.9286, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4285 }, { "epoch": 0.39543305270441703, "grad_norm": 1.7775162075571096, "learning_rate": 8.692954715627061e-07, "loss": 0.7479, "step": 4286 }, { "epoch": 0.39552531426594395, "grad_norm": 2.333735615942076, "learning_rate": 8.691222821721091e-07, "loss": 0.7185, "step": 4287 }, { "epoch": 0.39561757582747087, "grad_norm": 2.8226766334007642, "learning_rate": 8.689490706587665e-07, "loss": 0.7122, "step": 4288 }, { "epoch": 0.3957098373889978, "grad_norm": 2.0178110729702547, "learning_rate": 8.687758370383753e-07, "loss": 0.8036, "step": 4289 }, { "epoch": 0.39580209895052476, "grad_norm": 2.5008606023518145, "learning_rate": 8.686025813266341e-07, "loss": 0.9469, "step": 4290 }, { "epoch": 0.39580209895052476, "eval_GEN Loss": 0.46987855434417725, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3912084996700287, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8719350695610046, "eval_runtime": 55.8113, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4290 }, { "epoch": 0.3958943605120517, "grad_norm": 2.3268250789852067, "learning_rate": 8.684293035392434e-07, "loss": 0.8212, "step": 4291 }, { "epoch": 0.3959866220735786, "grad_norm": 1.9505158873446584, "learning_rate": 8.682560036919061e-07, "loss": 0.6496, "step": 4292 }, { "epoch": 0.3960788836351055, "grad_norm": 2.038437527865328, "learning_rate": 8.68082681800327e-07, "loss": 0.7373, "step": 4293 }, { "epoch": 0.39617114519663243, "grad_norm": 2.4737729408867306, "learning_rate": 8.679093378802126e-07, "loss": 0.7354, "step": 4294 }, { "epoch": 0.3962634067581594, "grad_norm": 1.6244962839446495, "learning_rate": 8.677359719472715e-07, "loss": 0.6132, "step": 4295 }, { "epoch": 0.3962634067581594, "eval_GEN Loss": 0.47019505500793457, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3758028745651245, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8687499761581421, "eval_runtime": 55.7957, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4295 }, { "epoch": 0.3963556683196863, "grad_norm": 1.5006721132422796, "learning_rate": 8.675625840172145e-07, "loss": 0.6793, "step": 4296 }, { "epoch": 0.39644792988121325, "grad_norm": 1.854110476334864, "learning_rate": 8.673891741057545e-07, "loss": 0.7255, "step": 4297 }, { "epoch": 0.39654019144274016, "grad_norm": 2.881951406084966, "learning_rate": 8.672157422286059e-07, "loss": 0.9449, "step": 4298 }, { "epoch": 0.3966324530042671, "grad_norm": 2.6298327970311997, "learning_rate": 8.670422884014857e-07, "loss": 0.8994, "step": 4299 }, { "epoch": 0.396724714565794, "grad_norm": 2.422473869873427, "learning_rate": 8.668688126401122e-07, "loss": 0.9399, "step": 4300 }, { "epoch": 0.396724714565794, "eval_GEN Loss": 0.4692126512527466, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36371347308158875, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8774639368057251, "eval_runtime": 55.8896, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4300 }, { "epoch": 0.396816976127321, "grad_norm": 1.5792953443899793, "learning_rate": 8.666953149602061e-07, "loss": 0.6925, "step": 4301 }, { "epoch": 0.3969092376888479, "grad_norm": 1.2419722108732951, "learning_rate": 8.665217953774902e-07, "loss": 0.6279, "step": 4302 }, { "epoch": 0.3970014992503748, "grad_norm": 3.743828938173356, "learning_rate": 8.663482539076891e-07, "loss": 0.6552, "step": 4303 }, { "epoch": 0.39709376081190173, "grad_norm": 2.2608987667639786, "learning_rate": 8.661746905665295e-07, "loss": 0.7684, "step": 4304 }, { "epoch": 0.39718602237342865, "grad_norm": 2.48220334487363, "learning_rate": 8.660011053697396e-07, "loss": 0.7858, "step": 4305 }, { "epoch": 0.39718602237342865, "eval_GEN Loss": 0.4675985872745514, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3623906970024109, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8757211565971375, "eval_runtime": 55.8885, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4305 }, { "epoch": 0.3972782839349556, "grad_norm": 1.9106094571790158, "learning_rate": 8.658274983330501e-07, "loss": 0.6983, "step": 4306 }, { "epoch": 0.39737054549648254, "grad_norm": 2.021054454586861, "learning_rate": 8.656538694721938e-07, "loss": 0.6352, "step": 4307 }, { "epoch": 0.39746280705800946, "grad_norm": 1.8533564134638605, "learning_rate": 8.65480218802905e-07, "loss": 0.6699, "step": 4308 }, { "epoch": 0.3975550686195364, "grad_norm": 1.8649460331187122, "learning_rate": 8.653065463409203e-07, "loss": 0.6021, "step": 4309 }, { "epoch": 0.3976473301810633, "grad_norm": 1.8993497965328716, "learning_rate": 8.65132852101978e-07, "loss": 0.8226, "step": 4310 }, { "epoch": 0.3976473301810633, "eval_GEN Loss": 0.46792805194854736, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3694693446159363, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8582331538200378, "eval_runtime": 55.9861, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4310 }, { "epoch": 0.39773959174259027, "grad_norm": 1.1810875212470133, "learning_rate": 8.649591361018189e-07, "loss": 0.6184, "step": 4311 }, { "epoch": 0.3978318533041172, "grad_norm": 2.0411580430573415, "learning_rate": 8.647853983561849e-07, "loss": 0.7681, "step": 4312 }, { "epoch": 0.3979241148656441, "grad_norm": 1.7961702318560229, "learning_rate": 8.646116388808208e-07, "loss": 0.7263, "step": 4313 }, { "epoch": 0.398016376427171, "grad_norm": 3.8066442571781756, "learning_rate": 8.64437857691473e-07, "loss": 0.8646, "step": 4314 }, { "epoch": 0.39810863798869794, "grad_norm": 1.7079718234420176, "learning_rate": 8.642640548038894e-07, "loss": 0.7741, "step": 4315 }, { "epoch": 0.39810863798869794, "eval_GEN Loss": 0.46880170702934265, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3784363567829132, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8519831895828247, "eval_runtime": 55.8455, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4315 }, { "epoch": 0.39820089955022486, "grad_norm": 1.693772350603163, "learning_rate": 8.640902302338205e-07, "loss": 0.7377, "step": 4316 }, { "epoch": 0.39829316111175184, "grad_norm": 1.9772742178441343, "learning_rate": 8.63916383997019e-07, "loss": 0.6117, "step": 4317 }, { "epoch": 0.39838542267327876, "grad_norm": 2.2263447589393395, "learning_rate": 8.637425161092385e-07, "loss": 0.7982, "step": 4318 }, { "epoch": 0.3984776842348057, "grad_norm": 2.169691279340369, "learning_rate": 8.635686265862353e-07, "loss": 0.8237, "step": 4319 }, { "epoch": 0.3985699457963326, "grad_norm": 3.8853240209915243, "learning_rate": 8.633947154437676e-07, "loss": 0.6362, "step": 4320 }, { "epoch": 0.3985699457963326, "eval_GEN Loss": 0.46980276703834534, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4024483561515808, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8568509817123413, "eval_runtime": 55.8756, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4320 }, { "epoch": 0.3986622073578595, "grad_norm": 1.3914618434889319, "learning_rate": 8.632207826975957e-07, "loss": 0.5795, "step": 4321 }, { "epoch": 0.3987544689193865, "grad_norm": 1.915776930310122, "learning_rate": 8.630468283634814e-07, "loss": 0.705, "step": 4322 }, { "epoch": 0.3988467304809134, "grad_norm": 1.7215899315176006, "learning_rate": 8.62872852457189e-07, "loss": 0.8159, "step": 4323 }, { "epoch": 0.3989389920424403, "grad_norm": 1.545074800659904, "learning_rate": 8.626988549944841e-07, "loss": 0.5778, "step": 4324 }, { "epoch": 0.39903125360396724, "grad_norm": 1.7586549280698154, "learning_rate": 8.625248359911349e-07, "loss": 0.8274, "step": 4325 }, { "epoch": 0.39903125360396724, "eval_GEN Loss": 0.46910834312438965, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8662420382165605, "eval_PRM F1 AUC": 0.7792037716081718, "eval_PRM F1 Neg": 0.6181818181818182, "eval_PRM Loss": 0.4126182198524475, "eval_PRM NPV": 0.53125, "eval_PRM Precision": 0.918918918918919, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8543269038200378, "eval_runtime": 55.8429, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4325 }, { "epoch": 0.39912351516549416, "grad_norm": 2.5558426758543007, "learning_rate": 8.623507954629112e-07, "loss": 0.638, "step": 4326 }, { "epoch": 0.39921577672702113, "grad_norm": 1.5081553023369632, "learning_rate": 8.621767334255848e-07, "loss": 0.6766, "step": 4327 }, { "epoch": 0.39930803828854805, "grad_norm": 2.1463099975729816, "learning_rate": 8.620026498949296e-07, "loss": 0.7741, "step": 4328 }, { "epoch": 0.39940029985007497, "grad_norm": 1.9034757117327512, "learning_rate": 8.618285448867211e-07, "loss": 0.6781, "step": 4329 }, { "epoch": 0.3994925614116019, "grad_norm": 1.2363998587003104, "learning_rate": 8.616544184167372e-07, "loss": 0.5225, "step": 4330 }, { "epoch": 0.3994925614116019, "eval_GEN Loss": 0.47018128633499146, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.40099209547042847, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8483173251152039, "eval_runtime": 56.7683, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4330 }, { "epoch": 0.3995848229731288, "grad_norm": 2.6054869448047797, "learning_rate": 8.614802705007573e-07, "loss": 0.8293, "step": 4331 }, { "epoch": 0.3996770845346557, "grad_norm": 1.871319476311996, "learning_rate": 8.613061011545631e-07, "loss": 0.6276, "step": 4332 }, { "epoch": 0.3997693460961827, "grad_norm": 2.2925421434459423, "learning_rate": 8.611319103939381e-07, "loss": 0.9295, "step": 4333 }, { "epoch": 0.3998616076577096, "grad_norm": 2.4538391934055537, "learning_rate": 8.609576982346676e-07, "loss": 0.8343, "step": 4334 }, { "epoch": 0.39995386921923654, "grad_norm": 2.8113169959474975, "learning_rate": 8.60783464692539e-07, "loss": 0.8452, "step": 4335 }, { "epoch": 0.39995386921923654, "eval_GEN Loss": 0.4706370234489441, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.3908641040325165, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8507211804389954, "eval_runtime": 56.6316, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4335 }, { "epoch": 0.40004613078076345, "grad_norm": 2.5281605112095114, "learning_rate": 8.606092097833418e-07, "loss": 0.9098, "step": 4336 }, { "epoch": 0.40013839234229037, "grad_norm": 1.3100590711659552, "learning_rate": 8.604349335228673e-07, "loss": 0.652, "step": 4337 }, { "epoch": 0.40023065390381735, "grad_norm": 1.5234659517323896, "learning_rate": 8.602606359269083e-07, "loss": 0.7689, "step": 4338 }, { "epoch": 0.40032291546534426, "grad_norm": 3.0874861229794472, "learning_rate": 8.600863170112604e-07, "loss": 0.9095, "step": 4339 }, { "epoch": 0.4004151770268712, "grad_norm": 2.235667731018532, "learning_rate": 8.599119767917204e-07, "loss": 0.7663, "step": 4340 }, { "epoch": 0.4004151770268712, "eval_GEN Loss": 0.4703901708126068, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.39742788672447205, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.849879801273346, "eval_runtime": 56.5996, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4340 }, { "epoch": 0.4005074385883981, "grad_norm": 1.9462855893287139, "learning_rate": 8.597376152840872e-07, "loss": 0.5899, "step": 4341 }, { "epoch": 0.400599700149925, "grad_norm": 2.6000624996684785, "learning_rate": 8.59563232504162e-07, "loss": 0.8631, "step": 4342 }, { "epoch": 0.400691961711452, "grad_norm": 2.156921172353974, "learning_rate": 8.593888284677472e-07, "loss": 0.5716, "step": 4343 }, { "epoch": 0.4007842232729789, "grad_norm": 2.584212344365474, "learning_rate": 8.59214403190648e-07, "loss": 0.8445, "step": 4344 }, { "epoch": 0.40087648483450583, "grad_norm": 2.03840427685523, "learning_rate": 8.590399566886708e-07, "loss": 0.6369, "step": 4345 }, { "epoch": 0.40087648483450583, "eval_GEN Loss": 0.4684564769268036, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.40281203389167786, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.848557710647583, "eval_runtime": 55.942, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4345 }, { "epoch": 0.40096874639603275, "grad_norm": 1.7097548289773044, "learning_rate": 8.588654889776244e-07, "loss": 0.7837, "step": 4346 }, { "epoch": 0.40106100795755967, "grad_norm": 1.613053005537647, "learning_rate": 8.586910000733193e-07, "loss": 0.7572, "step": 4347 }, { "epoch": 0.4011532695190866, "grad_norm": 2.1600841435389917, "learning_rate": 8.585164899915679e-07, "loss": 0.8231, "step": 4348 }, { "epoch": 0.40124553108061356, "grad_norm": 2.3169260190547933, "learning_rate": 8.583419587481845e-07, "loss": 0.8244, "step": 4349 }, { "epoch": 0.4013377926421405, "grad_norm": 2.4666178968342956, "learning_rate": 8.581674063589858e-07, "loss": 0.7386, "step": 4350 }, { "epoch": 0.4013377926421405, "eval_GEN Loss": 0.46762922406196594, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.4029407203197479, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.849879801273346, "eval_runtime": 56.6279, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4350 }, { "epoch": 0.4014300542036674, "grad_norm": 1.9500004709727101, "learning_rate": 8.579928328397897e-07, "loss": 0.7464, "step": 4351 }, { "epoch": 0.4015223157651943, "grad_norm": 1.7715356063353256, "learning_rate": 8.578182382064161e-07, "loss": 0.6496, "step": 4352 }, { "epoch": 0.40161457732672123, "grad_norm": 1.7966537489965584, "learning_rate": 8.576436224746874e-07, "loss": 0.7461, "step": 4353 }, { "epoch": 0.4017068388882482, "grad_norm": 1.4498825680301908, "learning_rate": 8.574689856604274e-07, "loss": 0.5625, "step": 4354 }, { "epoch": 0.4017991004497751, "grad_norm": 1.805573182684093, "learning_rate": 8.572943277794623e-07, "loss": 0.683, "step": 4355 }, { "epoch": 0.4017991004497751, "eval_GEN Loss": 0.46739768981933594, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.3970527946949005, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8538461327552795, "eval_runtime": 56.8637, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 4355 }, { "epoch": 0.40189136201130204, "grad_norm": 1.9613282217487513, "learning_rate": 8.571196488476191e-07, "loss": 0.6686, "step": 4356 }, { "epoch": 0.40198362357282896, "grad_norm": 1.632307050440881, "learning_rate": 8.569449488807282e-07, "loss": 0.7813, "step": 4357 }, { "epoch": 0.4020758851343559, "grad_norm": 1.6378752783854558, "learning_rate": 8.56770227894621e-07, "loss": 0.4462, "step": 4358 }, { "epoch": 0.40216814669588286, "grad_norm": 2.5864864685607944, "learning_rate": 8.56595485905131e-07, "loss": 0.7576, "step": 4359 }, { "epoch": 0.4022604082574098, "grad_norm": 1.7330514206039742, "learning_rate": 8.564207229280934e-07, "loss": 0.7924, "step": 4360 }, { "epoch": 0.4022604082574098, "eval_GEN Loss": 0.46744897961616516, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38540875911712646, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8606970906257629, "eval_runtime": 56.7162, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4360 }, { "epoch": 0.4023526698189367, "grad_norm": 3.369996026573113, "learning_rate": 8.562459389793456e-07, "loss": 0.7206, "step": 4361 }, { "epoch": 0.4024449313804636, "grad_norm": 3.2931655708702103, "learning_rate": 8.560711340747269e-07, "loss": 1.0202, "step": 4362 }, { "epoch": 0.40253719294199053, "grad_norm": 1.8059033468820964, "learning_rate": 8.558963082300784e-07, "loss": 0.7273, "step": 4363 }, { "epoch": 0.40262945450351745, "grad_norm": 1.8184119178783473, "learning_rate": 8.557214614612428e-07, "loss": 0.8668, "step": 4364 }, { "epoch": 0.4027217160650444, "grad_norm": 2.9247755605565113, "learning_rate": 8.555465937840654e-07, "loss": 0.7438, "step": 4365 }, { "epoch": 0.4027217160650444, "eval_GEN Loss": 0.46761518716812134, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38552287220954895, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8652644157409668, "eval_runtime": 56.6237, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4365 }, { "epoch": 0.40281397762657134, "grad_norm": 2.007352052654947, "learning_rate": 8.553717052143927e-07, "loss": 0.5653, "step": 4366 }, { "epoch": 0.40290623918809826, "grad_norm": 2.4348150487070366, "learning_rate": 8.551967957680735e-07, "loss": 0.7362, "step": 4367 }, { "epoch": 0.4029985007496252, "grad_norm": 1.6882944930720185, "learning_rate": 8.550218654609583e-07, "loss": 0.6152, "step": 4368 }, { "epoch": 0.4030907623111521, "grad_norm": 2.728792418299751, "learning_rate": 8.548469143088995e-07, "loss": 0.9368, "step": 4369 }, { "epoch": 0.40318302387267907, "grad_norm": 1.7312906967832777, "learning_rate": 8.546719423277515e-07, "loss": 0.6434, "step": 4370 }, { "epoch": 0.40318302387267907, "eval_GEN Loss": 0.4671454131603241, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37842366099357605, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8683894276618958, "eval_runtime": 55.9002, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4370 }, { "epoch": 0.403275285434206, "grad_norm": 2.387194276491699, "learning_rate": 8.544969495333708e-07, "loss": 0.7262, "step": 4371 }, { "epoch": 0.4033675469957329, "grad_norm": 2.3504103136965036, "learning_rate": 8.54321935941615e-07, "loss": 0.8849, "step": 4372 }, { "epoch": 0.4034598085572598, "grad_norm": 2.5378532715092943, "learning_rate": 8.541469015683448e-07, "loss": 0.6914, "step": 4373 }, { "epoch": 0.40355207011878674, "grad_norm": 1.3334952623466765, "learning_rate": 8.539718464294214e-07, "loss": 0.5388, "step": 4374 }, { "epoch": 0.40364433168031366, "grad_norm": 2.5910527360789968, "learning_rate": 8.537967705407091e-07, "loss": 1.1671, "step": 4375 }, { "epoch": 0.40364433168031366, "eval_GEN Loss": 0.4680883288383484, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.39346766471862793, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.876682698726654, "eval_runtime": 56.8994, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 4375 }, { "epoch": 0.40373659324184064, "grad_norm": 2.4608254281800583, "learning_rate": 8.536216739180732e-07, "loss": 0.8573, "step": 4376 }, { "epoch": 0.40382885480336755, "grad_norm": 1.6992940977093691, "learning_rate": 8.534465565773812e-07, "loss": 0.8575, "step": 4377 }, { "epoch": 0.4039211163648945, "grad_norm": 2.17954121982997, "learning_rate": 8.53271418534503e-07, "loss": 0.9639, "step": 4378 }, { "epoch": 0.4040133779264214, "grad_norm": 1.8256402776695555, "learning_rate": 8.530962598053093e-07, "loss": 0.6011, "step": 4379 }, { "epoch": 0.4041056394879483, "grad_norm": 1.9087405972380291, "learning_rate": 8.529210804056736e-07, "loss": 0.6906, "step": 4380 }, { "epoch": 0.4041056394879483, "eval_GEN Loss": 0.46784546971321106, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.41346266865730286, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8895432949066162, "eval_runtime": 56.7067, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4380 }, { "epoch": 0.4041979010494753, "grad_norm": 1.8445393058249546, "learning_rate": 8.527458803514707e-07, "loss": 0.8251, "step": 4381 }, { "epoch": 0.4042901626110022, "grad_norm": 1.9618027964644604, "learning_rate": 8.525706596585778e-07, "loss": 0.8287, "step": 4382 }, { "epoch": 0.4043824241725291, "grad_norm": 1.9320467612487213, "learning_rate": 8.523954183428734e-07, "loss": 0.801, "step": 4383 }, { "epoch": 0.40447468573405604, "grad_norm": 1.875394469172402, "learning_rate": 8.522201564202384e-07, "loss": 0.8412, "step": 4384 }, { "epoch": 0.40456694729558296, "grad_norm": 2.4927860706774556, "learning_rate": 8.520448739065551e-07, "loss": 0.7267, "step": 4385 }, { "epoch": 0.40456694729558296, "eval_GEN Loss": 0.4678288698196411, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.4132847785949707, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8905649185180664, "eval_runtime": 56.7675, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4385 }, { "epoch": 0.40465920885710993, "grad_norm": 1.7263428219561536, "learning_rate": 8.51869570817708e-07, "loss": 0.6153, "step": 4386 }, { "epoch": 0.40475147041863685, "grad_norm": 1.4988849618998097, "learning_rate": 8.516942471695832e-07, "loss": 0.6473, "step": 4387 }, { "epoch": 0.40484373198016377, "grad_norm": 1.1853685593104997, "learning_rate": 8.51518902978069e-07, "loss": 0.51, "step": 4388 }, { "epoch": 0.4049359935416907, "grad_norm": 2.2161008965613775, "learning_rate": 8.513435382590553e-07, "loss": 0.8579, "step": 4389 }, { "epoch": 0.4050282551032176, "grad_norm": 1.9920668011206768, "learning_rate": 8.511681530284338e-07, "loss": 0.7394, "step": 4390 }, { "epoch": 0.4050282551032176, "eval_GEN Loss": 0.46759864687919617, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.395404577255249, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8879206776618958, "eval_runtime": 56.6619, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4390 }, { "epoch": 0.4051205166647445, "grad_norm": 2.2142864018699857, "learning_rate": 8.509927473020984e-07, "loss": 0.7945, "step": 4391 }, { "epoch": 0.4052127782262715, "grad_norm": 3.7178164515061827, "learning_rate": 8.508173210959443e-07, "loss": 0.8368, "step": 4392 }, { "epoch": 0.4053050397877984, "grad_norm": 2.126597112537908, "learning_rate": 8.506418744258691e-07, "loss": 0.7517, "step": 4393 }, { "epoch": 0.40539730134932533, "grad_norm": 1.7946472581849136, "learning_rate": 8.504664073077723e-07, "loss": 0.841, "step": 4394 }, { "epoch": 0.40548956291085225, "grad_norm": 1.4681017207467861, "learning_rate": 8.502909197575545e-07, "loss": 0.749, "step": 4395 }, { "epoch": 0.40548956291085225, "eval_GEN Loss": 0.46796053647994995, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3973378539085388, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8907451629638672, "eval_runtime": 56.8194, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4395 }, { "epoch": 0.40558182447237917, "grad_norm": 1.7169143722621392, "learning_rate": 8.501154117911194e-07, "loss": 0.8347, "step": 4396 }, { "epoch": 0.40567408603390614, "grad_norm": 2.1505651863819844, "learning_rate": 8.49939883424371e-07, "loss": 0.7512, "step": 4397 }, { "epoch": 0.40576634759543306, "grad_norm": 2.8080987594474296, "learning_rate": 8.497643346732164e-07, "loss": 0.8967, "step": 4398 }, { "epoch": 0.40585860915696, "grad_norm": 1.7603215902984848, "learning_rate": 8.49588765553564e-07, "loss": 0.7488, "step": 4399 }, { "epoch": 0.4059508707184869, "grad_norm": 3.248644485469129, "learning_rate": 8.494131760813243e-07, "loss": 0.6555, "step": 4400 }, { "epoch": 0.4059508707184869, "eval_GEN Loss": 0.46874508261680603, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4028520882129669, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8941105604171753, "eval_runtime": 56.6489, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4400 }, { "epoch": 0.4060431322800138, "grad_norm": 2.126199976435892, "learning_rate": 8.49237566272409e-07, "loss": 0.748, "step": 4401 }, { "epoch": 0.4061353938415408, "grad_norm": 1.876211486711498, "learning_rate": 8.490619361427327e-07, "loss": 0.6085, "step": 4402 }, { "epoch": 0.4062276554030677, "grad_norm": 1.90944988052703, "learning_rate": 8.488862857082112e-07, "loss": 0.5791, "step": 4403 }, { "epoch": 0.40631991696459463, "grad_norm": 3.087267682102724, "learning_rate": 8.487106149847619e-07, "loss": 0.7401, "step": 4404 }, { "epoch": 0.40641217852612155, "grad_norm": 1.6621465576501164, "learning_rate": 8.485349239883045e-07, "loss": 0.6956, "step": 4405 }, { "epoch": 0.40641217852612155, "eval_GEN Loss": 0.4685569703578949, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8944099378881988, "eval_PRM F1 AUC": 0.8033001571503404, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4055129587650299, "eval_PRM NPV": 0.6071428571428571, "eval_PRM Precision": 0.9230769230769231, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8938701748847961, "eval_runtime": 56.6806, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4405 }, { "epoch": 0.40650444008764847, "grad_norm": 1.4851470168327767, "learning_rate": 8.483592127347605e-07, "loss": 0.661, "step": 4406 }, { "epoch": 0.4065967016491754, "grad_norm": 1.8451475631657672, "learning_rate": 8.481834812400532e-07, "loss": 0.7586, "step": 4407 }, { "epoch": 0.40668896321070236, "grad_norm": 1.3547269587281008, "learning_rate": 8.480077295201072e-07, "loss": 0.7059, "step": 4408 }, { "epoch": 0.4067812247722293, "grad_norm": 1.7124027834867268, "learning_rate": 8.478319575908502e-07, "loss": 0.6812, "step": 4409 }, { "epoch": 0.4068734863337562, "grad_norm": 1.759564729600565, "learning_rate": 8.4765616546821e-07, "loss": 0.7851, "step": 4410 }, { "epoch": 0.4068734863337562, "eval_GEN Loss": 0.4692930281162262, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.42200595140457153, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9019230604171753, "eval_runtime": 56.7105, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4410 }, { "epoch": 0.4069657478952831, "grad_norm": 1.7811880694067443, "learning_rate": 8.474803531681181e-07, "loss": 0.5887, "step": 4411 }, { "epoch": 0.40705800945681003, "grad_norm": 2.2451517550932794, "learning_rate": 8.473045207065062e-07, "loss": 0.7215, "step": 4412 }, { "epoch": 0.407150271018337, "grad_norm": 1.7316909628745827, "learning_rate": 8.471286680993085e-07, "loss": 0.7175, "step": 4413 }, { "epoch": 0.4072425325798639, "grad_norm": 2.340231309531403, "learning_rate": 8.469527953624615e-07, "loss": 0.6224, "step": 4414 }, { "epoch": 0.40733479414139084, "grad_norm": 1.4651810419410551, "learning_rate": 8.467769025119027e-07, "loss": 0.5748, "step": 4415 }, { "epoch": 0.40733479414139084, "eval_GEN Loss": 0.4682878255844116, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.4185051918029785, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.9013822078704834, "eval_runtime": 56.5889, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 4415 }, { "epoch": 0.40742705570291776, "grad_norm": 1.879025493176752, "learning_rate": 8.46600989563572e-07, "loss": 0.7935, "step": 4416 }, { "epoch": 0.4075193172644447, "grad_norm": 2.327842369918227, "learning_rate": 8.464250565334107e-07, "loss": 0.5894, "step": 4417 }, { "epoch": 0.40761157882597165, "grad_norm": 1.3246416414931381, "learning_rate": 8.462491034373623e-07, "loss": 0.5294, "step": 4418 }, { "epoch": 0.4077038403874986, "grad_norm": 3.7774430830015397, "learning_rate": 8.46073130291372e-07, "loss": 0.706, "step": 4419 }, { "epoch": 0.4077961019490255, "grad_norm": 2.650456065546193, "learning_rate": 8.458971371113865e-07, "loss": 0.882, "step": 4420 }, { "epoch": 0.4077961019490255, "eval_GEN Loss": 0.467420756816864, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.39714956283569336, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.89453125, "eval_runtime": 56.6992, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4420 }, { "epoch": 0.4078883635105524, "grad_norm": 2.0157016281789484, "learning_rate": 8.457211239133549e-07, "loss": 0.9023, "step": 4421 }, { "epoch": 0.40798062507207933, "grad_norm": 2.223748213372893, "learning_rate": 8.455450907132276e-07, "loss": 0.6436, "step": 4422 }, { "epoch": 0.40807288663360625, "grad_norm": 3.16632598211609, "learning_rate": 8.453690375269571e-07, "loss": 0.987, "step": 4423 }, { "epoch": 0.4081651481951332, "grad_norm": 2.002340916306112, "learning_rate": 8.451929643704973e-07, "loss": 0.758, "step": 4424 }, { "epoch": 0.40825740975666014, "grad_norm": 1.4163943534286552, "learning_rate": 8.450168712598047e-07, "loss": 0.6064, "step": 4425 }, { "epoch": 0.40825740975666014, "eval_GEN Loss": 0.4673185646533966, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3878537714481354, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8930889368057251, "eval_runtime": 56.7088, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4425 }, { "epoch": 0.40834967131818706, "grad_norm": 1.7478277707364132, "learning_rate": 8.448407582108369e-07, "loss": 0.7904, "step": 4426 }, { "epoch": 0.408441932879714, "grad_norm": 2.2197129291864166, "learning_rate": 8.446646252395533e-07, "loss": 1.0033, "step": 4427 }, { "epoch": 0.4085341944412409, "grad_norm": 1.675542293324628, "learning_rate": 8.444884723619159e-07, "loss": 0.8066, "step": 4428 }, { "epoch": 0.40862645600276787, "grad_norm": 1.4592189769777335, "learning_rate": 8.443122995938876e-07, "loss": 0.6287, "step": 4429 }, { "epoch": 0.4087187175642948, "grad_norm": 1.3523548018805331, "learning_rate": 8.441361069514334e-07, "loss": 0.6749, "step": 4430 }, { "epoch": 0.4087187175642948, "eval_GEN Loss": 0.4690874218940735, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.39502543210983276, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8984375, "eval_runtime": 56.7137, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4430 }, { "epoch": 0.4088109791258217, "grad_norm": 1.5013281547125283, "learning_rate": 8.439598944505204e-07, "loss": 0.6776, "step": 4431 }, { "epoch": 0.4089032406873486, "grad_norm": 1.7706508398410616, "learning_rate": 8.437836621071171e-07, "loss": 0.6414, "step": 4432 }, { "epoch": 0.40899550224887554, "grad_norm": 2.4259695608999476, "learning_rate": 8.436074099371938e-07, "loss": 0.7821, "step": 4433 }, { "epoch": 0.4090877638104025, "grad_norm": 2.524478691095849, "learning_rate": 8.434311379567231e-07, "loss": 0.7882, "step": 4434 }, { "epoch": 0.40918002537192943, "grad_norm": 1.722788404617185, "learning_rate": 8.432548461816788e-07, "loss": 0.6921, "step": 4435 }, { "epoch": 0.40918002537192943, "eval_GEN Loss": 0.4683658182621002, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.38892853260040283, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.890625, "eval_runtime": 56.9599, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 4435 }, { "epoch": 0.40927228693345635, "grad_norm": 1.7227399959850518, "learning_rate": 8.430785346280368e-07, "loss": 0.6833, "step": 4436 }, { "epoch": 0.40936454849498327, "grad_norm": 2.7846131252207473, "learning_rate": 8.429022033117748e-07, "loss": 1.0043, "step": 4437 }, { "epoch": 0.4094568100565102, "grad_norm": 2.058279534043985, "learning_rate": 8.42725852248872e-07, "loss": 0.7642, "step": 4438 }, { "epoch": 0.4095490716180371, "grad_norm": 2.8036887462122917, "learning_rate": 8.425494814553098e-07, "loss": 0.7572, "step": 4439 }, { "epoch": 0.4096413331795641, "grad_norm": 1.5305309942984735, "learning_rate": 8.423730909470712e-07, "loss": 0.7385, "step": 4440 }, { "epoch": 0.4096413331795641, "eval_GEN Loss": 0.46863633394241333, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9146341463414634, "eval_PRM F1 AUC": 0.8213724463069669, "eval_PRM F1 Neg": 0.7083333333333334, "eval_PRM Loss": 0.3912132680416107, "eval_PRM NPV": 0.68, "eval_PRM Precision": 0.9259259259259259, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8941707015037537, "eval_runtime": 55.83, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4440 }, { "epoch": 0.409733594741091, "grad_norm": 1.6620025701406809, "learning_rate": 8.421966807401409e-07, "loss": 0.6896, "step": 4441 }, { "epoch": 0.4098258563026179, "grad_norm": 2.3311673457438267, "learning_rate": 8.420202508505056e-07, "loss": 0.7278, "step": 4442 }, { "epoch": 0.40991811786414484, "grad_norm": 2.0409251633390197, "learning_rate": 8.418438012941535e-07, "loss": 0.6658, "step": 4443 }, { "epoch": 0.41001037942567176, "grad_norm": 2.7458604685369465, "learning_rate": 8.41667332087075e-07, "loss": 0.8577, "step": 4444 }, { "epoch": 0.41010264098719873, "grad_norm": 1.809262802391263, "learning_rate": 8.414908432452616e-07, "loss": 0.6504, "step": 4445 }, { "epoch": 0.41010264098719873, "eval_GEN Loss": 0.4685811698436737, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9079754601226994, "eval_PRM F1 AUC": 0.8153483499214248, "eval_PRM F1 Neg": 0.6938775510204082, "eval_PRM Loss": 0.39829114079475403, "eval_PRM NPV": 0.6538461538461539, "eval_PRM Precision": 0.925, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8966947197914124, "eval_runtime": 56.0773, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 4445 }, { "epoch": 0.41019490254872565, "grad_norm": 2.2159807326316163, "learning_rate": 8.413143347847073e-07, "loss": 0.8437, "step": 4446 }, { "epoch": 0.41028716411025257, "grad_norm": 1.815086239177233, "learning_rate": 8.411378067214075e-07, "loss": 0.7837, "step": 4447 }, { "epoch": 0.4103794256717795, "grad_norm": 1.8169003421483951, "learning_rate": 8.409612590713595e-07, "loss": 0.814, "step": 4448 }, { "epoch": 0.4104716872333064, "grad_norm": 1.5581465180457919, "learning_rate": 8.407846918505621e-07, "loss": 0.7114, "step": 4449 }, { "epoch": 0.4105639487948334, "grad_norm": 1.7951832995862964, "learning_rate": 8.406081050750164e-07, "loss": 0.7132, "step": 4450 }, { "epoch": 0.4105639487948334, "eval_GEN Loss": 0.4693397581577301, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9, "eval_PRM F1 AUC": 0.8250392875851232, "eval_PRM F1 Neg": 0.6923076923076923, "eval_PRM Loss": 0.4170929193496704, "eval_PRM NPV": 0.6206896551724138, "eval_PRM Precision": 0.935064935064935, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9039062261581421, "eval_runtime": 55.981, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4450 }, { "epoch": 0.4106562103563603, "grad_norm": 2.0050657877483835, "learning_rate": 8.40431498760725e-07, "loss": 0.6324, "step": 4451 }, { "epoch": 0.4107484719178872, "grad_norm": 2.1479722246348203, "learning_rate": 8.402548729236919e-07, "loss": 0.576, "step": 4452 }, { "epoch": 0.41084073347941413, "grad_norm": 2.2416873439526057, "learning_rate": 8.400782275799236e-07, "loss": 0.7593, "step": 4453 }, { "epoch": 0.41093299504094105, "grad_norm": 1.9037926701573586, "learning_rate": 8.399015627454274e-07, "loss": 0.7573, "step": 4454 }, { "epoch": 0.41102525660246797, "grad_norm": 2.282854272157789, "learning_rate": 8.397248784362136e-07, "loss": 0.8826, "step": 4455 }, { "epoch": 0.41102525660246797, "eval_GEN Loss": 0.4691080152988434, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.4137914180755615, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.905348539352417, "eval_runtime": 55.8514, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4455 }, { "epoch": 0.41111751816399494, "grad_norm": 2.0067909166136464, "learning_rate": 8.395481746682932e-07, "loss": 0.7274, "step": 4456 }, { "epoch": 0.41120977972552186, "grad_norm": 2.1478142640649573, "learning_rate": 8.393714514576797e-07, "loss": 0.8989, "step": 4457 }, { "epoch": 0.4113020412870488, "grad_norm": 3.3050958758486906, "learning_rate": 8.391947088203877e-07, "loss": 0.756, "step": 4458 }, { "epoch": 0.4113943028485757, "grad_norm": 1.4580142202762119, "learning_rate": 8.390179467724341e-07, "loss": 0.744, "step": 4459 }, { "epoch": 0.4114865644101026, "grad_norm": 2.115557227177532, "learning_rate": 8.388411653298373e-07, "loss": 0.7162, "step": 4460 }, { "epoch": 0.4114865644101026, "eval_GEN Loss": 0.46775931119918823, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.40120822191238403, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9041466116905212, "eval_runtime": 55.8126, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4460 }, { "epoch": 0.4115788259716296, "grad_norm": 2.704404467676901, "learning_rate": 8.386643645086174e-07, "loss": 0.7605, "step": 4461 }, { "epoch": 0.4116710875331565, "grad_norm": 1.8194182036124926, "learning_rate": 8.384875443247965e-07, "loss": 0.7232, "step": 4462 }, { "epoch": 0.41176334909468343, "grad_norm": 1.4935980073225366, "learning_rate": 8.383107047943984e-07, "loss": 0.6165, "step": 4463 }, { "epoch": 0.41185561065621035, "grad_norm": 1.6614528684593, "learning_rate": 8.381338459334484e-07, "loss": 0.5703, "step": 4464 }, { "epoch": 0.41194787221773727, "grad_norm": 1.2808233276497625, "learning_rate": 8.379569677579738e-07, "loss": 0.5915, "step": 4465 }, { "epoch": 0.41194787221773727, "eval_GEN Loss": 0.46657660603523254, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.39101603627204895, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9128004908561707, "eval_runtime": 55.9853, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4465 }, { "epoch": 0.41204013377926424, "grad_norm": 2.186578060323299, "learning_rate": 8.377800702840034e-07, "loss": 0.8973, "step": 4466 }, { "epoch": 0.41213239534079116, "grad_norm": 1.9318827540981358, "learning_rate": 8.376031535275685e-07, "loss": 0.662, "step": 4467 }, { "epoch": 0.4122246569023181, "grad_norm": 3.6880093608066518, "learning_rate": 8.374262175047008e-07, "loss": 0.9352, "step": 4468 }, { "epoch": 0.412316918463845, "grad_norm": 1.4699628358500672, "learning_rate": 8.372492622314351e-07, "loss": 0.4356, "step": 4469 }, { "epoch": 0.4124091800253719, "grad_norm": 2.2722085263208913, "learning_rate": 8.370722877238074e-07, "loss": 0.8579, "step": 4470 }, { "epoch": 0.4124091800253719, "eval_GEN Loss": 0.4665497839450836, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.39095500111579895, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9246995449066162, "eval_runtime": 55.8651, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4470 }, { "epoch": 0.41250144158689883, "grad_norm": 2.2356962555940334, "learning_rate": 8.368952939978551e-07, "loss": 0.833, "step": 4471 }, { "epoch": 0.4125937031484258, "grad_norm": 1.8751205604035595, "learning_rate": 8.367182810696174e-07, "loss": 0.6344, "step": 4472 }, { "epoch": 0.4126859647099527, "grad_norm": 3.220241121045629, "learning_rate": 8.365412489551361e-07, "loss": 0.9262, "step": 4473 }, { "epoch": 0.41277822627147964, "grad_norm": 1.3901277316331762, "learning_rate": 8.363641976704537e-07, "loss": 0.6542, "step": 4474 }, { "epoch": 0.41287048783300656, "grad_norm": 1.596711024441536, "learning_rate": 8.361871272316149e-07, "loss": 0.6882, "step": 4475 }, { "epoch": 0.41287048783300656, "eval_GEN Loss": 0.46529778838157654, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3983197808265686, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9189903736114502, "eval_runtime": 55.9033, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4475 }, { "epoch": 0.4129627493945335, "grad_norm": 1.6681143143459427, "learning_rate": 8.360100376546665e-07, "loss": 0.7299, "step": 4476 }, { "epoch": 0.41305501095606045, "grad_norm": 2.2424161084535594, "learning_rate": 8.358329289556562e-07, "loss": 0.673, "step": 4477 }, { "epoch": 0.41314727251758737, "grad_norm": 1.7662827683428823, "learning_rate": 8.356558011506341e-07, "loss": 0.7465, "step": 4478 }, { "epoch": 0.4132395340791143, "grad_norm": 3.055652146740076, "learning_rate": 8.354786542556515e-07, "loss": 0.8324, "step": 4479 }, { "epoch": 0.4133317956406412, "grad_norm": 1.488356917683893, "learning_rate": 8.353014882867623e-07, "loss": 0.4947, "step": 4480 }, { "epoch": 0.4133317956406412, "eval_GEN Loss": 0.46626776456832886, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.40798261761665344, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9106971025466919, "eval_runtime": 56.9463, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 4480 }, { "epoch": 0.4134240572021681, "grad_norm": 1.7835403412196758, "learning_rate": 8.35124303260021e-07, "loss": 0.7146, "step": 4481 }, { "epoch": 0.4135163187636951, "grad_norm": 1.9581232939708986, "learning_rate": 8.349470991914846e-07, "loss": 0.77, "step": 4482 }, { "epoch": 0.413608580325222, "grad_norm": 1.5995569070562858, "learning_rate": 8.347698760972117e-07, "loss": 0.5544, "step": 4483 }, { "epoch": 0.41370084188674894, "grad_norm": 2.5398514864931605, "learning_rate": 8.345926339932624e-07, "loss": 0.8174, "step": 4484 }, { "epoch": 0.41379310344827586, "grad_norm": 1.5217580094923997, "learning_rate": 8.344153728956987e-07, "loss": 0.6762, "step": 4485 }, { "epoch": 0.41379310344827586, "eval_GEN Loss": 0.4669657051563263, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9012345679012346, "eval_PRM F1 AUC": 0.8093242535358826, "eval_PRM F1 Neg": 0.68, "eval_PRM Loss": 0.41092225909233093, "eval_PRM NPV": 0.6296296296296297, "eval_PRM Precision": 0.9240506329113924, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8997595906257629, "eval_runtime": 56.6675, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4485 }, { "epoch": 0.4138853650098028, "grad_norm": 3.042243171827483, "learning_rate": 8.342380928205842e-07, "loss": 0.7689, "step": 4486 }, { "epoch": 0.4139776265713297, "grad_norm": 1.5485432781574762, "learning_rate": 8.340607937839845e-07, "loss": 0.8441, "step": 4487 }, { "epoch": 0.41406988813285667, "grad_norm": 1.756016456470045, "learning_rate": 8.338834758019666e-07, "loss": 0.6179, "step": 4488 }, { "epoch": 0.4141621496943836, "grad_norm": 2.4625968719934614, "learning_rate": 8.337061388905994e-07, "loss": 0.8448, "step": 4489 }, { "epoch": 0.4142544112559105, "grad_norm": 1.935119372912926, "learning_rate": 8.335287830659532e-07, "loss": 0.7571, "step": 4490 }, { "epoch": 0.4142544112559105, "eval_GEN Loss": 0.46851304173469543, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8717948717948718, "eval_PRM F1 AUC": 0.8009429020429545, "eval_PRM F1 Neg": 0.6428571428571429, "eval_PRM Loss": 0.4371475577354431, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.9315068493150684, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.9039062261581421, "eval_runtime": 56.6122, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4490 }, { "epoch": 0.4143466728174374, "grad_norm": 2.2362447481289847, "learning_rate": 8.333514083441005e-07, "loss": 0.6513, "step": 4491 }, { "epoch": 0.41443893437896434, "grad_norm": 1.5410883047355917, "learning_rate": 8.331740147411154e-07, "loss": 0.6805, "step": 4492 }, { "epoch": 0.4145311959404913, "grad_norm": 2.7168498366099927, "learning_rate": 8.329966022730731e-07, "loss": 0.802, "step": 4493 }, { "epoch": 0.41462345750201823, "grad_norm": 2.572989119387312, "learning_rate": 8.328191709560517e-07, "loss": 0.8211, "step": 4494 }, { "epoch": 0.41471571906354515, "grad_norm": 2.550119540256824, "learning_rate": 8.326417208061296e-07, "loss": 0.5406, "step": 4495 }, { "epoch": 0.41471571906354515, "eval_GEN Loss": 0.4688943326473236, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.864516129032258, "eval_PRM F1 AUC": 0.7949188056574124, "eval_PRM F1 Neg": 0.631578947368421, "eval_PRM Loss": 0.44194895029067993, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.9305555555555556, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.8975961804389954, "eval_runtime": 56.8679, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 4495 }, { "epoch": 0.41480798062507207, "grad_norm": 2.7199340244458647, "learning_rate": 8.324642518393882e-07, "loss": 0.9646, "step": 4496 }, { "epoch": 0.414900242186599, "grad_norm": 1.891792622852327, "learning_rate": 8.322867640719094e-07, "loss": 0.8376, "step": 4497 }, { "epoch": 0.41499250374812596, "grad_norm": 2.6360234208519358, "learning_rate": 8.321092575197778e-07, "loss": 0.8396, "step": 4498 }, { "epoch": 0.4150847653096529, "grad_norm": 1.7398535721206243, "learning_rate": 8.319317321990796e-07, "loss": 0.668, "step": 4499 }, { "epoch": 0.4151770268711798, "grad_norm": 2.429001589129579, "learning_rate": 8.317541881259019e-07, "loss": 0.744, "step": 4500 }, { "epoch": 0.4151770268711798, "eval_GEN Loss": 0.46817731857299805, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.42457708716392517, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8905048370361328, "eval_runtime": 56.6838, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4500 }, { "epoch": 0.4152692884327067, "grad_norm": 2.064673484711817, "learning_rate": 8.315766253163343e-07, "loss": 0.6263, "step": 4501 }, { "epoch": 0.41536154999423364, "grad_norm": 2.4450738164345376, "learning_rate": 8.313990437864678e-07, "loss": 0.7596, "step": 4502 }, { "epoch": 0.41545381155576055, "grad_norm": 2.2871975664051325, "learning_rate": 8.312214435523949e-07, "loss": 0.8851, "step": 4503 }, { "epoch": 0.41554607311728753, "grad_norm": 2.11922700554762, "learning_rate": 8.310438246302102e-07, "loss": 0.7334, "step": 4504 }, { "epoch": 0.41563833467881445, "grad_norm": 2.5553943399106367, "learning_rate": 8.3086618703601e-07, "loss": 0.7467, "step": 4505 }, { "epoch": 0.41563833467881445, "eval_GEN Loss": 0.4669327437877655, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.39795249700546265, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8918269276618958, "eval_runtime": 56.649, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4505 }, { "epoch": 0.41573059624034137, "grad_norm": 2.099246274155791, "learning_rate": 8.306885307858919e-07, "loss": 0.6897, "step": 4506 }, { "epoch": 0.4158228578018683, "grad_norm": 2.061926230236892, "learning_rate": 8.305108558959552e-07, "loss": 0.7504, "step": 4507 }, { "epoch": 0.4159151193633952, "grad_norm": 1.7042740350309604, "learning_rate": 8.303331623823014e-07, "loss": 0.7082, "step": 4508 }, { "epoch": 0.4160073809249222, "grad_norm": 1.554695869992794, "learning_rate": 8.30155450261033e-07, "loss": 0.5857, "step": 4509 }, { "epoch": 0.4160996424864491, "grad_norm": 1.71116092258539, "learning_rate": 8.299777195482551e-07, "loss": 0.5458, "step": 4510 }, { "epoch": 0.4160996424864491, "eval_GEN Loss": 0.4649601876735687, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9221556886227545, "eval_PRM F1 AUC": 0.8116815086432687, "eval_PRM F1 Neg": 0.7111111111111111, "eval_PRM Loss": 0.3838547468185425, "eval_PRM NPV": 0.7272727272727273, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9049879908561707, "eval_runtime": 56.7257, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4510 }, { "epoch": 0.416191904047976, "grad_norm": 2.288727253134445, "learning_rate": 8.297999702600734e-07, "loss": 0.784, "step": 4511 }, { "epoch": 0.41628416560950293, "grad_norm": 2.7591239066814457, "learning_rate": 8.29622202412596e-07, "loss": 0.8433, "step": 4512 }, { "epoch": 0.41637642717102985, "grad_norm": 2.3216802408809643, "learning_rate": 8.294444160219327e-07, "loss": 0.8367, "step": 4513 }, { "epoch": 0.4164686887325568, "grad_norm": 2.4617013225691236, "learning_rate": 8.292666111041944e-07, "loss": 0.7336, "step": 4514 }, { "epoch": 0.41656095029408374, "grad_norm": 1.8423646415781811, "learning_rate": 8.290887876754945e-07, "loss": 0.7329, "step": 4515 }, { "epoch": 0.41656095029408374, "eval_GEN Loss": 0.4635125398635864, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9221556886227545, "eval_PRM F1 AUC": 0.8116815086432687, "eval_PRM F1 Neg": 0.7111111111111111, "eval_PRM Loss": 0.3853199779987335, "eval_PRM NPV": 0.7272727272727273, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9107571840286255, "eval_runtime": 56.6753, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4515 }, { "epoch": 0.41665321185561066, "grad_norm": 3.531586683189887, "learning_rate": 8.289109457519475e-07, "loss": 0.9745, "step": 4516 }, { "epoch": 0.4167454734171376, "grad_norm": 3.850137687516783, "learning_rate": 8.287330853496694e-07, "loss": 0.8018, "step": 4517 }, { "epoch": 0.4168377349786645, "grad_norm": 1.9724708060845544, "learning_rate": 8.285552064847785e-07, "loss": 0.7392, "step": 4518 }, { "epoch": 0.4169299965401914, "grad_norm": 1.3668215924039335, "learning_rate": 8.283773091733945e-07, "loss": 0.4953, "step": 4519 }, { "epoch": 0.4170222581017184, "grad_norm": 1.8798959743233898, "learning_rate": 8.281993934316383e-07, "loss": 0.7317, "step": 4520 }, { "epoch": 0.4170222581017184, "eval_GEN Loss": 0.46402081847190857, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8773584905660378, "eval_PRM F1": 0.9221556886227545, "eval_PRM F1 AUC": 0.8116815086432687, "eval_PRM F1 Neg": 0.7111111111111111, "eval_PRM Loss": 0.3894936144351959, "eval_PRM NPV": 0.7272727272727273, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8960937261581421, "eval_runtime": 55.7052, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4520 }, { "epoch": 0.4171145196632453, "grad_norm": 2.50306472540344, "learning_rate": 8.280214592756336e-07, "loss": 0.7285, "step": 4521 }, { "epoch": 0.4172067812247722, "grad_norm": 1.9630268915014357, "learning_rate": 8.278435067215045e-07, "loss": 0.8117, "step": 4522 }, { "epoch": 0.41729904278629915, "grad_norm": 1.842105589877852, "learning_rate": 8.276655357853775e-07, "loss": 0.6846, "step": 4523 }, { "epoch": 0.41739130434782606, "grad_norm": 1.8582154479703934, "learning_rate": 8.274875464833808e-07, "loss": 0.7357, "step": 4524 }, { "epoch": 0.41748356590935304, "grad_norm": 1.7397440358541465, "learning_rate": 8.273095388316438e-07, "loss": 0.6746, "step": 4525 }, { "epoch": 0.41748356590935304, "eval_GEN Loss": 0.4638248085975647, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9156626506024096, "eval_PRM F1 AUC": 0.8056574122577265, "eval_PRM F1 Neg": 0.6956521739130435, "eval_PRM Loss": 0.3951420187950134, "eval_PRM NPV": 0.6956521739130435, "eval_PRM Precision": 0.9156626506024096, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8816706538200378, "eval_runtime": 55.624, "eval_samples_per_second": 1.169, "eval_steps_per_second": 0.09, "step": 4525 }, { "epoch": 0.41757582747087996, "grad_norm": 1.5696856810379392, "learning_rate": 8.27131512846298e-07, "loss": 0.6206, "step": 4526 }, { "epoch": 0.4176680890324069, "grad_norm": 1.8517298443955166, "learning_rate": 8.269534685434763e-07, "loss": 0.656, "step": 4527 }, { "epoch": 0.4177603505939338, "grad_norm": 1.9308530495710357, "learning_rate": 8.267754059393135e-07, "loss": 0.6379, "step": 4528 }, { "epoch": 0.4178526121554607, "grad_norm": 1.7919526932830527, "learning_rate": 8.265973250499458e-07, "loss": 0.7593, "step": 4529 }, { "epoch": 0.4179448737169877, "grad_norm": 1.9102358035116955, "learning_rate": 8.26419225891511e-07, "loss": 0.7269, "step": 4530 }, { "epoch": 0.4179448737169877, "eval_GEN Loss": 0.46301814913749695, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.39663055539131165, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8749399185180664, "eval_runtime": 56.571, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 4530 }, { "epoch": 0.4180371352785146, "grad_norm": 1.8003211820129328, "learning_rate": 8.262411084801492e-07, "loss": 0.7852, "step": 4531 }, { "epoch": 0.4181293968400415, "grad_norm": 1.7057002777957437, "learning_rate": 8.26062972832001e-07, "loss": 0.5957, "step": 4532 }, { "epoch": 0.41822165840156844, "grad_norm": 1.5727669818308572, "learning_rate": 8.258848189632102e-07, "loss": 0.6785, "step": 4533 }, { "epoch": 0.41831391996309536, "grad_norm": 1.558815545709368, "learning_rate": 8.257066468899205e-07, "loss": 0.6092, "step": 4534 }, { "epoch": 0.4184061815246223, "grad_norm": 2.259646757326405, "learning_rate": 8.255284566282788e-07, "loss": 0.7888, "step": 4535 }, { "epoch": 0.4184061815246223, "eval_GEN Loss": 0.46308478713035583, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.40247470140457153, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8742788434028625, "eval_runtime": 56.7184, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4535 }, { "epoch": 0.41849844308614925, "grad_norm": 1.7430739619232098, "learning_rate": 8.253502481944325e-07, "loss": 0.4716, "step": 4536 }, { "epoch": 0.41859070464767617, "grad_norm": 2.490427239786558, "learning_rate": 8.251720216045316e-07, "loss": 0.8345, "step": 4537 }, { "epoch": 0.4186829662092031, "grad_norm": 2.3513191658238073, "learning_rate": 8.249937768747269e-07, "loss": 0.802, "step": 4538 }, { "epoch": 0.41877522777073, "grad_norm": 2.002155447542008, "learning_rate": 8.248155140211714e-07, "loss": 0.8071, "step": 4539 }, { "epoch": 0.4188674893322569, "grad_norm": 2.957086477407491, "learning_rate": 8.246372330600195e-07, "loss": 0.7517, "step": 4540 }, { "epoch": 0.4188674893322569, "eval_GEN Loss": 0.4623944163322449, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8875, "eval_PRM F1 AUC": 0.7972760607647982, "eval_PRM F1 Neg": 0.6538461538461539, "eval_PRM Loss": 0.4076211750507355, "eval_PRM NPV": 0.5862068965517241, "eval_PRM Precision": 0.922077922077922, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8747896552085876, "eval_runtime": 56.8488, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 4540 }, { "epoch": 0.4189597508937839, "grad_norm": 1.9427676891032644, "learning_rate": 8.244589340074273e-07, "loss": 0.699, "step": 4541 }, { "epoch": 0.4190520124553108, "grad_norm": 2.1087024976003743, "learning_rate": 8.242806168795525e-07, "loss": 0.7288, "step": 4542 }, { "epoch": 0.41914427401683774, "grad_norm": 1.6314485332881135, "learning_rate": 8.241022816925546e-07, "loss": 0.5722, "step": 4543 }, { "epoch": 0.41923653557836466, "grad_norm": 3.4083128955022453, "learning_rate": 8.239239284625945e-07, "loss": 0.8327, "step": 4544 }, { "epoch": 0.4193287971398916, "grad_norm": 1.8470085213709662, "learning_rate": 8.237455572058348e-07, "loss": 0.4849, "step": 4545 }, { "epoch": 0.4193287971398916, "eval_GEN Loss": 0.46134865283966064, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8805031446540881, "eval_PRM F1 AUC": 0.7912519643792562, "eval_PRM F1 Neg": 0.6415094339622641, "eval_PRM Loss": 0.414465069770813, "eval_PRM NPV": 0.5666666666666667, "eval_PRM Precision": 0.9210526315789473, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8778846263885498, "eval_runtime": 55.8391, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4545 }, { "epoch": 0.41942105870141855, "grad_norm": 1.5943242157495834, "learning_rate": 8.235671679384399e-07, "loss": 0.6338, "step": 4546 }, { "epoch": 0.41951332026294547, "grad_norm": 2.275050955940321, "learning_rate": 8.233887606765758e-07, "loss": 0.74, "step": 4547 }, { "epoch": 0.4196055818244724, "grad_norm": 1.3924438896353948, "learning_rate": 8.232103354364099e-07, "loss": 0.6355, "step": 4548 }, { "epoch": 0.4196978433859993, "grad_norm": 1.6622964042441053, "learning_rate": 8.230318922341114e-07, "loss": 0.522, "step": 4549 }, { "epoch": 0.4197901049475262, "grad_norm": 1.9126773755745825, "learning_rate": 8.228534310858511e-07, "loss": 0.5954, "step": 4550 }, { "epoch": 0.4197901049475262, "eval_GEN Loss": 0.4626624286174774, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4123472571372986, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8880107998847961, "eval_runtime": 55.84, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4550 }, { "epoch": 0.41988236650905314, "grad_norm": 2.535722185197096, "learning_rate": 8.226749520078014e-07, "loss": 0.8972, "step": 4551 }, { "epoch": 0.4199746280705801, "grad_norm": 1.6502006063135173, "learning_rate": 8.224964550161365e-07, "loss": 0.6993, "step": 4552 }, { "epoch": 0.42006688963210703, "grad_norm": 1.724068340010751, "learning_rate": 8.223179401270322e-07, "loss": 0.5109, "step": 4553 }, { "epoch": 0.42015915119363395, "grad_norm": 1.6568360730515146, "learning_rate": 8.221394073566652e-07, "loss": 0.7574, "step": 4554 }, { "epoch": 0.42025141275516087, "grad_norm": 2.206391416406214, "learning_rate": 8.219608567212149e-07, "loss": 0.7891, "step": 4555 }, { "epoch": 0.42025141275516087, "eval_GEN Loss": 0.46152740716934204, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.41259726881980896, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8937199711799622, "eval_runtime": 56.9016, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 4555 }, { "epoch": 0.4203436743166878, "grad_norm": 2.025070497635663, "learning_rate": 8.217822882368619e-07, "loss": 0.6692, "step": 4556 }, { "epoch": 0.42043593587821476, "grad_norm": 1.8652951416253487, "learning_rate": 8.21603701919788e-07, "loss": 0.7729, "step": 4557 }, { "epoch": 0.4205281974397417, "grad_norm": 2.1520640386253755, "learning_rate": 8.214250977861773e-07, "loss": 0.7704, "step": 4558 }, { "epoch": 0.4206204590012686, "grad_norm": 2.0040518150240647, "learning_rate": 8.21246475852215e-07, "loss": 0.7372, "step": 4559 }, { "epoch": 0.4207127205627955, "grad_norm": 2.583448901768514, "learning_rate": 8.210678361340881e-07, "loss": 0.9066, "step": 4560 }, { "epoch": 0.4207127205627955, "eval_GEN Loss": 0.4638822674751282, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.41820263862609863, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9066706895828247, "eval_runtime": 56.7208, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4560 }, { "epoch": 0.42080498212432244, "grad_norm": 1.7922688567722063, "learning_rate": 8.208891786479855e-07, "loss": 0.7752, "step": 4561 }, { "epoch": 0.4208972436858494, "grad_norm": 2.2680942014394163, "learning_rate": 8.20710503410097e-07, "loss": 0.707, "step": 4562 }, { "epoch": 0.4209895052473763, "grad_norm": 2.1866600206533575, "learning_rate": 8.205318104366146e-07, "loss": 0.769, "step": 4563 }, { "epoch": 0.42108176680890325, "grad_norm": 2.2766924909878843, "learning_rate": 8.20353099743732e-07, "loss": 0.5799, "step": 4564 }, { "epoch": 0.42117402837043016, "grad_norm": 2.001949834964628, "learning_rate": 8.201743713476438e-07, "loss": 0.8231, "step": 4565 }, { "epoch": 0.42117402837043016, "eval_GEN Loss": 0.4633524715900421, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4163985252380371, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9140625, "eval_runtime": 55.7404, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4565 }, { "epoch": 0.4212662899319571, "grad_norm": 2.5680584736328718, "learning_rate": 8.199956252645469e-07, "loss": 0.7752, "step": 4566 }, { "epoch": 0.421358551493484, "grad_norm": 1.8375902563419673, "learning_rate": 8.198168615106396e-07, "loss": 0.7641, "step": 4567 }, { "epoch": 0.421450813055011, "grad_norm": 1.977909749246119, "learning_rate": 8.196380801021216e-07, "loss": 0.741, "step": 4568 }, { "epoch": 0.4215430746165379, "grad_norm": 2.2249880903972685, "learning_rate": 8.194592810551943e-07, "loss": 0.6423, "step": 4569 }, { "epoch": 0.4216353361780648, "grad_norm": 1.5575055473157065, "learning_rate": 8.192804643860611e-07, "loss": 0.749, "step": 4570 }, { "epoch": 0.4216353361780648, "eval_GEN Loss": 0.4634056091308594, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.42050236463546753, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9188100695610046, "eval_runtime": 56.5856, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 4570 }, { "epoch": 0.42172759773959173, "grad_norm": 2.1950560122275, "learning_rate": 8.191016301109262e-07, "loss": 0.7019, "step": 4571 }, { "epoch": 0.42181985930111865, "grad_norm": 1.8606839789101812, "learning_rate": 8.189227782459962e-07, "loss": 0.6684, "step": 4572 }, { "epoch": 0.4219121208626456, "grad_norm": 2.4108315162612755, "learning_rate": 8.187439088074787e-07, "loss": 0.7533, "step": 4573 }, { "epoch": 0.42200438242417254, "grad_norm": 2.3361743273235183, "learning_rate": 8.185650218115833e-07, "loss": 0.7505, "step": 4574 }, { "epoch": 0.42209664398569946, "grad_norm": 2.283136432730305, "learning_rate": 8.18386117274521e-07, "loss": 0.6839, "step": 4575 }, { "epoch": 0.42209664398569946, "eval_GEN Loss": 0.46167024970054626, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4159373939037323, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.924879789352417, "eval_runtime": 56.5442, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 4575 }, { "epoch": 0.4221889055472264, "grad_norm": 1.3361878180603297, "learning_rate": 8.182071952125043e-07, "loss": 0.5469, "step": 4576 }, { "epoch": 0.4222811671087533, "grad_norm": 1.6270961728446756, "learning_rate": 8.180282556417474e-07, "loss": 0.6142, "step": 4577 }, { "epoch": 0.42237342867028027, "grad_norm": 2.195228717467554, "learning_rate": 8.178492985784663e-07, "loss": 0.9104, "step": 4578 }, { "epoch": 0.4224656902318072, "grad_norm": 2.1750689827816, "learning_rate": 8.176703240388779e-07, "loss": 0.6975, "step": 4579 }, { "epoch": 0.4225579517933341, "grad_norm": 1.6230987050188155, "learning_rate": 8.174913320392016e-07, "loss": 0.7803, "step": 4580 }, { "epoch": 0.4225579517933341, "eval_GEN Loss": 0.46204501390457153, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4172798693180084, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9306490421295166, "eval_runtime": 56.6336, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4580 }, { "epoch": 0.422650213354861, "grad_norm": 1.95439613322131, "learning_rate": 8.173123225956579e-07, "loss": 0.5871, "step": 4581 }, { "epoch": 0.42274247491638794, "grad_norm": 1.547615158126757, "learning_rate": 8.171332957244687e-07, "loss": 0.581, "step": 4582 }, { "epoch": 0.42283473647791486, "grad_norm": 1.9074675185627277, "learning_rate": 8.169542514418582e-07, "loss": 0.863, "step": 4583 }, { "epoch": 0.42292699803944184, "grad_norm": 2.4817583010469573, "learning_rate": 8.167751897640508e-07, "loss": 0.7977, "step": 4584 }, { "epoch": 0.42301925960096876, "grad_norm": 1.462665257096725, "learning_rate": 8.165961107072741e-07, "loss": 0.6624, "step": 4585 }, { "epoch": 0.42301925960096876, "eval_GEN Loss": 0.4614076316356659, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4181109070777893, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9338341355323792, "eval_runtime": 57.0176, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 4585 }, { "epoch": 0.4231115211624957, "grad_norm": 2.0459432477886086, "learning_rate": 8.164170142877562e-07, "loss": 0.7723, "step": 4586 }, { "epoch": 0.4232037827240226, "grad_norm": 3.3419407264656056, "learning_rate": 8.162379005217272e-07, "loss": 0.926, "step": 4587 }, { "epoch": 0.4232960442855495, "grad_norm": 1.55095469306056, "learning_rate": 8.160587694254187e-07, "loss": 0.7372, "step": 4588 }, { "epoch": 0.4233883058470765, "grad_norm": 1.4707139293394829, "learning_rate": 8.158796210150636e-07, "loss": 0.4803, "step": 4589 }, { "epoch": 0.4234805674086034, "grad_norm": 2.519623897660297, "learning_rate": 8.15700455306897e-07, "loss": 0.7473, "step": 4590 }, { "epoch": 0.4234805674086034, "eval_GEN Loss": 0.4625672698020935, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.42129579186439514, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9314603209495544, "eval_runtime": 55.9069, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4590 }, { "epoch": 0.4235728289701303, "grad_norm": 2.359782990082572, "learning_rate": 8.155212723171549e-07, "loss": 0.7112, "step": 4591 }, { "epoch": 0.42366509053165724, "grad_norm": 1.6720502928040792, "learning_rate": 8.153420720620752e-07, "loss": 0.5934, "step": 4592 }, { "epoch": 0.42375735209318416, "grad_norm": 3.4168160328509702, "learning_rate": 8.151628545578973e-07, "loss": 0.7168, "step": 4593 }, { "epoch": 0.42384961365471113, "grad_norm": 1.701306490892626, "learning_rate": 8.149836198208623e-07, "loss": 0.6829, "step": 4594 }, { "epoch": 0.42394187521623805, "grad_norm": 2.5788102775397332, "learning_rate": 8.148043678672124e-07, "loss": 0.6916, "step": 4595 }, { "epoch": 0.42394187521623805, "eval_GEN Loss": 0.4614197313785553, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.41914960741996765, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9315505027770996, "eval_runtime": 55.938, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4595 }, { "epoch": 0.42403413677776497, "grad_norm": 1.3345508451903472, "learning_rate": 8.146250987131921e-07, "loss": 0.5882, "step": 4596 }, { "epoch": 0.4241263983392919, "grad_norm": 1.7499585612998625, "learning_rate": 8.14445812375047e-07, "loss": 0.8729, "step": 4597 }, { "epoch": 0.4242186599008188, "grad_norm": 1.4828196306298707, "learning_rate": 8.142665088690238e-07, "loss": 0.6487, "step": 4598 }, { "epoch": 0.4243109214623457, "grad_norm": 1.315352403679165, "learning_rate": 8.140871882113721e-07, "loss": 0.6438, "step": 4599 }, { "epoch": 0.4244031830238727, "grad_norm": 2.9421767462635855, "learning_rate": 8.139078504183416e-07, "loss": 0.7858, "step": 4600 }, { "epoch": 0.4244031830238727, "eval_GEN Loss": 0.4607959985733032, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.41784679889678955, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.936448335647583, "eval_runtime": 55.9052, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4600 }, { "epoch": 0.4244954445853996, "grad_norm": 2.305371439555837, "learning_rate": 8.137284955061844e-07, "loss": 0.6501, "step": 4601 }, { "epoch": 0.42458770614692654, "grad_norm": 2.215089595363111, "learning_rate": 8.135491234911539e-07, "loss": 0.6785, "step": 4602 }, { "epoch": 0.42467996770845345, "grad_norm": 1.4951553714909378, "learning_rate": 8.133697343895047e-07, "loss": 0.5542, "step": 4603 }, { "epoch": 0.4247722292699804, "grad_norm": 2.850800151320083, "learning_rate": 8.131903282174941e-07, "loss": 0.8853, "step": 4604 }, { "epoch": 0.42486449083150735, "grad_norm": 2.371802316236942, "learning_rate": 8.130109049913795e-07, "loss": 0.695, "step": 4605 }, { "epoch": 0.42486449083150735, "eval_GEN Loss": 0.461161732673645, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.41691258549690247, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.938551664352417, "eval_runtime": 56.6949, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4605 }, { "epoch": 0.42495675239303426, "grad_norm": 1.490099479498711, "learning_rate": 8.128314647274209e-07, "loss": 0.6135, "step": 4606 }, { "epoch": 0.4250490139545612, "grad_norm": 2.451301183198524, "learning_rate": 8.126520074418791e-07, "loss": 0.7541, "step": 4607 }, { "epoch": 0.4251412755160881, "grad_norm": 1.4735172741829363, "learning_rate": 8.124725331510172e-07, "loss": 0.4611, "step": 4608 }, { "epoch": 0.425233537077615, "grad_norm": 3.3686515207939616, "learning_rate": 8.122930418710992e-07, "loss": 0.8692, "step": 4609 }, { "epoch": 0.425325798639142, "grad_norm": 4.037183790991638, "learning_rate": 8.121135336183911e-07, "loss": 0.7948, "step": 4610 }, { "epoch": 0.425325798639142, "eval_GEN Loss": 0.46080586314201355, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.4177016615867615, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9380708932876587, "eval_runtime": 56.6844, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4610 }, { "epoch": 0.4254180602006689, "grad_norm": 2.502506682640021, "learning_rate": 8.119340084091599e-07, "loss": 0.7651, "step": 4611 }, { "epoch": 0.42551032176219583, "grad_norm": 1.674555973288103, "learning_rate": 8.117544662596747e-07, "loss": 0.6677, "step": 4612 }, { "epoch": 0.42560258332372275, "grad_norm": 2.302023056733967, "learning_rate": 8.115749071862057e-07, "loss": 0.746, "step": 4613 }, { "epoch": 0.42569484488524967, "grad_norm": 1.8770675786824442, "learning_rate": 8.113953312050249e-07, "loss": 0.6307, "step": 4614 }, { "epoch": 0.4257871064467766, "grad_norm": 2.7092998774326196, "learning_rate": 8.11215738332406e-07, "loss": 0.7434, "step": 4615 }, { "epoch": 0.4257871064467766, "eval_GEN Loss": 0.46067067980766296, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.4208820164203644, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.93359375, "eval_runtime": 56.8732, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 4615 }, { "epoch": 0.42587936800830356, "grad_norm": 2.138671816731164, "learning_rate": 8.110361285846235e-07, "loss": 0.7421, "step": 4616 }, { "epoch": 0.4259716295698305, "grad_norm": 1.668999522082496, "learning_rate": 8.108565019779546e-07, "loss": 0.5314, "step": 4617 }, { "epoch": 0.4260638911313574, "grad_norm": 1.531951572352331, "learning_rate": 8.106768585286766e-07, "loss": 0.6277, "step": 4618 }, { "epoch": 0.4261561526928843, "grad_norm": 1.706798350282736, "learning_rate": 8.104971982530694e-07, "loss": 0.7045, "step": 4619 }, { "epoch": 0.42624841425441123, "grad_norm": 2.7010149878128047, "learning_rate": 8.103175211674144e-07, "loss": 0.6296, "step": 4620 }, { "epoch": 0.42624841425441123, "eval_GEN Loss": 0.46250781416893005, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4325137138366699, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9419471025466919, "eval_runtime": 56.5539, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 4620 }, { "epoch": 0.4263406758159382, "grad_norm": 2.006218350953062, "learning_rate": 8.101378272879937e-07, "loss": 0.6102, "step": 4621 }, { "epoch": 0.4264329373774651, "grad_norm": 1.6909401200224907, "learning_rate": 8.099581166310918e-07, "loss": 0.6799, "step": 4622 }, { "epoch": 0.42652519893899205, "grad_norm": 2.119976525354725, "learning_rate": 8.097783892129944e-07, "loss": 0.6951, "step": 4623 }, { "epoch": 0.42661746050051896, "grad_norm": 2.6088053954943193, "learning_rate": 8.095986450499885e-07, "loss": 0.9162, "step": 4624 }, { "epoch": 0.4267097220620459, "grad_norm": 2.701107204154422, "learning_rate": 8.094188841583625e-07, "loss": 0.6808, "step": 4625 }, { "epoch": 0.4267097220620459, "eval_GEN Loss": 0.4625371992588043, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.43111729621887207, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9390023946762085, "eval_runtime": 55.7094, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4625 }, { "epoch": 0.42680198362357286, "grad_norm": 2.701849803176283, "learning_rate": 8.092391065544072e-07, "loss": 0.5508, "step": 4626 }, { "epoch": 0.4268942451850998, "grad_norm": 2.3029010462039126, "learning_rate": 8.090593122544138e-07, "loss": 0.7449, "step": 4627 }, { "epoch": 0.4269865067466267, "grad_norm": 1.9004220704761927, "learning_rate": 8.08879501274676e-07, "loss": 0.6365, "step": 4628 }, { "epoch": 0.4270787683081536, "grad_norm": 2.28219599820966, "learning_rate": 8.086996736314883e-07, "loss": 0.7797, "step": 4629 }, { "epoch": 0.42717102986968053, "grad_norm": 1.8548395457488216, "learning_rate": 8.085198293411471e-07, "loss": 0.7731, "step": 4630 }, { "epoch": 0.42717102986968053, "eval_GEN Loss": 0.4615626335144043, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.42481040954589844, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9360576868057251, "eval_runtime": 55.6788, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4630 }, { "epoch": 0.42726329143120745, "grad_norm": 2.3819251450556855, "learning_rate": 8.083399684199501e-07, "loss": 0.8522, "step": 4631 }, { "epoch": 0.4273555529927344, "grad_norm": 2.0137939079075236, "learning_rate": 8.081600908841966e-07, "loss": 0.7005, "step": 4632 }, { "epoch": 0.42744781455426134, "grad_norm": 2.2526220494828597, "learning_rate": 8.079801967501874e-07, "loss": 0.7564, "step": 4633 }, { "epoch": 0.42754007611578826, "grad_norm": 1.9654416441521356, "learning_rate": 8.078002860342246e-07, "loss": 0.5633, "step": 4634 }, { "epoch": 0.4276323376773152, "grad_norm": 2.7547246756504085, "learning_rate": 8.076203587526122e-07, "loss": 0.7943, "step": 4635 }, { "epoch": 0.4276323376773152, "eval_GEN Loss": 0.4605942964553833, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.4180906116962433, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9329326748847961, "eval_runtime": 56.8072, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4635 }, { "epoch": 0.4277245992388421, "grad_norm": 2.5636154455502527, "learning_rate": 8.074404149216555e-07, "loss": 0.8179, "step": 4636 }, { "epoch": 0.42781686080036907, "grad_norm": 2.08056921809316, "learning_rate": 8.072604545576612e-07, "loss": 0.7016, "step": 4637 }, { "epoch": 0.427909122361896, "grad_norm": 3.126376972917456, "learning_rate": 8.070804776769377e-07, "loss": 0.78, "step": 4638 }, { "epoch": 0.4280013839234229, "grad_norm": 2.068847796738703, "learning_rate": 8.069004842957946e-07, "loss": 0.6481, "step": 4639 }, { "epoch": 0.4280936454849498, "grad_norm": 1.8238619739209156, "learning_rate": 8.067204744305434e-07, "loss": 0.6961, "step": 4640 }, { "epoch": 0.4280936454849498, "eval_GEN Loss": 0.460936963558197, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.4079975485801697, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9327524304389954, "eval_runtime": 55.6881, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4640 }, { "epoch": 0.42818590704647674, "grad_norm": 2.1242673765850633, "learning_rate": 8.065404480974967e-07, "loss": 0.7119, "step": 4641 }, { "epoch": 0.4282781686080037, "grad_norm": 1.5893284996553223, "learning_rate": 8.063604053129689e-07, "loss": 0.6776, "step": 4642 }, { "epoch": 0.42837043016953064, "grad_norm": 1.4086468487799528, "learning_rate": 8.061803460932756e-07, "loss": 0.7022, "step": 4643 }, { "epoch": 0.42846269173105755, "grad_norm": 2.1036532308104308, "learning_rate": 8.060002704547341e-07, "loss": 0.7594, "step": 4644 }, { "epoch": 0.4285549532925845, "grad_norm": 1.5355550945957865, "learning_rate": 8.058201784136634e-07, "loss": 0.6933, "step": 4645 }, { "epoch": 0.4285549532925845, "eval_GEN Loss": 0.460313081741333, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3933650553226471, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9323918223381042, "eval_runtime": 55.8774, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4645 }, { "epoch": 0.4286472148541114, "grad_norm": 2.6499314080986034, "learning_rate": 8.056400699863836e-07, "loss": 0.7408, "step": 4646 }, { "epoch": 0.4287394764156383, "grad_norm": 1.76149372202255, "learning_rate": 8.054599451892162e-07, "loss": 0.7295, "step": 4647 }, { "epoch": 0.4288317379771653, "grad_norm": 2.604044507774662, "learning_rate": 8.052798040384844e-07, "loss": 0.8109, "step": 4648 }, { "epoch": 0.4289239995386922, "grad_norm": 2.8657535126567306, "learning_rate": 8.05099646550513e-07, "loss": 0.6307, "step": 4649 }, { "epoch": 0.4290162611002191, "grad_norm": 2.2236652599845037, "learning_rate": 8.049194727416282e-07, "loss": 0.6788, "step": 4650 }, { "epoch": 0.4290162611002191, "eval_GEN Loss": 0.46139371395111084, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.39759257435798645, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9298678040504456, "eval_runtime": 55.5166, "eval_samples_per_second": 1.171, "eval_steps_per_second": 0.09, "step": 4650 }, { "epoch": 0.42910852266174604, "grad_norm": 1.692638007074335, "learning_rate": 8.047392826281575e-07, "loss": 0.7456, "step": 4651 }, { "epoch": 0.42920078422327296, "grad_norm": 1.6430338942600697, "learning_rate": 8.045590762264302e-07, "loss": 0.5751, "step": 4652 }, { "epoch": 0.42929304578479993, "grad_norm": 1.5522883978993964, "learning_rate": 8.043788535527768e-07, "loss": 0.6735, "step": 4653 }, { "epoch": 0.42938530734632685, "grad_norm": 2.316120117388998, "learning_rate": 8.041986146235293e-07, "loss": 0.8173, "step": 4654 }, { "epoch": 0.42947756890785377, "grad_norm": 1.7622682267895373, "learning_rate": 8.040183594550213e-07, "loss": 0.5533, "step": 4655 }, { "epoch": 0.42947756890785377, "eval_GEN Loss": 0.46376433968544006, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.395481139421463, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9258413314819336, "eval_runtime": 57.0198, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 4655 }, { "epoch": 0.4295698304693807, "grad_norm": 2.914084971140689, "learning_rate": 8.03838088063588e-07, "loss": 0.7665, "step": 4656 }, { "epoch": 0.4296620920309076, "grad_norm": 2.912328994077887, "learning_rate": 8.036578004655653e-07, "loss": 0.7404, "step": 4657 }, { "epoch": 0.4297543535924346, "grad_norm": 1.7053312636383033, "learning_rate": 8.034774966772917e-07, "loss": 0.4624, "step": 4658 }, { "epoch": 0.4298466151539615, "grad_norm": 2.221855043794835, "learning_rate": 8.032971767151064e-07, "loss": 0.6911, "step": 4659 }, { "epoch": 0.4299388767154884, "grad_norm": 1.965429233897473, "learning_rate": 8.031168405953502e-07, "loss": 0.6972, "step": 4660 }, { "epoch": 0.4299388767154884, "eval_GEN Loss": 0.46308955550193787, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.39251551032066345, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.925000011920929, "eval_runtime": 56.7625, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4660 }, { "epoch": 0.43003113827701533, "grad_norm": 1.8488615070803485, "learning_rate": 8.029364883343657e-07, "loss": 0.7639, "step": 4661 }, { "epoch": 0.43012339983854225, "grad_norm": 2.1994317831214754, "learning_rate": 8.027561199484965e-07, "loss": 0.7279, "step": 4662 }, { "epoch": 0.43021566140006917, "grad_norm": 1.6644521817599582, "learning_rate": 8.025757354540879e-07, "loss": 0.7061, "step": 4663 }, { "epoch": 0.43030792296159615, "grad_norm": 1.6631871256042647, "learning_rate": 8.023953348674865e-07, "loss": 0.7436, "step": 4664 }, { "epoch": 0.43040018452312306, "grad_norm": 2.0180438596498385, "learning_rate": 8.02214918205041e-07, "loss": 0.7136, "step": 4665 }, { "epoch": 0.43040018452312306, "eval_GEN Loss": 0.46338164806365967, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3920787274837494, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9198918342590332, "eval_runtime": 56.7976, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4665 }, { "epoch": 0.43049244608465, "grad_norm": 1.491738333205516, "learning_rate": 8.020344854831002e-07, "loss": 0.606, "step": 4666 }, { "epoch": 0.4305847076461769, "grad_norm": 3.4494001851431144, "learning_rate": 8.01854036718016e-07, "loss": 1.0821, "step": 4667 }, { "epoch": 0.4306769692077038, "grad_norm": 3.135517556290885, "learning_rate": 8.016735719261405e-07, "loss": 0.6805, "step": 4668 }, { "epoch": 0.4307692307692308, "grad_norm": 1.517568030471835, "learning_rate": 8.014930911238281e-07, "loss": 0.5671, "step": 4669 }, { "epoch": 0.4308614923307577, "grad_norm": 1.295776976555254, "learning_rate": 8.013125943274336e-07, "loss": 0.5483, "step": 4670 }, { "epoch": 0.4308614923307577, "eval_GEN Loss": 0.46382442116737366, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4014551639556885, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9165865182876587, "eval_runtime": 55.8114, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4670 }, { "epoch": 0.43095375389228463, "grad_norm": 3.828373800737746, "learning_rate": 8.011320815533144e-07, "loss": 0.9417, "step": 4671 }, { "epoch": 0.43104601545381155, "grad_norm": 2.1012152877826304, "learning_rate": 8.009515528178288e-07, "loss": 0.8605, "step": 4672 }, { "epoch": 0.43113827701533847, "grad_norm": 1.207061731130644, "learning_rate": 8.007710081373365e-07, "loss": 0.4151, "step": 4673 }, { "epoch": 0.43123053857686544, "grad_norm": 1.759371599435732, "learning_rate": 8.005904475281988e-07, "loss": 0.5326, "step": 4674 }, { "epoch": 0.43132280013839236, "grad_norm": 2.2866238841261746, "learning_rate": 8.004098710067783e-07, "loss": 0.6729, "step": 4675 }, { "epoch": 0.43132280013839236, "eval_GEN Loss": 0.46552661061286926, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.4321240782737732, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9260817170143127, "eval_runtime": 56.7075, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4675 }, { "epoch": 0.4314150616999193, "grad_norm": 1.6642147179732374, "learning_rate": 8.002292785894392e-07, "loss": 0.7467, "step": 4676 }, { "epoch": 0.4315073232614462, "grad_norm": 2.2127939247120905, "learning_rate": 8.00048670292547e-07, "loss": 0.6092, "step": 4677 }, { "epoch": 0.4315995848229731, "grad_norm": 2.1172594949900163, "learning_rate": 7.998680461324688e-07, "loss": 0.7898, "step": 4678 }, { "epoch": 0.43169184638450003, "grad_norm": 2.39404393657184, "learning_rate": 7.996874061255732e-07, "loss": 0.7669, "step": 4679 }, { "epoch": 0.431784107946027, "grad_norm": 2.7934988821095743, "learning_rate": 7.995067502882296e-07, "loss": 0.6697, "step": 4680 }, { "epoch": 0.431784107946027, "eval_GEN Loss": 0.46511808037757874, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4305277168750763, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9160456657409668, "eval_runtime": 56.7632, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4680 }, { "epoch": 0.4318763695075539, "grad_norm": 2.154396039545046, "learning_rate": 7.993260786368098e-07, "loss": 0.6865, "step": 4681 }, { "epoch": 0.43196863106908084, "grad_norm": 2.0249164280493703, "learning_rate": 7.991453911876864e-07, "loss": 0.7408, "step": 4682 }, { "epoch": 0.43206089263060776, "grad_norm": 2.9357024921810475, "learning_rate": 7.989646879572335e-07, "loss": 0.8889, "step": 4683 }, { "epoch": 0.4321531541921347, "grad_norm": 3.294841631264914, "learning_rate": 7.987839689618266e-07, "loss": 0.6859, "step": 4684 }, { "epoch": 0.43224541575366165, "grad_norm": 1.8254910713370607, "learning_rate": 7.986032342178431e-07, "loss": 0.5915, "step": 4685 }, { "epoch": 0.43224541575366165, "eval_GEN Loss": 0.46197250485420227, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.40716394782066345, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.902614176273346, "eval_runtime": 56.7994, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4685 }, { "epoch": 0.4323376773151886, "grad_norm": 1.8117185631419912, "learning_rate": 7.984224837416611e-07, "loss": 0.6526, "step": 4686 }, { "epoch": 0.4324299388767155, "grad_norm": 1.4139995585080387, "learning_rate": 7.982417175496607e-07, "loss": 0.5909, "step": 4687 }, { "epoch": 0.4325222004382424, "grad_norm": 2.021753143309613, "learning_rate": 7.980609356582233e-07, "loss": 0.7153, "step": 4688 }, { "epoch": 0.43261446199976933, "grad_norm": 2.0970960574504085, "learning_rate": 7.978801380837313e-07, "loss": 0.7012, "step": 4689 }, { "epoch": 0.4327067235612963, "grad_norm": 2.2218082423205403, "learning_rate": 7.976993248425692e-07, "loss": 1.0774, "step": 4690 }, { "epoch": 0.4327067235612963, "eval_GEN Loss": 0.46025604009628296, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3830902576446533, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8991586565971375, "eval_runtime": 56.5635, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 4690 }, { "epoch": 0.4327989851228232, "grad_norm": 2.6603878210660437, "learning_rate": 7.975184959511223e-07, "loss": 0.6511, "step": 4691 }, { "epoch": 0.43289124668435014, "grad_norm": 1.6778368978873004, "learning_rate": 7.973376514257779e-07, "loss": 0.7687, "step": 4692 }, { "epoch": 0.43298350824587706, "grad_norm": 2.2764375836873696, "learning_rate": 7.971567912829242e-07, "loss": 0.7402, "step": 4693 }, { "epoch": 0.433075769807404, "grad_norm": 1.4311959059918864, "learning_rate": 7.969759155389511e-07, "loss": 0.6343, "step": 4694 }, { "epoch": 0.4331680313689309, "grad_norm": 2.44212455914936, "learning_rate": 7.967950242102501e-07, "loss": 0.9167, "step": 4695 }, { "epoch": 0.4331680313689309, "eval_GEN Loss": 0.459176242351532, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3751288056373596, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9004206657409668, "eval_runtime": 55.9485, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4695 }, { "epoch": 0.43326029293045787, "grad_norm": 1.4632975284469596, "learning_rate": 7.966141173132133e-07, "loss": 0.5776, "step": 4696 }, { "epoch": 0.4333525544919848, "grad_norm": 3.9282786558181506, "learning_rate": 7.964331948642351e-07, "loss": 0.9861, "step": 4697 }, { "epoch": 0.4334448160535117, "grad_norm": 2.837280189139784, "learning_rate": 7.96252256879711e-07, "loss": 0.6906, "step": 4698 }, { "epoch": 0.4335370776150386, "grad_norm": 1.4725248228650922, "learning_rate": 7.960713033760378e-07, "loss": 0.5806, "step": 4699 }, { "epoch": 0.43362933917656554, "grad_norm": 1.8470625783448538, "learning_rate": 7.958903343696137e-07, "loss": 0.4683, "step": 4700 }, { "epoch": 0.43362933917656554, "eval_GEN Loss": 0.4584006667137146, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3794468343257904, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8978966474533081, "eval_runtime": 56.811, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4700 }, { "epoch": 0.4337216007380925, "grad_norm": 1.3481895529730203, "learning_rate": 7.957093498768387e-07, "loss": 0.6283, "step": 4701 }, { "epoch": 0.43381386229961943, "grad_norm": 2.6248365689478286, "learning_rate": 7.955283499141137e-07, "loss": 0.7737, "step": 4702 }, { "epoch": 0.43390612386114635, "grad_norm": 1.6703893914918286, "learning_rate": 7.95347334497841e-07, "loss": 0.6473, "step": 4703 }, { "epoch": 0.43399838542267327, "grad_norm": 3.452037803134213, "learning_rate": 7.951663036444249e-07, "loss": 0.7574, "step": 4704 }, { "epoch": 0.4340906469842002, "grad_norm": 2.41047768541628, "learning_rate": 7.949852573702706e-07, "loss": 0.8327, "step": 4705 }, { "epoch": 0.4340906469842002, "eval_GEN Loss": 0.4581994414329529, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.381397545337677, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8990384340286255, "eval_runtime": 56.7226, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4705 }, { "epoch": 0.4341829085457271, "grad_norm": 1.3016419065676879, "learning_rate": 7.948041956917846e-07, "loss": 0.5911, "step": 4706 }, { "epoch": 0.4342751701072541, "grad_norm": 1.727226107957265, "learning_rate": 7.94623118625375e-07, "loss": 0.7855, "step": 4707 }, { "epoch": 0.434367431668781, "grad_norm": 2.252634808733169, "learning_rate": 7.944420261874515e-07, "loss": 0.6946, "step": 4708 }, { "epoch": 0.4344596932303079, "grad_norm": 2.0864100083778916, "learning_rate": 7.94260918394425e-07, "loss": 0.7626, "step": 4709 }, { "epoch": 0.43455195479183484, "grad_norm": 2.0828395562829902, "learning_rate": 7.940797952627075e-07, "loss": 0.6155, "step": 4710 }, { "epoch": 0.43455195479183484, "eval_GEN Loss": 0.45770710706710815, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3713115453720093, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8979567289352417, "eval_runtime": 56.6738, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4710 }, { "epoch": 0.43464421635336176, "grad_norm": 1.820691974808363, "learning_rate": 7.938986568087129e-07, "loss": 0.7224, "step": 4711 }, { "epoch": 0.43473647791488873, "grad_norm": 2.3119226444689964, "learning_rate": 7.937175030488561e-07, "loss": 0.7963, "step": 4712 }, { "epoch": 0.43482873947641565, "grad_norm": 1.91019505159028, "learning_rate": 7.935363339995537e-07, "loss": 0.7806, "step": 4713 }, { "epoch": 0.43492100103794257, "grad_norm": 1.7068662161076187, "learning_rate": 7.933551496772232e-07, "loss": 0.6858, "step": 4714 }, { "epoch": 0.4350132625994695, "grad_norm": 2.2166897923095057, "learning_rate": 7.931739500982843e-07, "loss": 0.7467, "step": 4715 }, { "epoch": 0.4350132625994695, "eval_GEN Loss": 0.4574187099933624, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9156626506024096, "eval_PRM F1 AUC": 0.8056574122577265, "eval_PRM F1 Neg": 0.6956521739130435, "eval_PRM Loss": 0.3624000549316406, "eval_PRM NPV": 0.6956521739130435, "eval_PRM Precision": 0.9156626506024096, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.909254789352417, "eval_runtime": 56.7973, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4715 }, { "epoch": 0.4351055241609964, "grad_norm": 1.396609586826955, "learning_rate": 7.929927352791573e-07, "loss": 0.6445, "step": 4716 }, { "epoch": 0.4351977857225234, "grad_norm": 2.0369343951905168, "learning_rate": 7.928115052362642e-07, "loss": 0.8543, "step": 4717 }, { "epoch": 0.4352900472840503, "grad_norm": 1.9011948270444372, "learning_rate": 7.926302599860283e-07, "loss": 0.753, "step": 4718 }, { "epoch": 0.4353823088455772, "grad_norm": 1.4725508710005852, "learning_rate": 7.924489995448745e-07, "loss": 0.6633, "step": 4719 }, { "epoch": 0.43547457040710413, "grad_norm": 2.250663894278101, "learning_rate": 7.922677239292286e-07, "loss": 0.8765, "step": 4720 }, { "epoch": 0.43547457040710413, "eval_GEN Loss": 0.4571901857852936, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.36222201585769653, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.9145432710647583, "eval_runtime": 56.6621, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4720 }, { "epoch": 0.43556683196863105, "grad_norm": 3.625856943852072, "learning_rate": 7.920864331555183e-07, "loss": 0.9585, "step": 4721 }, { "epoch": 0.43565909353015797, "grad_norm": 2.0336325468387746, "learning_rate": 7.919051272401727e-07, "loss": 0.7091, "step": 4722 }, { "epoch": 0.43575135509168494, "grad_norm": 1.6368541552059357, "learning_rate": 7.917238061996215e-07, "loss": 0.5716, "step": 4723 }, { "epoch": 0.43584361665321186, "grad_norm": 1.2160055009378001, "learning_rate": 7.915424700502965e-07, "loss": 0.5969, "step": 4724 }, { "epoch": 0.4359358782147388, "grad_norm": 2.3469984690248307, "learning_rate": 7.913611188086307e-07, "loss": 0.7006, "step": 4725 }, { "epoch": 0.4359358782147388, "eval_GEN Loss": 0.45721742510795593, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.370048463344574, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9063701629638672, "eval_runtime": 56.6326, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4725 }, { "epoch": 0.4360281397762657, "grad_norm": 3.291890145643495, "learning_rate": 7.911797524910586e-07, "loss": 0.8145, "step": 4726 }, { "epoch": 0.4361204013377926, "grad_norm": 1.6006830997484989, "learning_rate": 7.909983711140158e-07, "loss": 0.6442, "step": 4727 }, { "epoch": 0.4362126628993196, "grad_norm": 1.2578526713809406, "learning_rate": 7.908169746939392e-07, "loss": 0.5649, "step": 4728 }, { "epoch": 0.4363049244608465, "grad_norm": 1.3801844213572867, "learning_rate": 7.906355632472676e-07, "loss": 0.7988, "step": 4729 }, { "epoch": 0.43639718602237343, "grad_norm": 1.9312663743238359, "learning_rate": 7.904541367904403e-07, "loss": 0.7162, "step": 4730 }, { "epoch": 0.43639718602237343, "eval_GEN Loss": 0.45685502886772156, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3747447729110718, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.9107571840286255, "eval_runtime": 56.5124, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 4730 }, { "epoch": 0.43648944758390035, "grad_norm": 2.9765664384317447, "learning_rate": 7.90272695339899e-07, "loss": 0.9391, "step": 4731 }, { "epoch": 0.43658170914542727, "grad_norm": 1.460876403810774, "learning_rate": 7.900912389120854e-07, "loss": 0.7276, "step": 4732 }, { "epoch": 0.43667397070695424, "grad_norm": 2.2349054837889297, "learning_rate": 7.899097675234442e-07, "loss": 0.7166, "step": 4733 }, { "epoch": 0.43676623226848116, "grad_norm": 1.723480762809233, "learning_rate": 7.897282811904202e-07, "loss": 0.7224, "step": 4734 }, { "epoch": 0.4368584938300081, "grad_norm": 1.8318653693499671, "learning_rate": 7.895467799294601e-07, "loss": 0.7709, "step": 4735 }, { "epoch": 0.4368584938300081, "eval_GEN Loss": 0.45638081431388855, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.37848106026649475, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8985576629638672, "eval_runtime": 56.6448, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4735 }, { "epoch": 0.436950755391535, "grad_norm": 1.220438129900743, "learning_rate": 7.893652637570119e-07, "loss": 0.5512, "step": 4736 }, { "epoch": 0.4370430169530619, "grad_norm": 2.851493326437574, "learning_rate": 7.891837326895246e-07, "loss": 0.6397, "step": 4737 }, { "epoch": 0.43713527851458883, "grad_norm": 1.4708804084798588, "learning_rate": 7.890021867434492e-07, "loss": 0.605, "step": 4738 }, { "epoch": 0.4372275400761158, "grad_norm": 1.3433940739755865, "learning_rate": 7.888206259352374e-07, "loss": 0.775, "step": 4739 }, { "epoch": 0.4373198016376427, "grad_norm": 1.475732801001111, "learning_rate": 7.886390502813427e-07, "loss": 0.5992, "step": 4740 }, { "epoch": 0.4373198016376427, "eval_GEN Loss": 0.4555416405200958, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.37685060501098633, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8908653855323792, "eval_runtime": 55.9757, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4740 }, { "epoch": 0.43741206319916964, "grad_norm": 1.3281806608626472, "learning_rate": 7.884574597982196e-07, "loss": 0.5943, "step": 4741 }, { "epoch": 0.43750432476069656, "grad_norm": 1.4371721177648529, "learning_rate": 7.882758545023242e-07, "loss": 0.7683, "step": 4742 }, { "epoch": 0.4375965863222235, "grad_norm": 1.770945879636497, "learning_rate": 7.880942344101139e-07, "loss": 0.6944, "step": 4743 }, { "epoch": 0.43768884788375045, "grad_norm": 2.084975711077187, "learning_rate": 7.879125995380473e-07, "loss": 0.746, "step": 4744 }, { "epoch": 0.43778110944527737, "grad_norm": 1.7872141698098307, "learning_rate": 7.877309499025846e-07, "loss": 0.6366, "step": 4745 }, { "epoch": 0.43778110944527737, "eval_GEN Loss": 0.45531877875328064, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3771788775920868, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8801081776618958, "eval_runtime": 56.7361, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4745 }, { "epoch": 0.4378733710068043, "grad_norm": 2.3334849378057436, "learning_rate": 7.875492855201869e-07, "loss": 0.9366, "step": 4746 }, { "epoch": 0.4379656325683312, "grad_norm": 2.9257632296595646, "learning_rate": 7.873676064073174e-07, "loss": 0.7818, "step": 4747 }, { "epoch": 0.4380578941298581, "grad_norm": 2.858632330477558, "learning_rate": 7.871859125804396e-07, "loss": 0.8169, "step": 4748 }, { "epoch": 0.4381501556913851, "grad_norm": 1.5087171651385534, "learning_rate": 7.870042040560191e-07, "loss": 0.561, "step": 4749 }, { "epoch": 0.438242417252912, "grad_norm": 2.2451100019082593, "learning_rate": 7.868224808505228e-07, "loss": 0.839, "step": 4750 }, { "epoch": 0.438242417252912, "eval_GEN Loss": 0.45469093322753906, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3725024163722992, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8673076629638672, "eval_runtime": 56.6244, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4750 }, { "epoch": 0.43833467881443894, "grad_norm": 1.1889179308205569, "learning_rate": 7.866407429804183e-07, "loss": 0.5852, "step": 4751 }, { "epoch": 0.43842694037596586, "grad_norm": 1.871711653204829, "learning_rate": 7.864589904621756e-07, "loss": 0.6783, "step": 4752 }, { "epoch": 0.4385192019374928, "grad_norm": 1.6205575764181466, "learning_rate": 7.862772233122648e-07, "loss": 0.6055, "step": 4753 }, { "epoch": 0.4386114634990197, "grad_norm": 2.2400422970137446, "learning_rate": 7.860954415471584e-07, "loss": 0.8432, "step": 4754 }, { "epoch": 0.43870372506054667, "grad_norm": 1.5118218747017385, "learning_rate": 7.859136451833292e-07, "loss": 0.5241, "step": 4755 }, { "epoch": 0.43870372506054667, "eval_GEN Loss": 0.4534633755683899, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3655868470668793, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8611177802085876, "eval_runtime": 55.906, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4755 }, { "epoch": 0.4387959866220736, "grad_norm": 2.1666910970961086, "learning_rate": 7.857318342372524e-07, "loss": 0.7509, "step": 4756 }, { "epoch": 0.4388882481836005, "grad_norm": 1.4314443742269678, "learning_rate": 7.855500087254036e-07, "loss": 0.6771, "step": 4757 }, { "epoch": 0.4389805097451274, "grad_norm": 3.240702909316351, "learning_rate": 7.853681686642605e-07, "loss": 0.683, "step": 4758 }, { "epoch": 0.43907277130665434, "grad_norm": 2.185201433066347, "learning_rate": 7.851863140703014e-07, "loss": 0.8244, "step": 4759 }, { "epoch": 0.4391650328681813, "grad_norm": 1.732147338873109, "learning_rate": 7.850044449600065e-07, "loss": 0.7374, "step": 4760 }, { "epoch": 0.4391650328681813, "eval_GEN Loss": 0.453051894903183, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3636787235736847, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8683894276618958, "eval_runtime": 55.8975, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4760 }, { "epoch": 0.43925729442970823, "grad_norm": 1.9485772039693157, "learning_rate": 7.84822561349857e-07, "loss": 0.8307, "step": 4761 }, { "epoch": 0.43934955599123515, "grad_norm": 2.3155495918170725, "learning_rate": 7.846406632563352e-07, "loss": 0.782, "step": 4762 }, { "epoch": 0.43944181755276207, "grad_norm": 2.0666922776645986, "learning_rate": 7.844587506959253e-07, "loss": 0.6995, "step": 4763 }, { "epoch": 0.439534079114289, "grad_norm": 1.7489909174463518, "learning_rate": 7.842768236851126e-07, "loss": 0.6288, "step": 4764 }, { "epoch": 0.43962634067581596, "grad_norm": 2.21609375260544, "learning_rate": 7.840948822403832e-07, "loss": 0.6768, "step": 4765 }, { "epoch": 0.43962634067581596, "eval_GEN Loss": 0.4514404237270355, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.37125304341316223, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8665865659713745, "eval_runtime": 55.9958, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4765 }, { "epoch": 0.4397186022373429, "grad_norm": 1.4894739301367836, "learning_rate": 7.839129263782254e-07, "loss": 0.4688, "step": 4766 }, { "epoch": 0.4398108637988698, "grad_norm": 2.2099234113535813, "learning_rate": 7.837309561151278e-07, "loss": 0.7292, "step": 4767 }, { "epoch": 0.4399031253603967, "grad_norm": 2.7676824290317796, "learning_rate": 7.835489714675813e-07, "loss": 0.8873, "step": 4768 }, { "epoch": 0.43999538692192364, "grad_norm": 1.7029644666170025, "learning_rate": 7.833669724520773e-07, "loss": 0.6308, "step": 4769 }, { "epoch": 0.44008764848345056, "grad_norm": 1.8047244326757594, "learning_rate": 7.831849590851092e-07, "loss": 0.744, "step": 4770 }, { "epoch": 0.44008764848345056, "eval_GEN Loss": 0.45074331760406494, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.37152284383773804, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.861057698726654, "eval_runtime": 56.0084, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4770 }, { "epoch": 0.44017991004497753, "grad_norm": 1.985972040598891, "learning_rate": 7.830029313831708e-07, "loss": 0.6057, "step": 4771 }, { "epoch": 0.44027217160650445, "grad_norm": 1.776340793529188, "learning_rate": 7.828208893627582e-07, "loss": 0.7532, "step": 4772 }, { "epoch": 0.44036443316803137, "grad_norm": 1.6615838048133282, "learning_rate": 7.826388330403684e-07, "loss": 0.8906, "step": 4773 }, { "epoch": 0.4404566947295583, "grad_norm": 1.7970364254549376, "learning_rate": 7.824567624324991e-07, "loss": 0.592, "step": 4774 }, { "epoch": 0.4405489562910852, "grad_norm": 1.517973739074256, "learning_rate": 7.822746775556503e-07, "loss": 0.6721, "step": 4775 }, { "epoch": 0.4405489562910852, "eval_GEN Loss": 0.45179668068885803, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3601956367492676, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8554086685180664, "eval_runtime": 55.8446, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4775 }, { "epoch": 0.4406412178526122, "grad_norm": 1.7242768935423405, "learning_rate": 7.820925784263228e-07, "loss": 0.5971, "step": 4776 }, { "epoch": 0.4407334794141391, "grad_norm": 1.1925857006572884, "learning_rate": 7.819104650610185e-07, "loss": 0.5697, "step": 4777 }, { "epoch": 0.440825740975666, "grad_norm": 1.3765474029365963, "learning_rate": 7.817283374762407e-07, "loss": 0.5928, "step": 4778 }, { "epoch": 0.44091800253719293, "grad_norm": 1.3595181832498626, "learning_rate": 7.815461956884946e-07, "loss": 0.6216, "step": 4779 }, { "epoch": 0.44101026409871985, "grad_norm": 1.9319352038786122, "learning_rate": 7.813640397142855e-07, "loss": 0.6597, "step": 4780 }, { "epoch": 0.44101026409871985, "eval_GEN Loss": 0.45005446672439575, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.34828728437423706, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8575119972229004, "eval_runtime": 55.7231, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4780 }, { "epoch": 0.4411025256602468, "grad_norm": 1.63841362992308, "learning_rate": 7.81181869570121e-07, "loss": 0.7085, "step": 4781 }, { "epoch": 0.44119478722177374, "grad_norm": 2.0986174305316956, "learning_rate": 7.809996852725098e-07, "loss": 0.6645, "step": 4782 }, { "epoch": 0.44128704878330066, "grad_norm": 2.5137942401289015, "learning_rate": 7.808174868379614e-07, "loss": 0.8704, "step": 4783 }, { "epoch": 0.4413793103448276, "grad_norm": 1.656877859233539, "learning_rate": 7.806352742829874e-07, "loss": 0.7192, "step": 4784 }, { "epoch": 0.4414715719063545, "grad_norm": 1.7358323922658172, "learning_rate": 7.804530476240996e-07, "loss": 0.7667, "step": 4785 }, { "epoch": 0.4414715719063545, "eval_GEN Loss": 0.44923657178878784, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9156626506024096, "eval_PRM F1 AUC": 0.8056574122577265, "eval_PRM F1 Neg": 0.6956521739130435, "eval_PRM Loss": 0.34491243958473206, "eval_PRM NPV": 0.6956521739130435, "eval_PRM Precision": 0.9156626506024096, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8598557710647583, "eval_runtime": 55.8686, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4785 }, { "epoch": 0.4415638334678814, "grad_norm": 1.605281302286443, "learning_rate": 7.802708068778122e-07, "loss": 0.6515, "step": 4786 }, { "epoch": 0.4416560950294084, "grad_norm": 1.6389882506750895, "learning_rate": 7.800885520606395e-07, "loss": 0.8425, "step": 4787 }, { "epoch": 0.4417483565909353, "grad_norm": 1.776386047484792, "learning_rate": 7.799062831890984e-07, "loss": 0.6836, "step": 4788 }, { "epoch": 0.44184061815246223, "grad_norm": 2.2046869659686985, "learning_rate": 7.79724000279706e-07, "loss": 0.7659, "step": 4789 }, { "epoch": 0.44193287971398915, "grad_norm": 2.3941912374817376, "learning_rate": 7.795417033489812e-07, "loss": 0.7922, "step": 4790 }, { "epoch": 0.44193287971398915, "eval_GEN Loss": 0.4503163695335388, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3538946211338043, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8618389368057251, "eval_runtime": 55.6367, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 4790 }, { "epoch": 0.44202514127551606, "grad_norm": 1.5441442386693927, "learning_rate": 7.793593924134441e-07, "loss": 0.6572, "step": 4791 }, { "epoch": 0.44211740283704304, "grad_norm": 1.1243489760331138, "learning_rate": 7.791770674896156e-07, "loss": 0.5188, "step": 4792 }, { "epoch": 0.44220966439856996, "grad_norm": 1.8425652076029724, "learning_rate": 7.789947285940187e-07, "loss": 0.6093, "step": 4793 }, { "epoch": 0.4423019259600969, "grad_norm": 1.8732889695357566, "learning_rate": 7.78812375743177e-07, "loss": 0.5471, "step": 4794 }, { "epoch": 0.4423941875216238, "grad_norm": 1.4563730659789382, "learning_rate": 7.78630008953616e-07, "loss": 0.4675, "step": 4795 }, { "epoch": 0.4423941875216238, "eval_GEN Loss": 0.45053258538246155, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.37071627378463745, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8669471144676208, "eval_runtime": 56.7245, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4795 }, { "epoch": 0.4424864490831507, "grad_norm": 2.007318523948068, "learning_rate": 7.784476282418616e-07, "loss": 0.8277, "step": 4796 }, { "epoch": 0.4425787106446777, "grad_norm": 1.799163404813176, "learning_rate": 7.782652336244415e-07, "loss": 0.7566, "step": 4797 }, { "epoch": 0.4426709722062046, "grad_norm": 2.303023717998823, "learning_rate": 7.780828251178847e-07, "loss": 0.8035, "step": 4798 }, { "epoch": 0.4427632337677315, "grad_norm": 1.7002716298587928, "learning_rate": 7.779004027387215e-07, "loss": 0.5458, "step": 4799 }, { "epoch": 0.44285549532925844, "grad_norm": 1.9925217701470759, "learning_rate": 7.77717966503483e-07, "loss": 0.7271, "step": 4800 }, { "epoch": 0.44285549532925844, "eval_GEN Loss": 0.45304542779922485, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.38917091488838196, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8785457015037537, "eval_runtime": 56.6945, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4800 }, { "epoch": 0.44294775689078536, "grad_norm": 2.986719044717841, "learning_rate": 7.775355164287022e-07, "loss": 0.7804, "step": 4801 }, { "epoch": 0.4430400184523123, "grad_norm": 2.2562939012523913, "learning_rate": 7.773530525309125e-07, "loss": 0.6427, "step": 4802 }, { "epoch": 0.44313228001383925, "grad_norm": 1.9290747727583886, "learning_rate": 7.771705748266495e-07, "loss": 0.6314, "step": 4803 }, { "epoch": 0.44322454157536617, "grad_norm": 3.0839909549121973, "learning_rate": 7.769880833324496e-07, "loss": 0.8221, "step": 4804 }, { "epoch": 0.4433168031368931, "grad_norm": 1.921391650958218, "learning_rate": 7.768055780648503e-07, "loss": 0.6413, "step": 4805 }, { "epoch": 0.4433168031368931, "eval_GEN Loss": 0.45261216163635254, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3995911180973053, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8856971263885498, "eval_runtime": 57.0424, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 4805 }, { "epoch": 0.44340906469842, "grad_norm": 2.9780937426633463, "learning_rate": 7.766230590403904e-07, "loss": 0.8061, "step": 4806 }, { "epoch": 0.4435013262599469, "grad_norm": 1.8450868215652818, "learning_rate": 7.764405262756104e-07, "loss": 0.6345, "step": 4807 }, { "epoch": 0.4435935878214739, "grad_norm": 2.3754753751792403, "learning_rate": 7.762579797870515e-07, "loss": 0.7644, "step": 4808 }, { "epoch": 0.4436858493830008, "grad_norm": 2.1365312100168774, "learning_rate": 7.760754195912564e-07, "loss": 0.8568, "step": 4809 }, { "epoch": 0.44377811094452774, "grad_norm": 1.8446715708338701, "learning_rate": 7.758928457047689e-07, "loss": 0.7715, "step": 4810 }, { "epoch": 0.44377811094452774, "eval_GEN Loss": 0.4512128233909607, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.38094592094421387, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8855168223381042, "eval_runtime": 56.854, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 4810 }, { "epoch": 0.44387037250605466, "grad_norm": 1.841589076809374, "learning_rate": 7.757102581441343e-07, "loss": 0.668, "step": 4811 }, { "epoch": 0.4439626340675816, "grad_norm": 2.114693763730368, "learning_rate": 7.755276569258989e-07, "loss": 0.693, "step": 4812 }, { "epoch": 0.44405489562910855, "grad_norm": 3.1022000937263647, "learning_rate": 7.753450420666102e-07, "loss": 0.8962, "step": 4813 }, { "epoch": 0.44414715719063547, "grad_norm": 2.4705606480548057, "learning_rate": 7.751624135828173e-07, "loss": 0.9391, "step": 4814 }, { "epoch": 0.4442394187521624, "grad_norm": 2.3808550835265363, "learning_rate": 7.749797714910699e-07, "loss": 0.8386, "step": 4815 }, { "epoch": 0.4442394187521624, "eval_GEN Loss": 0.4507255554199219, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3729810118675232, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8896634578704834, "eval_runtime": 56.8345, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4815 }, { "epoch": 0.4443316803136893, "grad_norm": 1.2881464996014005, "learning_rate": 7.747971158079198e-07, "loss": 0.535, "step": 4816 }, { "epoch": 0.4444239418752162, "grad_norm": 1.9251732899434935, "learning_rate": 7.74614446549919e-07, "loss": 0.6671, "step": 4817 }, { "epoch": 0.44451620343674314, "grad_norm": 1.1064141952953248, "learning_rate": 7.744317637336219e-07, "loss": 0.493, "step": 4818 }, { "epoch": 0.4446084649982701, "grad_norm": 1.7220802946659477, "learning_rate": 7.742490673755828e-07, "loss": 0.7089, "step": 4819 }, { "epoch": 0.44470072655979703, "grad_norm": 1.667914324171535, "learning_rate": 7.740663574923585e-07, "loss": 0.7239, "step": 4820 }, { "epoch": 0.44470072655979703, "eval_GEN Loss": 0.45077958703041077, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36934369802474976, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.885036051273346, "eval_runtime": 56.9004, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 4820 }, { "epoch": 0.44479298812132395, "grad_norm": 2.4051284281544008, "learning_rate": 7.738836341005061e-07, "loss": 0.6486, "step": 4821 }, { "epoch": 0.44488524968285087, "grad_norm": 2.100640589879822, "learning_rate": 7.737008972165845e-07, "loss": 0.7158, "step": 4822 }, { "epoch": 0.4449775112443778, "grad_norm": 1.4744789673232082, "learning_rate": 7.735181468571537e-07, "loss": 0.6284, "step": 4823 }, { "epoch": 0.44506977280590476, "grad_norm": 2.804631358799138, "learning_rate": 7.733353830387745e-07, "loss": 0.8886, "step": 4824 }, { "epoch": 0.4451620343674317, "grad_norm": 1.8843128731509087, "learning_rate": 7.731526057780095e-07, "loss": 0.6063, "step": 4825 }, { "epoch": 0.4451620343674317, "eval_GEN Loss": 0.45132166147232056, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37580814957618713, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8762620091438293, "eval_runtime": 56.7269, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4825 }, { "epoch": 0.4452542959289586, "grad_norm": 2.570645657839632, "learning_rate": 7.729698150914221e-07, "loss": 0.8172, "step": 4826 }, { "epoch": 0.4453465574904855, "grad_norm": 3.5212540585522487, "learning_rate": 7.727870109955773e-07, "loss": 0.5646, "step": 4827 }, { "epoch": 0.44543881905201244, "grad_norm": 2.8120732974797917, "learning_rate": 7.726041935070407e-07, "loss": 0.9753, "step": 4828 }, { "epoch": 0.4455310806135394, "grad_norm": 1.9330917674393349, "learning_rate": 7.724213626423797e-07, "loss": 0.7229, "step": 4829 }, { "epoch": 0.44562334217506633, "grad_norm": 2.480624792920063, "learning_rate": 7.72238518418163e-07, "loss": 0.8723, "step": 4830 }, { "epoch": 0.44562334217506633, "eval_GEN Loss": 0.45189520716667175, "eval_GEN top-5 accuracy": 0.9798334064007015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3793484568595886, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8654447197914124, "eval_runtime": 56.795, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 4830 }, { "epoch": 0.44571560373659325, "grad_norm": 2.6109557418036973, "learning_rate": 7.720556608509598e-07, "loss": 0.7072, "step": 4831 }, { "epoch": 0.44580786529812017, "grad_norm": 2.0740767068097172, "learning_rate": 7.718727899573414e-07, "loss": 0.7491, "step": 4832 }, { "epoch": 0.4459001268596471, "grad_norm": 2.0795582649768, "learning_rate": 7.716899057538794e-07, "loss": 0.5855, "step": 4833 }, { "epoch": 0.445992388421174, "grad_norm": 2.373221478656409, "learning_rate": 7.715070082571474e-07, "loss": 0.8048, "step": 4834 }, { "epoch": 0.446084649982701, "grad_norm": 1.4641729344224168, "learning_rate": 7.713240974837196e-07, "loss": 0.5786, "step": 4835 }, { "epoch": 0.446084649982701, "eval_GEN Loss": 0.4521447420120239, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.38413938879966736, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8606970906257629, "eval_runtime": 56.7193, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4835 }, { "epoch": 0.4461769115442279, "grad_norm": 2.628735964238196, "learning_rate": 7.711411734501717e-07, "loss": 1.0273, "step": 4836 }, { "epoch": 0.4462691731057548, "grad_norm": 2.1616387352950093, "learning_rate": 7.709582361730808e-07, "loss": 0.8302, "step": 4837 }, { "epoch": 0.44636143466728173, "grad_norm": 1.9641014678194397, "learning_rate": 7.707752856690247e-07, "loss": 0.7127, "step": 4838 }, { "epoch": 0.44645369622880865, "grad_norm": 1.913015786658051, "learning_rate": 7.705923219545829e-07, "loss": 0.5397, "step": 4839 }, { "epoch": 0.4465459577903356, "grad_norm": 1.6983209753666597, "learning_rate": 7.704093450463354e-07, "loss": 0.565, "step": 4840 }, { "epoch": 0.4465459577903356, "eval_GEN Loss": 0.4515858292579651, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.37640830874443054, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8536658883094788, "eval_runtime": 56.537, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 4840 }, { "epoch": 0.44663821935186254, "grad_norm": 2.812214292873485, "learning_rate": 7.702263549608645e-07, "loss": 0.6776, "step": 4841 }, { "epoch": 0.44673048091338946, "grad_norm": 1.8700123400300712, "learning_rate": 7.700433517147525e-07, "loss": 0.7706, "step": 4842 }, { "epoch": 0.4468227424749164, "grad_norm": 1.7716181250568908, "learning_rate": 7.698603353245838e-07, "loss": 0.6339, "step": 4843 }, { "epoch": 0.4469150040364433, "grad_norm": 1.9982389798193847, "learning_rate": 7.696773058069435e-07, "loss": 0.6139, "step": 4844 }, { "epoch": 0.44700726559797027, "grad_norm": 1.7480786363303933, "learning_rate": 7.694942631784177e-07, "loss": 0.7797, "step": 4845 }, { "epoch": 0.44700726559797027, "eval_GEN Loss": 0.4507410228252411, "eval_GEN top-5 accuracy": 0.979395002192021, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.370062917470932, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8489783406257629, "eval_runtime": 56.7104, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4845 }, { "epoch": 0.4470995271594972, "grad_norm": 1.8108676716619183, "learning_rate": 7.693112074555948e-07, "loss": 0.6209, "step": 4846 }, { "epoch": 0.4471917887210241, "grad_norm": 1.5820263693056011, "learning_rate": 7.69128138655063e-07, "loss": 0.6006, "step": 4847 }, { "epoch": 0.447284050282551, "grad_norm": 2.126790408860593, "learning_rate": 7.689450567934124e-07, "loss": 0.6374, "step": 4848 }, { "epoch": 0.44737631184407795, "grad_norm": 2.1815452008407012, "learning_rate": 7.687619618872341e-07, "loss": 0.6349, "step": 4849 }, { "epoch": 0.44746857340560486, "grad_norm": 2.4343238388434125, "learning_rate": 7.685788539531206e-07, "loss": 0.7702, "step": 4850 }, { "epoch": 0.44746857340560486, "eval_GEN Loss": 0.4504643380641937, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3582235276699066, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8538461327552795, "eval_runtime": 56.693, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4850 }, { "epoch": 0.44756083496713184, "grad_norm": 2.2663135345932623, "learning_rate": 7.683957330076652e-07, "loss": 0.6538, "step": 4851 }, { "epoch": 0.44765309652865876, "grad_norm": 2.132805764674252, "learning_rate": 7.68212599067463e-07, "loss": 0.9194, "step": 4852 }, { "epoch": 0.4477453580901857, "grad_norm": 1.6010715966128504, "learning_rate": 7.680294521491096e-07, "loss": 0.7194, "step": 4853 }, { "epoch": 0.4478376196517126, "grad_norm": 2.4274324377270005, "learning_rate": 7.678462922692019e-07, "loss": 1.0255, "step": 4854 }, { "epoch": 0.4479298812132395, "grad_norm": 1.4969939309329234, "learning_rate": 7.676631194443386e-07, "loss": 0.6899, "step": 4855 }, { "epoch": 0.4479298812132395, "eval_GEN Loss": 0.45059728622436523, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.35486912727355957, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.867968738079071, "eval_runtime": 56.6536, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4855 }, { "epoch": 0.4480221427747665, "grad_norm": 1.9979014362941518, "learning_rate": 7.674799336911188e-07, "loss": 0.8014, "step": 4856 }, { "epoch": 0.4481144043362934, "grad_norm": 1.4919786696966808, "learning_rate": 7.67296735026143e-07, "loss": 0.5706, "step": 4857 }, { "epoch": 0.4482066658978203, "grad_norm": 1.6622866502173277, "learning_rate": 7.671135234660132e-07, "loss": 0.6627, "step": 4858 }, { "epoch": 0.44829892745934724, "grad_norm": 1.574304262988785, "learning_rate": 7.669302990273322e-07, "loss": 0.6814, "step": 4859 }, { "epoch": 0.44839118902087416, "grad_norm": 1.8139931423670066, "learning_rate": 7.667470617267042e-07, "loss": 0.7405, "step": 4860 }, { "epoch": 0.44839118902087416, "eval_GEN Loss": 0.4502272605895996, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3589043915271759, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8643028736114502, "eval_runtime": 55.8577, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4860 }, { "epoch": 0.44848345058240113, "grad_norm": 1.3678175189899773, "learning_rate": 7.665638115807342e-07, "loss": 0.6269, "step": 4861 }, { "epoch": 0.44857571214392805, "grad_norm": 1.6185558412626861, "learning_rate": 7.663805486060289e-07, "loss": 0.7329, "step": 4862 }, { "epoch": 0.44866797370545497, "grad_norm": 2.9892987671955757, "learning_rate": 7.661972728191957e-07, "loss": 1.0226, "step": 4863 }, { "epoch": 0.4487602352669819, "grad_norm": 2.179069975887705, "learning_rate": 7.660139842368435e-07, "loss": 0.8208, "step": 4864 }, { "epoch": 0.4488524968285088, "grad_norm": 2.0548584731826938, "learning_rate": 7.658306828755818e-07, "loss": 0.8413, "step": 4865 }, { "epoch": 0.4488524968285088, "eval_GEN Loss": 0.4502057433128357, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.37014564871788025, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.856249988079071, "eval_runtime": 55.7607, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4865 }, { "epoch": 0.4489447583900357, "grad_norm": 1.4487256427379562, "learning_rate": 7.656473687520221e-07, "loss": 0.6295, "step": 4866 }, { "epoch": 0.4490370199515627, "grad_norm": 2.277522339618264, "learning_rate": 7.654640418827765e-07, "loss": 0.8831, "step": 4867 }, { "epoch": 0.4491292815130896, "grad_norm": 1.9571596028049818, "learning_rate": 7.652807022844584e-07, "loss": 0.8194, "step": 4868 }, { "epoch": 0.44922154307461654, "grad_norm": 1.6935564321127696, "learning_rate": 7.650973499736821e-07, "loss": 0.6988, "step": 4869 }, { "epoch": 0.44931380463614345, "grad_norm": 1.4444543691657843, "learning_rate": 7.649139849670635e-07, "loss": 0.6097, "step": 4870 }, { "epoch": 0.44931380463614345, "eval_GEN Loss": 0.44942644238471985, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.39153990149497986, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8543269038200378, "eval_runtime": 56.7582, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4870 }, { "epoch": 0.4494060661976704, "grad_norm": 1.481849699332203, "learning_rate": 7.647306072812194e-07, "loss": 0.6118, "step": 4871 }, { "epoch": 0.44949832775919735, "grad_norm": 2.17582434683825, "learning_rate": 7.645472169327676e-07, "loss": 0.666, "step": 4872 }, { "epoch": 0.44959058932072427, "grad_norm": 1.6633709925166593, "learning_rate": 7.643638139383275e-07, "loss": 0.6538, "step": 4873 }, { "epoch": 0.4496828508822512, "grad_norm": 2.537791126561003, "learning_rate": 7.641803983145191e-07, "loss": 0.9678, "step": 4874 }, { "epoch": 0.4497751124437781, "grad_norm": 2.181364453374548, "learning_rate": 7.639969700779641e-07, "loss": 0.7047, "step": 4875 }, { "epoch": 0.4497751124437781, "eval_GEN Loss": 0.4490335285663605, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3929685950279236, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8465144038200378, "eval_runtime": 56.6371, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4875 }, { "epoch": 0.449867374005305, "grad_norm": 2.6966577165027434, "learning_rate": 7.638135292452847e-07, "loss": 0.6698, "step": 4876 }, { "epoch": 0.449959635566832, "grad_norm": 1.4443608177416574, "learning_rate": 7.636300758331047e-07, "loss": 0.5998, "step": 4877 }, { "epoch": 0.4500518971283589, "grad_norm": 2.831607100701258, "learning_rate": 7.634466098580492e-07, "loss": 0.9286, "step": 4878 }, { "epoch": 0.45014415868988583, "grad_norm": 1.7507049828430707, "learning_rate": 7.632631313367439e-07, "loss": 0.725, "step": 4879 }, { "epoch": 0.45023642025141275, "grad_norm": 1.9510999148381207, "learning_rate": 7.630796402858162e-07, "loss": 0.7925, "step": 4880 }, { "epoch": 0.45023642025141275, "eval_GEN Loss": 0.4499054551124573, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3835833668708801, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8394832015037537, "eval_runtime": 56.6716, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4880 }, { "epoch": 0.45032868181293967, "grad_norm": 3.04660900868595, "learning_rate": 7.62896136721894e-07, "loss": 0.7816, "step": 4881 }, { "epoch": 0.4504209433744666, "grad_norm": 1.3937106977820775, "learning_rate": 7.627126206616069e-07, "loss": 0.5557, "step": 4882 }, { "epoch": 0.45051320493599356, "grad_norm": 1.7126895050649609, "learning_rate": 7.625290921215854e-07, "loss": 0.5991, "step": 4883 }, { "epoch": 0.4506054664975205, "grad_norm": 1.4418365448775643, "learning_rate": 7.62345551118461e-07, "loss": 0.7152, "step": 4884 }, { "epoch": 0.4506977280590474, "grad_norm": 1.9764253270485501, "learning_rate": 7.621619976688665e-07, "loss": 0.766, "step": 4885 }, { "epoch": 0.4506977280590474, "eval_GEN Loss": 0.4499186873435974, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.368186891078949, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8313100934028625, "eval_runtime": 55.758, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4885 }, { "epoch": 0.4507899896205743, "grad_norm": 1.5134741205242028, "learning_rate": 7.619784317894361e-07, "loss": 0.7556, "step": 4886 }, { "epoch": 0.45088225118210123, "grad_norm": 1.3158162165921703, "learning_rate": 7.617948534968045e-07, "loss": 0.674, "step": 4887 }, { "epoch": 0.4509745127436282, "grad_norm": 1.9197816874277895, "learning_rate": 7.616112628076078e-07, "loss": 0.887, "step": 4888 }, { "epoch": 0.4510667743051551, "grad_norm": 2.2854476850128242, "learning_rate": 7.614276597384838e-07, "loss": 0.787, "step": 4889 }, { "epoch": 0.45115903586668205, "grad_norm": 2.2649618336356916, "learning_rate": 7.612440443060701e-07, "loss": 0.6828, "step": 4890 }, { "epoch": 0.45115903586668205, "eval_GEN Loss": 0.4500063955783844, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35555335879325867, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8332932591438293, "eval_runtime": 55.6629, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 4890 }, { "epoch": 0.45125129742820896, "grad_norm": 1.5049490150529958, "learning_rate": 7.610604165270069e-07, "loss": 0.7353, "step": 4891 }, { "epoch": 0.4513435589897359, "grad_norm": 2.8899498641832517, "learning_rate": 7.608767764179346e-07, "loss": 0.8419, "step": 4892 }, { "epoch": 0.45143582055126286, "grad_norm": 1.198976224826009, "learning_rate": 7.606931239954949e-07, "loss": 0.4259, "step": 4893 }, { "epoch": 0.4515280821127898, "grad_norm": 3.0269633309098025, "learning_rate": 7.605094592763306e-07, "loss": 0.6835, "step": 4894 }, { "epoch": 0.4516203436743167, "grad_norm": 2.557644373174563, "learning_rate": 7.60325782277086e-07, "loss": 0.7251, "step": 4895 }, { "epoch": 0.4516203436743167, "eval_GEN Loss": 0.44926685094833374, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3499768078327179, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8364182710647583, "eval_runtime": 56.7091, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 4895 }, { "epoch": 0.4517126052358436, "grad_norm": 3.5459197690003723, "learning_rate": 7.601420930144059e-07, "loss": 0.7886, "step": 4896 }, { "epoch": 0.45180486679737053, "grad_norm": 3.054037733353994, "learning_rate": 7.599583915049366e-07, "loss": 0.8192, "step": 4897 }, { "epoch": 0.45189712835889745, "grad_norm": 1.515783930843749, "learning_rate": 7.597746777653256e-07, "loss": 0.536, "step": 4898 }, { "epoch": 0.4519893899204244, "grad_norm": 1.682670060532119, "learning_rate": 7.595909518122208e-07, "loss": 0.5172, "step": 4899 }, { "epoch": 0.45208165148195134, "grad_norm": 1.6412395197587741, "learning_rate": 7.594072136622725e-07, "loss": 0.629, "step": 4900 }, { "epoch": 0.45208165148195134, "eval_GEN Loss": 0.4507950246334076, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3577316701412201, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8379206657409668, "eval_runtime": 55.6547, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 4900 }, { "epoch": 0.45217391304347826, "grad_norm": 1.7267695826749865, "learning_rate": 7.592234633321306e-07, "loss": 0.6973, "step": 4901 }, { "epoch": 0.4522661746050052, "grad_norm": 2.099310162832629, "learning_rate": 7.590397008384473e-07, "loss": 0.6818, "step": 4902 }, { "epoch": 0.4523584361665321, "grad_norm": 2.1240867507643793, "learning_rate": 7.588559261978755e-07, "loss": 0.6809, "step": 4903 }, { "epoch": 0.45245069772805907, "grad_norm": 1.808799001425262, "learning_rate": 7.586721394270688e-07, "loss": 0.7394, "step": 4904 }, { "epoch": 0.452542959289586, "grad_norm": 1.7549151744918023, "learning_rate": 7.584883405426825e-07, "loss": 0.5799, "step": 4905 }, { "epoch": 0.452542959289586, "eval_GEN Loss": 0.4503755569458008, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3593742549419403, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8368990421295166, "eval_runtime": 55.5806, "eval_samples_per_second": 1.169, "eval_steps_per_second": 0.09, "step": 4905 }, { "epoch": 0.4526352208511129, "grad_norm": 1.7321911269492725, "learning_rate": 7.583045295613728e-07, "loss": 0.7793, "step": 4906 }, { "epoch": 0.4527274824126398, "grad_norm": 1.9116750763601016, "learning_rate": 7.581207064997967e-07, "loss": 0.8343, "step": 4907 }, { "epoch": 0.45281974397416674, "grad_norm": 1.6655752312170424, "learning_rate": 7.579368713746124e-07, "loss": 0.5265, "step": 4908 }, { "epoch": 0.4529120055356937, "grad_norm": 2.322114515471997, "learning_rate": 7.577530242024799e-07, "loss": 0.7986, "step": 4909 }, { "epoch": 0.45300426709722064, "grad_norm": 1.4256121672929263, "learning_rate": 7.575691650000591e-07, "loss": 0.5562, "step": 4910 }, { "epoch": 0.45300426709722064, "eval_GEN Loss": 0.45039743185043335, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.35517624020576477, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8301081657409668, "eval_runtime": 55.9073, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4910 }, { "epoch": 0.45309652865874755, "grad_norm": 2.6454278418593553, "learning_rate": 7.573852937840121e-07, "loss": 0.6819, "step": 4911 }, { "epoch": 0.4531887902202745, "grad_norm": 1.89941985235204, "learning_rate": 7.572014105710014e-07, "loss": 0.6334, "step": 4912 }, { "epoch": 0.4532810517818014, "grad_norm": 1.5715184696915319, "learning_rate": 7.570175153776907e-07, "loss": 0.5503, "step": 4913 }, { "epoch": 0.4533733133433283, "grad_norm": 1.810656663596407, "learning_rate": 7.56833608220745e-07, "loss": 0.6956, "step": 4914 }, { "epoch": 0.4534655749048553, "grad_norm": 1.5651193704295547, "learning_rate": 7.566496891168301e-07, "loss": 0.6991, "step": 4915 }, { "epoch": 0.4534655749048553, "eval_GEN Loss": 0.4512878954410553, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3510670065879822, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8298677802085876, "eval_runtime": 55.9225, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 4915 }, { "epoch": 0.4535578364663822, "grad_norm": 1.7080790164245894, "learning_rate": 7.564657580826133e-07, "loss": 0.7094, "step": 4916 }, { "epoch": 0.4536500980279091, "grad_norm": 1.5394826523159315, "learning_rate": 7.562818151347626e-07, "loss": 0.5616, "step": 4917 }, { "epoch": 0.45374235958943604, "grad_norm": 3.019054420024775, "learning_rate": 7.560978602899471e-07, "loss": 0.8298, "step": 4918 }, { "epoch": 0.45383462115096296, "grad_norm": 2.6445069351837147, "learning_rate": 7.559138935648372e-07, "loss": 0.888, "step": 4919 }, { "epoch": 0.45392688271248993, "grad_norm": 1.9833660274217133, "learning_rate": 7.55729914976104e-07, "loss": 0.789, "step": 4920 }, { "epoch": 0.45392688271248993, "eval_GEN Loss": 0.4534490406513214, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.35090965032577515, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.828906238079071, "eval_runtime": 55.7499, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4920 }, { "epoch": 0.45401914427401685, "grad_norm": 1.719519788288224, "learning_rate": 7.555459245404205e-07, "loss": 0.5588, "step": 4921 }, { "epoch": 0.45411140583554377, "grad_norm": 3.2076227876162653, "learning_rate": 7.553619222744596e-07, "loss": 0.7524, "step": 4922 }, { "epoch": 0.4542036673970707, "grad_norm": 1.6974159171648042, "learning_rate": 7.551779081948961e-07, "loss": 0.8009, "step": 4923 }, { "epoch": 0.4542959289585976, "grad_norm": 1.736419123915355, "learning_rate": 7.549938823184056e-07, "loss": 0.6365, "step": 4924 }, { "epoch": 0.4543881905201246, "grad_norm": 2.2744503247127934, "learning_rate": 7.548098446616651e-07, "loss": 0.6579, "step": 4925 }, { "epoch": 0.4543881905201246, "eval_GEN Loss": 0.4548953175544739, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3620133697986603, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8353365659713745, "eval_runtime": 55.964, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 4925 }, { "epoch": 0.4544804520816515, "grad_norm": 1.6173522818511181, "learning_rate": 7.546257952413519e-07, "loss": 0.6222, "step": 4926 }, { "epoch": 0.4545727136431784, "grad_norm": 1.8907619268153513, "learning_rate": 7.544417340741451e-07, "loss": 0.6265, "step": 4927 }, { "epoch": 0.45466497520470533, "grad_norm": 1.5789035785743983, "learning_rate": 7.542576611767249e-07, "loss": 0.5191, "step": 4928 }, { "epoch": 0.45475723676623225, "grad_norm": 2.7755379481121105, "learning_rate": 7.540735765657718e-07, "loss": 0.7507, "step": 4929 }, { "epoch": 0.45484949832775917, "grad_norm": 1.6912425593118265, "learning_rate": 7.53889480257968e-07, "loss": 0.6981, "step": 4930 }, { "epoch": 0.45484949832775917, "eval_GEN Loss": 0.45486512780189514, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3667934834957123, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8427283763885498, "eval_runtime": 55.7022, "eval_samples_per_second": 1.167, "eval_steps_per_second": 0.09, "step": 4930 }, { "epoch": 0.45494175988928615, "grad_norm": 1.5819340154822799, "learning_rate": 7.537053722699967e-07, "loss": 0.5739, "step": 4931 }, { "epoch": 0.45503402145081306, "grad_norm": 2.354660028094656, "learning_rate": 7.535212526185421e-07, "loss": 0.6705, "step": 4932 }, { "epoch": 0.45512628301234, "grad_norm": 4.948548157757214, "learning_rate": 7.53337121320289e-07, "loss": 0.6655, "step": 4933 }, { "epoch": 0.4552185445738669, "grad_norm": 1.6124851947984569, "learning_rate": 7.531529783919241e-07, "loss": 0.6446, "step": 4934 }, { "epoch": 0.4553108061353938, "grad_norm": 2.3429487197378043, "learning_rate": 7.529688238501347e-07, "loss": 0.7762, "step": 4935 }, { "epoch": 0.4553108061353938, "eval_GEN Loss": 0.4550427496433258, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3717118501663208, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8502404093742371, "eval_runtime": 55.7811, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4935 }, { "epoch": 0.4554030676969208, "grad_norm": 1.801149240150357, "learning_rate": 7.527846577116088e-07, "loss": 0.6255, "step": 4936 }, { "epoch": 0.4554953292584477, "grad_norm": 2.528651265330128, "learning_rate": 7.526004799930363e-07, "loss": 0.7562, "step": 4937 }, { "epoch": 0.45558759081997463, "grad_norm": 1.6882324453823547, "learning_rate": 7.524162907111073e-07, "loss": 0.6666, "step": 4938 }, { "epoch": 0.45567985238150155, "grad_norm": 2.246075343274532, "learning_rate": 7.522320898825136e-07, "loss": 0.8669, "step": 4939 }, { "epoch": 0.45577211394302847, "grad_norm": 2.1686667106183077, "learning_rate": 7.520478775239476e-07, "loss": 0.8487, "step": 4940 }, { "epoch": 0.45577211394302847, "eval_GEN Loss": 0.454032838344574, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.37621140480041504, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8484975695610046, "eval_runtime": 55.7576, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 4940 }, { "epoch": 0.45586437550455544, "grad_norm": 1.8626894533226532, "learning_rate": 7.518636536521031e-07, "loss": 0.6564, "step": 4941 }, { "epoch": 0.45595663706608236, "grad_norm": 1.7787638907297374, "learning_rate": 7.516794182836745e-07, "loss": 0.743, "step": 4942 }, { "epoch": 0.4560488986276093, "grad_norm": 2.312516016602605, "learning_rate": 7.514951714353575e-07, "loss": 0.7205, "step": 4943 }, { "epoch": 0.4561411601891362, "grad_norm": 1.65867382744602, "learning_rate": 7.513109131238491e-07, "loss": 0.6606, "step": 4944 }, { "epoch": 0.4562334217506631, "grad_norm": 2.4769185946808716, "learning_rate": 7.51126643365847e-07, "loss": 0.8568, "step": 4945 }, { "epoch": 0.4562334217506631, "eval_GEN Loss": 0.4549756348133087, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.380465030670166, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.852343738079071, "eval_runtime": 55.5162, "eval_samples_per_second": 1.171, "eval_steps_per_second": 0.09, "step": 4945 }, { "epoch": 0.45632568331219003, "grad_norm": 1.8883562084182937, "learning_rate": 7.509423621780498e-07, "loss": 0.5834, "step": 4946 }, { "epoch": 0.456417944873717, "grad_norm": 1.2885661165766986, "learning_rate": 7.507580695771576e-07, "loss": 0.6534, "step": 4947 }, { "epoch": 0.4565102064352439, "grad_norm": 2.4289534962266615, "learning_rate": 7.505737655798711e-07, "loss": 0.8856, "step": 4948 }, { "epoch": 0.45660246799677084, "grad_norm": 2.9740327471298547, "learning_rate": 7.503894502028925e-07, "loss": 0.7971, "step": 4949 }, { "epoch": 0.45669472955829776, "grad_norm": 2.5123813406885085, "learning_rate": 7.502051234629242e-07, "loss": 0.853, "step": 4950 }, { "epoch": 0.45669472955829776, "eval_GEN Loss": 0.45578035712242126, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.38547927141189575, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8516826629638672, "eval_runtime": 55.8223, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 4950 }, { "epoch": 0.4567869911198247, "grad_norm": 1.794647228204393, "learning_rate": 7.500207853766708e-07, "loss": 0.8264, "step": 4951 }, { "epoch": 0.45687925268135166, "grad_norm": 2.0793792597008207, "learning_rate": 7.498364359608369e-07, "loss": 0.6547, "step": 4952 }, { "epoch": 0.4569715142428786, "grad_norm": 2.056497126713187, "learning_rate": 7.496520752321289e-07, "loss": 0.6192, "step": 4953 }, { "epoch": 0.4570637758044055, "grad_norm": 2.2606158939808143, "learning_rate": 7.494677032072535e-07, "loss": 0.7396, "step": 4954 }, { "epoch": 0.4571560373659324, "grad_norm": 2.4449165214326536, "learning_rate": 7.492833199029191e-07, "loss": 0.5905, "step": 4955 }, { "epoch": 0.4571560373659324, "eval_GEN Loss": 0.4551500976085663, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3771830201148987, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8567307591438293, "eval_runtime": 55.802, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 4955 }, { "epoch": 0.45724829892745933, "grad_norm": 1.8396518642624526, "learning_rate": 7.490989253358343e-07, "loss": 0.7613, "step": 4956 }, { "epoch": 0.4573405604889863, "grad_norm": 1.965138443022425, "learning_rate": 7.489145195227098e-07, "loss": 0.8779, "step": 4957 }, { "epoch": 0.4574328220505132, "grad_norm": 2.9043037437403765, "learning_rate": 7.487301024802564e-07, "loss": 0.8048, "step": 4958 }, { "epoch": 0.45752508361204014, "grad_norm": 1.731255930748899, "learning_rate": 7.485456742251862e-07, "loss": 0.6119, "step": 4959 }, { "epoch": 0.45761734517356706, "grad_norm": 1.7769125894703208, "learning_rate": 7.483612347742128e-07, "loss": 0.7566, "step": 4960 }, { "epoch": 0.45761734517356706, "eval_GEN Loss": 0.4544562101364136, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3793272078037262, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8551682829856873, "eval_runtime": 55.6503, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 4960 }, { "epoch": 0.457709606735094, "grad_norm": 4.190430959023868, "learning_rate": 7.4817678414405e-07, "loss": 0.9238, "step": 4961 }, { "epoch": 0.4578018682966209, "grad_norm": 2.030988211476841, "learning_rate": 7.479923223514132e-07, "loss": 0.6298, "step": 4962 }, { "epoch": 0.45789412985814787, "grad_norm": 1.3911046802032352, "learning_rate": 7.478078494130185e-07, "loss": 0.5927, "step": 4963 }, { "epoch": 0.4579863914196748, "grad_norm": 2.0391226148920407, "learning_rate": 7.476233653455832e-07, "loss": 0.6528, "step": 4964 }, { "epoch": 0.4580786529812017, "grad_norm": 1.485347592023389, "learning_rate": 7.474388701658257e-07, "loss": 0.4887, "step": 4965 }, { "epoch": 0.4580786529812017, "eval_GEN Loss": 0.4552704095840454, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3841768205165863, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8591346144676208, "eval_runtime": 55.8689, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 4965 }, { "epoch": 0.4581709145427286, "grad_norm": 1.4323814822172904, "learning_rate": 7.472543638904647e-07, "loss": 0.6845, "step": 4966 }, { "epoch": 0.45826317610425554, "grad_norm": 2.1472832595312035, "learning_rate": 7.470698465362211e-07, "loss": 0.6259, "step": 4967 }, { "epoch": 0.4583554376657825, "grad_norm": 2.501451537834362, "learning_rate": 7.468853181198158e-07, "loss": 0.6265, "step": 4968 }, { "epoch": 0.45844769922730944, "grad_norm": 2.622597194908958, "learning_rate": 7.467007786579711e-07, "loss": 0.677, "step": 4969 }, { "epoch": 0.45853996078883635, "grad_norm": 2.290725397699514, "learning_rate": 7.465162281674101e-07, "loss": 0.6437, "step": 4970 }, { "epoch": 0.45853996078883635, "eval_GEN Loss": 0.45411595702171326, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.38517871499061584, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8573918342590332, "eval_runtime": 56.6704, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4970 }, { "epoch": 0.45863222235036327, "grad_norm": 1.316164557732957, "learning_rate": 7.463316666648576e-07, "loss": 0.5487, "step": 4971 }, { "epoch": 0.4587244839118902, "grad_norm": 1.5575148524141749, "learning_rate": 7.461470941670382e-07, "loss": 0.588, "step": 4972 }, { "epoch": 0.45881674547341716, "grad_norm": 2.990129029813399, "learning_rate": 7.459625106906786e-07, "loss": 0.7117, "step": 4973 }, { "epoch": 0.4589090070349441, "grad_norm": 1.852256905245319, "learning_rate": 7.457779162525057e-07, "loss": 0.699, "step": 4974 }, { "epoch": 0.459001268596471, "grad_norm": 2.412081676613645, "learning_rate": 7.45593310869248e-07, "loss": 0.803, "step": 4975 }, { "epoch": 0.459001268596471, "eval_GEN Loss": 0.4546949565410614, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3785286545753479, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8506009578704834, "eval_runtime": 56.5675, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 4975 }, { "epoch": 0.4590935301579979, "grad_norm": 2.119126372478069, "learning_rate": 7.454086945576347e-07, "loss": 0.7081, "step": 4976 }, { "epoch": 0.45918579171952484, "grad_norm": 1.6973209128827462, "learning_rate": 7.45224067334396e-07, "loss": 0.5334, "step": 4977 }, { "epoch": 0.45927805328105176, "grad_norm": 2.5467791459503486, "learning_rate": 7.450394292162632e-07, "loss": 0.6277, "step": 4978 }, { "epoch": 0.45937031484257873, "grad_norm": 1.6195247991899393, "learning_rate": 7.448547802199682e-07, "loss": 0.6766, "step": 4979 }, { "epoch": 0.45946257640410565, "grad_norm": 1.810499278714975, "learning_rate": 7.446701203622444e-07, "loss": 0.78, "step": 4980 }, { "epoch": 0.45946257640410565, "eval_GEN Loss": 0.4546329379081726, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3770916163921356, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8491586446762085, "eval_runtime": 56.642, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 4980 }, { "epoch": 0.45955483796563257, "grad_norm": 1.85580055262651, "learning_rate": 7.444854496598258e-07, "loss": 0.7662, "step": 4981 }, { "epoch": 0.4596470995271595, "grad_norm": 2.0377196482168047, "learning_rate": 7.443007681294479e-07, "loss": 0.7649, "step": 4982 }, { "epoch": 0.4597393610886864, "grad_norm": 1.665173827861678, "learning_rate": 7.441160757878464e-07, "loss": 0.7277, "step": 4983 }, { "epoch": 0.4598316226502134, "grad_norm": 2.1355473520302497, "learning_rate": 7.439313726517587e-07, "loss": 0.7198, "step": 4984 }, { "epoch": 0.4599238842117403, "grad_norm": 1.6984430104742805, "learning_rate": 7.437466587379228e-07, "loss": 0.7415, "step": 4985 }, { "epoch": 0.4599238842117403, "eval_GEN Loss": 0.4541141390800476, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3625849485397339, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8465144038200378, "eval_runtime": 56.6906, "eval_samples_per_second": 1.147, "eval_steps_per_second": 0.088, "step": 4985 }, { "epoch": 0.4600161457732672, "grad_norm": 2.277599877041432, "learning_rate": 7.435619340630779e-07, "loss": 0.8739, "step": 4986 }, { "epoch": 0.46010840733479413, "grad_norm": 1.6156176606162993, "learning_rate": 7.433771986439639e-07, "loss": 0.4829, "step": 4987 }, { "epoch": 0.46020066889632105, "grad_norm": 3.514341557894376, "learning_rate": 7.431924524973216e-07, "loss": 0.5859, "step": 4988 }, { "epoch": 0.460292930457848, "grad_norm": 2.1047453883562546, "learning_rate": 7.430076956398935e-07, "loss": 0.9115, "step": 4989 }, { "epoch": 0.46038519201937494, "grad_norm": 2.455887802964566, "learning_rate": 7.428229280884223e-07, "loss": 0.5133, "step": 4990 }, { "epoch": 0.46038519201937494, "eval_GEN Loss": 0.4544925391674042, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35270726680755615, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8459134697914124, "eval_runtime": 56.7642, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 4990 }, { "epoch": 0.46047745358090186, "grad_norm": 3.9077373950571075, "learning_rate": 7.426381498596516e-07, "loss": 0.8558, "step": 4991 }, { "epoch": 0.4605697151424288, "grad_norm": 2.56746837662475, "learning_rate": 7.424533609703267e-07, "loss": 0.759, "step": 4992 }, { "epoch": 0.4606619767039557, "grad_norm": 1.8135864506998511, "learning_rate": 7.422685614371935e-07, "loss": 0.6546, "step": 4993 }, { "epoch": 0.4607542382654826, "grad_norm": 3.2581595976135134, "learning_rate": 7.420837512769985e-07, "loss": 0.7769, "step": 4994 }, { "epoch": 0.4608464998270096, "grad_norm": 1.9800663331541388, "learning_rate": 7.418989305064897e-07, "loss": 0.7336, "step": 4995 }, { "epoch": 0.4608464998270096, "eval_GEN Loss": 0.45363399386405945, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.35003408789634705, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8316105604171753, "eval_runtime": 55.6593, "eval_samples_per_second": 1.168, "eval_steps_per_second": 0.09, "step": 4995 }, { "epoch": 0.4609387613885365, "grad_norm": 1.642342666630142, "learning_rate": 7.41714099142416e-07, "loss": 0.7434, "step": 4996 }, { "epoch": 0.46103102295006343, "grad_norm": 2.6641933098372927, "learning_rate": 7.415292572015268e-07, "loss": 0.7207, "step": 4997 }, { "epoch": 0.46112328451159035, "grad_norm": 1.8617530860482736, "learning_rate": 7.413444047005728e-07, "loss": 0.6419, "step": 4998 }, { "epoch": 0.46121554607311727, "grad_norm": 2.5155258952253807, "learning_rate": 7.411595416563057e-07, "loss": 0.8348, "step": 4999 }, { "epoch": 0.46130780763464424, "grad_norm": 2.209655647381459, "learning_rate": 7.409746680854783e-07, "loss": 0.6957, "step": 5000 }, { "epoch": 0.46130780763464424, "eval_GEN Loss": 0.4548896849155426, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3599395453929901, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8376802802085876, "eval_runtime": 56.1551, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5000 }, { "epoch": 0.46130780763464424, "eval_GEN Loss": 0.4548896849155426, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3599395453929901, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8376802802085876, "eval_runtime": 59.4587, "eval_samples_per_second": 1.093, "eval_steps_per_second": 0.084, "step": 5000 }, { "epoch": 0.46140006919617116, "grad_norm": 2.7067113255619684, "learning_rate": 7.407897840048439e-07, "loss": 0.8162, "step": 5001 }, { "epoch": 0.4614923307576981, "grad_norm": 2.12178759708444, "learning_rate": 7.406048894311568e-07, "loss": 0.727, "step": 5002 }, { "epoch": 0.461584592319225, "grad_norm": 1.8190661582980172, "learning_rate": 7.40419984381173e-07, "loss": 0.6795, "step": 5003 }, { "epoch": 0.4616768538807519, "grad_norm": 1.3721530474945036, "learning_rate": 7.402350688716482e-07, "loss": 0.5978, "step": 5004 }, { "epoch": 0.4617691154422789, "grad_norm": 1.7562678905050004, "learning_rate": 7.400501429193403e-07, "loss": 0.7952, "step": 5005 }, { "epoch": 0.4617691154422789, "eval_GEN Loss": 0.45453813672065735, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.35906457901000977, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8402042984962463, "eval_runtime": 56.1529, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5005 }, { "epoch": 0.4618613770038058, "grad_norm": 2.4780285134679896, "learning_rate": 7.398652065410072e-07, "loss": 0.8005, "step": 5006 }, { "epoch": 0.4619536385653327, "grad_norm": 1.88312588904045, "learning_rate": 7.396802597534082e-07, "loss": 0.6413, "step": 5007 }, { "epoch": 0.46204590012685964, "grad_norm": 1.4645991239752205, "learning_rate": 7.394953025733039e-07, "loss": 0.5477, "step": 5008 }, { "epoch": 0.46213816168838656, "grad_norm": 2.0395367910475386, "learning_rate": 7.393103350174548e-07, "loss": 0.7686, "step": 5009 }, { "epoch": 0.4622304232499135, "grad_norm": 2.4257728132476406, "learning_rate": 7.391253571026233e-07, "loss": 0.8361, "step": 5010 }, { "epoch": 0.4622304232499135, "eval_GEN Loss": 0.45380106568336487, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.35521697998046875, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8528245091438293, "eval_runtime": 56.0426, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5010 }, { "epoch": 0.46232268481144045, "grad_norm": 1.3892915940415596, "learning_rate": 7.389403688455722e-07, "loss": 0.5731, "step": 5011 }, { "epoch": 0.4624149463729674, "grad_norm": 1.7736855073548408, "learning_rate": 7.387553702630657e-07, "loss": 0.6036, "step": 5012 }, { "epoch": 0.4625072079344943, "grad_norm": 1.7878406039450523, "learning_rate": 7.385703613718684e-07, "loss": 0.7931, "step": 5013 }, { "epoch": 0.4625994694960212, "grad_norm": 1.9160742750891022, "learning_rate": 7.383853421887463e-07, "loss": 0.7088, "step": 5014 }, { "epoch": 0.46269173105754813, "grad_norm": 2.7915606736543404, "learning_rate": 7.382003127304658e-07, "loss": 0.8506, "step": 5015 }, { "epoch": 0.46269173105754813, "eval_GEN Loss": 0.4532504379749298, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.35240551829338074, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8615384697914124, "eval_runtime": 56.313, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 5015 }, { "epoch": 0.4627839926190751, "grad_norm": 1.6132212882824946, "learning_rate": 7.380152730137949e-07, "loss": 0.5568, "step": 5016 }, { "epoch": 0.462876254180602, "grad_norm": 2.549938417532724, "learning_rate": 7.37830223055502e-07, "loss": 0.7152, "step": 5017 }, { "epoch": 0.46296851574212894, "grad_norm": 1.7712908446958595, "learning_rate": 7.376451628723569e-07, "loss": 0.6925, "step": 5018 }, { "epoch": 0.46306077730365586, "grad_norm": 3.128437455798419, "learning_rate": 7.374600924811296e-07, "loss": 0.8224, "step": 5019 }, { "epoch": 0.4631530388651828, "grad_norm": 1.9791790601762616, "learning_rate": 7.372750118985917e-07, "loss": 0.614, "step": 5020 }, { "epoch": 0.4631530388651828, "eval_GEN Loss": 0.4533977210521698, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3550493121147156, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8611778616905212, "eval_runtime": 56.0306, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5020 }, { "epoch": 0.46324530042670975, "grad_norm": 1.388050522751467, "learning_rate": 7.370899211415159e-07, "loss": 0.7774, "step": 5021 }, { "epoch": 0.46333756198823667, "grad_norm": 1.747726247085499, "learning_rate": 7.369048202266745e-07, "loss": 0.7084, "step": 5022 }, { "epoch": 0.4634298235497636, "grad_norm": 2.2135411390193234, "learning_rate": 7.367197091708424e-07, "loss": 0.7332, "step": 5023 }, { "epoch": 0.4635220851112905, "grad_norm": 1.8369068917789173, "learning_rate": 7.365345879907943e-07, "loss": 0.6202, "step": 5024 }, { "epoch": 0.4636143466728174, "grad_norm": 1.806852679985912, "learning_rate": 7.363494567033064e-07, "loss": 0.4765, "step": 5025 }, { "epoch": 0.4636143466728174, "eval_GEN Loss": 0.45390281081199646, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3648715019226074, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8573918342590332, "eval_runtime": 56.1191, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5025 }, { "epoch": 0.46370660823434434, "grad_norm": 1.4699544492015268, "learning_rate": 7.361643153251555e-07, "loss": 0.704, "step": 5026 }, { "epoch": 0.4637988697958713, "grad_norm": 1.4038699548176106, "learning_rate": 7.359791638731193e-07, "loss": 0.5527, "step": 5027 }, { "epoch": 0.46389113135739823, "grad_norm": 1.87849515605073, "learning_rate": 7.357940023639766e-07, "loss": 0.6512, "step": 5028 }, { "epoch": 0.46398339291892515, "grad_norm": 2.126658122016276, "learning_rate": 7.356088308145068e-07, "loss": 0.6247, "step": 5029 }, { "epoch": 0.46407565448045207, "grad_norm": 2.0712560673444216, "learning_rate": 7.35423649241491e-07, "loss": 0.8045, "step": 5030 }, { "epoch": 0.46407565448045207, "eval_GEN Loss": 0.45462509989738464, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.36842361092567444, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8561298251152039, "eval_runtime": 56.0137, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5030 }, { "epoch": 0.464167916041979, "grad_norm": 1.5830389649738412, "learning_rate": 7.3523845766171e-07, "loss": 0.5395, "step": 5031 }, { "epoch": 0.46426017760350596, "grad_norm": 2.2103854863883274, "learning_rate": 7.350532560919466e-07, "loss": 0.6877, "step": 5032 }, { "epoch": 0.4643524391650329, "grad_norm": 2.288749988547474, "learning_rate": 7.348680445489839e-07, "loss": 0.6593, "step": 5033 }, { "epoch": 0.4644447007265598, "grad_norm": 1.5438028160684356, "learning_rate": 7.34682823049606e-07, "loss": 0.6673, "step": 5034 }, { "epoch": 0.4645369622880867, "grad_norm": 4.871030781022834, "learning_rate": 7.344975916105982e-07, "loss": 0.8547, "step": 5035 }, { "epoch": 0.4645369622880867, "eval_GEN Loss": 0.4546084702014923, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3676494359970093, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8586538434028625, "eval_runtime": 56.279, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 5035 }, { "epoch": 0.46462922384961364, "grad_norm": 1.5343028266558845, "learning_rate": 7.343123502487462e-07, "loss": 0.5158, "step": 5036 }, { "epoch": 0.4647214854111406, "grad_norm": 2.1405612714632016, "learning_rate": 7.341270989808369e-07, "loss": 0.8536, "step": 5037 }, { "epoch": 0.46481374697266753, "grad_norm": 1.8346968824684529, "learning_rate": 7.339418378236582e-07, "loss": 0.6444, "step": 5038 }, { "epoch": 0.46490600853419445, "grad_norm": 1.8217731434927098, "learning_rate": 7.337565667939986e-07, "loss": 0.5204, "step": 5039 }, { "epoch": 0.46499827009572137, "grad_norm": 2.00965647161763, "learning_rate": 7.335712859086477e-07, "loss": 0.5763, "step": 5040 }, { "epoch": 0.46499827009572137, "eval_GEN Loss": 0.45483699440956116, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3752996027469635, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8609976172447205, "eval_runtime": 56.9326, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5040 }, { "epoch": 0.4650905316572483, "grad_norm": 1.4407392729086983, "learning_rate": 7.333859951843961e-07, "loss": 0.5312, "step": 5041 }, { "epoch": 0.4651827932187752, "grad_norm": 3.0170753936874153, "learning_rate": 7.332006946380349e-07, "loss": 0.7523, "step": 5042 }, { "epoch": 0.4652750547803022, "grad_norm": 2.337011363403034, "learning_rate": 7.330153842863564e-07, "loss": 0.7113, "step": 5043 }, { "epoch": 0.4653673163418291, "grad_norm": 2.324311884644493, "learning_rate": 7.32830064146154e-07, "loss": 0.7147, "step": 5044 }, { "epoch": 0.465459577903356, "grad_norm": 2.811513151785612, "learning_rate": 7.326447342342213e-07, "loss": 0.793, "step": 5045 }, { "epoch": 0.465459577903356, "eval_GEN Loss": 0.454935222864151, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.37348663806915283, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8635817170143127, "eval_runtime": 57.3585, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 5045 }, { "epoch": 0.46555183946488293, "grad_norm": 3.2708127733930366, "learning_rate": 7.324593945673534e-07, "loss": 0.8651, "step": 5046 }, { "epoch": 0.46564410102640985, "grad_norm": 1.505502552154379, "learning_rate": 7.32274045162346e-07, "loss": 0.5853, "step": 5047 }, { "epoch": 0.4657363625879368, "grad_norm": 1.8062837518494395, "learning_rate": 7.320886860359957e-07, "loss": 0.6556, "step": 5048 }, { "epoch": 0.46582862414946374, "grad_norm": 1.818245222720958, "learning_rate": 7.319033172051003e-07, "loss": 0.6722, "step": 5049 }, { "epoch": 0.46592088571099066, "grad_norm": 1.8648658449301783, "learning_rate": 7.317179386864578e-07, "loss": 0.6746, "step": 5050 }, { "epoch": 0.46592088571099066, "eval_GEN Loss": 0.4539273679256439, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3722047507762909, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8698317408561707, "eval_runtime": 56.8782, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5050 }, { "epoch": 0.4660131472725176, "grad_norm": 2.2196674283474684, "learning_rate": 7.315325504968679e-07, "loss": 0.8624, "step": 5051 }, { "epoch": 0.4661054088340445, "grad_norm": 2.015022296503588, "learning_rate": 7.313471526531304e-07, "loss": 0.7873, "step": 5052 }, { "epoch": 0.4661976703955714, "grad_norm": 1.7687754303636722, "learning_rate": 7.311617451720468e-07, "loss": 0.5923, "step": 5053 }, { "epoch": 0.4662899319570984, "grad_norm": 2.7695579726561017, "learning_rate": 7.309763280704185e-07, "loss": 0.7969, "step": 5054 }, { "epoch": 0.4663821935186253, "grad_norm": 2.086311649772454, "learning_rate": 7.307909013650485e-07, "loss": 0.6385, "step": 5055 }, { "epoch": 0.4663821935186253, "eval_GEN Loss": 0.454171359539032, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.37217000126838684, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8818509578704834, "eval_runtime": 57.0836, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5055 }, { "epoch": 0.46647445508015223, "grad_norm": 2.423632088097247, "learning_rate": 7.306054650727408e-07, "loss": 0.7068, "step": 5056 }, { "epoch": 0.46656671664167915, "grad_norm": 2.8181258585146636, "learning_rate": 7.304200192102994e-07, "loss": 0.7914, "step": 5057 }, { "epoch": 0.46665897820320607, "grad_norm": 1.7320971750959886, "learning_rate": 7.302345637945301e-07, "loss": 0.7426, "step": 5058 }, { "epoch": 0.46675123976473304, "grad_norm": 1.8793704435233403, "learning_rate": 7.300490988422389e-07, "loss": 0.7716, "step": 5059 }, { "epoch": 0.46684350132625996, "grad_norm": 2.402469871242015, "learning_rate": 7.29863624370233e-07, "loss": 0.8563, "step": 5060 }, { "epoch": 0.46684350132625996, "eval_GEN Loss": 0.4526033103466034, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3724413216114044, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8876802921295166, "eval_runtime": 56.7141, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 5060 }, { "epoch": 0.4669357628877869, "grad_norm": 2.0657185880156765, "learning_rate": 7.296781403953204e-07, "loss": 0.7754, "step": 5061 }, { "epoch": 0.4670280244493138, "grad_norm": 2.313504391601341, "learning_rate": 7.2949264693431e-07, "loss": 0.8808, "step": 5062 }, { "epoch": 0.4671202860108407, "grad_norm": 2.2238607732103897, "learning_rate": 7.293071440040115e-07, "loss": 0.7532, "step": 5063 }, { "epoch": 0.4672125475723677, "grad_norm": 2.193863913937959, "learning_rate": 7.291216316212352e-07, "loss": 0.7969, "step": 5064 }, { "epoch": 0.4673048091338946, "grad_norm": 2.7591302238274067, "learning_rate": 7.289361098027929e-07, "loss": 0.9396, "step": 5065 }, { "epoch": 0.4673048091338946, "eval_GEN Loss": 0.4525662362575531, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3728674054145813, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.889723539352417, "eval_runtime": 56.806, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 5065 }, { "epoch": 0.4673970706954215, "grad_norm": 1.5936550803694347, "learning_rate": 7.287505785654967e-07, "loss": 0.7361, "step": 5066 }, { "epoch": 0.46748933225694844, "grad_norm": 2.7565690591040184, "learning_rate": 7.285650379261598e-07, "loss": 0.6908, "step": 5067 }, { "epoch": 0.46758159381847536, "grad_norm": 3.176072041387618, "learning_rate": 7.283794879015961e-07, "loss": 0.569, "step": 5068 }, { "epoch": 0.4676738553800023, "grad_norm": 2.0247784961820274, "learning_rate": 7.281939285086206e-07, "loss": 0.7417, "step": 5069 }, { "epoch": 0.46776611694152925, "grad_norm": 2.287330852521404, "learning_rate": 7.280083597640487e-07, "loss": 0.6428, "step": 5070 }, { "epoch": 0.46776611694152925, "eval_GEN Loss": 0.4507974088191986, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.37081706523895264, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.892848551273346, "eval_runtime": 57.2218, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 5070 }, { "epoch": 0.46785837850305617, "grad_norm": 1.787432744853157, "learning_rate": 7.278227816846973e-07, "loss": 0.6817, "step": 5071 }, { "epoch": 0.4679506400645831, "grad_norm": 2.2107821531372798, "learning_rate": 7.276371942873835e-07, "loss": 0.7092, "step": 5072 }, { "epoch": 0.46804290162611, "grad_norm": 1.3837364426466616, "learning_rate": 7.274515975889254e-07, "loss": 0.5814, "step": 5073 }, { "epoch": 0.4681351631876369, "grad_norm": 1.7985594531525406, "learning_rate": 7.272659916061425e-07, "loss": 0.8108, "step": 5074 }, { "epoch": 0.4682274247491639, "grad_norm": 1.9199106465870939, "learning_rate": 7.270803763558544e-07, "loss": 0.8308, "step": 5075 }, { "epoch": 0.4682274247491639, "eval_GEN Loss": 0.44933125376701355, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.37206703424453735, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8855769038200378, "eval_runtime": 56.9505, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5075 }, { "epoch": 0.4683196863106908, "grad_norm": 2.463455795698566, "learning_rate": 7.268947518548821e-07, "loss": 0.7697, "step": 5076 }, { "epoch": 0.46841194787221774, "grad_norm": 2.874404632500906, "learning_rate": 7.267091181200467e-07, "loss": 0.8153, "step": 5077 }, { "epoch": 0.46850420943374466, "grad_norm": 2.4923299863830546, "learning_rate": 7.265234751681711e-07, "loss": 0.7399, "step": 5078 }, { "epoch": 0.4685964709952716, "grad_norm": 1.5281997745911582, "learning_rate": 7.263378230160782e-07, "loss": 0.658, "step": 5079 }, { "epoch": 0.46868873255679855, "grad_norm": 1.7985456344737891, "learning_rate": 7.261521616805924e-07, "loss": 0.7047, "step": 5080 }, { "epoch": 0.46868873255679855, "eval_GEN Loss": 0.4491855800151825, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.37689054012298584, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8745793104171753, "eval_runtime": 56.9695, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5080 }, { "epoch": 0.46878099411832547, "grad_norm": 2.0913762851907363, "learning_rate": 7.259664911785386e-07, "loss": 0.6215, "step": 5081 }, { "epoch": 0.4688732556798524, "grad_norm": 1.5638629129034076, "learning_rate": 7.257808115267421e-07, "loss": 0.4873, "step": 5082 }, { "epoch": 0.4689655172413793, "grad_norm": 2.164702316827533, "learning_rate": 7.255951227420302e-07, "loss": 0.6571, "step": 5083 }, { "epoch": 0.4690577788029062, "grad_norm": 2.412829118144822, "learning_rate": 7.2540942484123e-07, "loss": 0.8016, "step": 5084 }, { "epoch": 0.46915004036443314, "grad_norm": 1.3096900701965073, "learning_rate": 7.252237178411695e-07, "loss": 0.4223, "step": 5085 }, { "epoch": 0.46915004036443314, "eval_GEN Loss": 0.44931694865226746, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.38048338890075684, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8737379908561707, "eval_runtime": 57.0819, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5085 }, { "epoch": 0.4692423019259601, "grad_norm": 1.948996004626328, "learning_rate": 7.250380017586778e-07, "loss": 0.6351, "step": 5086 }, { "epoch": 0.46933456348748703, "grad_norm": 1.8026106839660214, "learning_rate": 7.248522766105849e-07, "loss": 0.6097, "step": 5087 }, { "epoch": 0.46942682504901395, "grad_norm": 2.164064771988493, "learning_rate": 7.246665424137218e-07, "loss": 0.7806, "step": 5088 }, { "epoch": 0.46951908661054087, "grad_norm": 1.613706639959414, "learning_rate": 7.244807991849195e-07, "loss": 0.6596, "step": 5089 }, { "epoch": 0.4696113481720678, "grad_norm": 2.3712685183221525, "learning_rate": 7.242950469410107e-07, "loss": 0.7883, "step": 5090 }, { "epoch": 0.4696113481720678, "eval_GEN Loss": 0.4510478675365448, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38527318835258484, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8720552921295166, "eval_runtime": 56.8755, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5090 }, { "epoch": 0.46970360973359476, "grad_norm": 2.276037316259212, "learning_rate": 7.241092856988285e-07, "loss": 0.6113, "step": 5091 }, { "epoch": 0.4697958712951217, "grad_norm": 1.7068547107149992, "learning_rate": 7.239235154752068e-07, "loss": 0.618, "step": 5092 }, { "epoch": 0.4698881328566486, "grad_norm": 2.530119601417081, "learning_rate": 7.237377362869803e-07, "loss": 0.6887, "step": 5093 }, { "epoch": 0.4699803944181755, "grad_norm": 2.4407010639824707, "learning_rate": 7.235519481509849e-07, "loss": 0.6864, "step": 5094 }, { "epoch": 0.47007265597970244, "grad_norm": 1.7997938557305775, "learning_rate": 7.233661510840569e-07, "loss": 0.7253, "step": 5095 }, { "epoch": 0.47007265597970244, "eval_GEN Loss": 0.4525219798088074, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38727328181266785, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8754807710647583, "eval_runtime": 56.8761, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5095 }, { "epoch": 0.4701649175412294, "grad_norm": 2.211371195133455, "learning_rate": 7.231803451030333e-07, "loss": 0.6904, "step": 5096 }, { "epoch": 0.47025717910275633, "grad_norm": 2.0086818614357567, "learning_rate": 7.229945302247523e-07, "loss": 0.7053, "step": 5097 }, { "epoch": 0.47034944066428325, "grad_norm": 1.4113434575765516, "learning_rate": 7.228087064660526e-07, "loss": 0.4507, "step": 5098 }, { "epoch": 0.47044170222581017, "grad_norm": 1.398962836622668, "learning_rate": 7.226228738437742e-07, "loss": 0.5859, "step": 5099 }, { "epoch": 0.4705339637873371, "grad_norm": 1.4946768671069908, "learning_rate": 7.224370323747572e-07, "loss": 0.4889, "step": 5100 }, { "epoch": 0.4705339637873371, "eval_GEN Loss": 0.45279768109321594, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38907113671302795, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8787860870361328, "eval_runtime": 55.8832, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 5100 }, { "epoch": 0.470626225348864, "grad_norm": 2.3383201415241044, "learning_rate": 7.222511820758429e-07, "loss": 0.4256, "step": 5101 }, { "epoch": 0.470718486910391, "grad_norm": 1.79794722342997, "learning_rate": 7.220653229638735e-07, "loss": 0.7079, "step": 5102 }, { "epoch": 0.4708107484719179, "grad_norm": 3.171432883188932, "learning_rate": 7.218794550556918e-07, "loss": 0.8181, "step": 5103 }, { "epoch": 0.4709030100334448, "grad_norm": 2.208938669611532, "learning_rate": 7.216935783681413e-07, "loss": 0.8015, "step": 5104 }, { "epoch": 0.47099527159497173, "grad_norm": 2.153117180210697, "learning_rate": 7.215076929180665e-07, "loss": 0.71, "step": 5105 }, { "epoch": 0.47099527159497173, "eval_GEN Loss": 0.4537142515182495, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38435226678848267, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8871394395828247, "eval_runtime": 56.9305, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5105 }, { "epoch": 0.47108753315649865, "grad_norm": 2.220470581117704, "learning_rate": 7.213217987223127e-07, "loss": 0.5352, "step": 5106 }, { "epoch": 0.4711797947180256, "grad_norm": 2.032867880446119, "learning_rate": 7.211358957977259e-07, "loss": 0.6381, "step": 5107 }, { "epoch": 0.47127205627955254, "grad_norm": 2.0415010372873588, "learning_rate": 7.20949984161153e-07, "loss": 0.6994, "step": 5108 }, { "epoch": 0.47136431784107946, "grad_norm": 2.303231922389577, "learning_rate": 7.207640638294414e-07, "loss": 0.5732, "step": 5109 }, { "epoch": 0.4714565794026064, "grad_norm": 1.4978672085006846, "learning_rate": 7.205781348194396e-07, "loss": 0.5702, "step": 5110 }, { "epoch": 0.4714565794026064, "eval_GEN Loss": 0.4545291066169739, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3925088346004486, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8809494972229004, "eval_runtime": 57.1008, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 5110 }, { "epoch": 0.4715488409641333, "grad_norm": 1.4202900446675153, "learning_rate": 7.203921971479968e-07, "loss": 0.7645, "step": 5111 }, { "epoch": 0.47164110252566027, "grad_norm": 1.4239250838673285, "learning_rate": 7.202062508319628e-07, "loss": 0.4531, "step": 5112 }, { "epoch": 0.4717333640871872, "grad_norm": 2.1938255651255125, "learning_rate": 7.200202958881887e-07, "loss": 0.6896, "step": 5113 }, { "epoch": 0.4718256256487141, "grad_norm": 2.6117244888705877, "learning_rate": 7.198343323335257e-07, "loss": 0.7723, "step": 5114 }, { "epoch": 0.471917887210241, "grad_norm": 1.5317893098235305, "learning_rate": 7.196483601848262e-07, "loss": 0.4548, "step": 5115 }, { "epoch": 0.471917887210241, "eval_GEN Loss": 0.45550304651260376, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.39157402515411377, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8848557472229004, "eval_runtime": 56.978, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5115 }, { "epoch": 0.47201014877176795, "grad_norm": 1.9377004210644144, "learning_rate": 7.194623794589434e-07, "loss": 0.6559, "step": 5116 }, { "epoch": 0.47210241033329486, "grad_norm": 1.828466470272906, "learning_rate": 7.192763901727312e-07, "loss": 0.7857, "step": 5117 }, { "epoch": 0.47219467189482184, "grad_norm": 1.5361180199722646, "learning_rate": 7.190903923430439e-07, "loss": 0.6142, "step": 5118 }, { "epoch": 0.47228693345634876, "grad_norm": 1.7745590042597699, "learning_rate": 7.189043859867373e-07, "loss": 0.6132, "step": 5119 }, { "epoch": 0.4723791950178757, "grad_norm": 2.226042914514901, "learning_rate": 7.187183711206674e-07, "loss": 0.8591, "step": 5120 }, { "epoch": 0.4723791950178757, "eval_GEN Loss": 0.4559136629104614, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.40007543563842773, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8827524185180664, "eval_runtime": 56.8679, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5120 }, { "epoch": 0.4724714565794026, "grad_norm": 2.620935302288477, "learning_rate": 7.185323477616912e-07, "loss": 0.7482, "step": 5121 }, { "epoch": 0.4725637181409295, "grad_norm": 1.6450529327033225, "learning_rate": 7.183463159266666e-07, "loss": 0.6573, "step": 5122 }, { "epoch": 0.4726559797024565, "grad_norm": 2.352858416292999, "learning_rate": 7.181602756324515e-07, "loss": 0.9948, "step": 5123 }, { "epoch": 0.4727482412639834, "grad_norm": 1.7865987241169718, "learning_rate": 7.17974226895906e-07, "loss": 0.6848, "step": 5124 }, { "epoch": 0.4728405028255103, "grad_norm": 1.7123959014992016, "learning_rate": 7.177881697338894e-07, "loss": 0.6813, "step": 5125 }, { "epoch": 0.4728405028255103, "eval_GEN Loss": 0.4559193551540375, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4114290177822113, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8768630027770996, "eval_runtime": 57.0534, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5125 }, { "epoch": 0.47293276438703724, "grad_norm": 2.04663881539211, "learning_rate": 7.176021041632631e-07, "loss": 0.7118, "step": 5126 }, { "epoch": 0.47302502594856416, "grad_norm": 2.6776198243205966, "learning_rate": 7.174160302008881e-07, "loss": 0.6973, "step": 5127 }, { "epoch": 0.47311728751009113, "grad_norm": 1.6418948160744598, "learning_rate": 7.172299478636271e-07, "loss": 0.6213, "step": 5128 }, { "epoch": 0.47320954907161805, "grad_norm": 2.8690272079941255, "learning_rate": 7.17043857168343e-07, "loss": 0.7417, "step": 5129 }, { "epoch": 0.47330181063314497, "grad_norm": 1.1993464845017578, "learning_rate": 7.168577581318997e-07, "loss": 0.5456, "step": 5130 }, { "epoch": 0.47330181063314497, "eval_GEN Loss": 0.4547041654586792, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41597992181777954, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8706430196762085, "eval_runtime": 57.0273, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5130 }, { "epoch": 0.4733940721946719, "grad_norm": 1.9465517463727136, "learning_rate": 7.16671650771162e-07, "loss": 0.8358, "step": 5131 }, { "epoch": 0.4734863337561988, "grad_norm": 1.8268278784790175, "learning_rate": 7.164855351029946e-07, "loss": 0.715, "step": 5132 }, { "epoch": 0.4735785953177257, "grad_norm": 2.0052176556492154, "learning_rate": 7.162994111442643e-07, "loss": 0.6842, "step": 5133 }, { "epoch": 0.4736708568792527, "grad_norm": 2.4355445122472745, "learning_rate": 7.161132789118376e-07, "loss": 0.8427, "step": 5134 }, { "epoch": 0.4737631184407796, "grad_norm": 2.3282268279173244, "learning_rate": 7.159271384225822e-07, "loss": 0.6944, "step": 5135 }, { "epoch": 0.4737631184407796, "eval_GEN Loss": 0.4557361602783203, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4122553765773773, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8661658763885498, "eval_runtime": 56.977, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5135 }, { "epoch": 0.47385538000230654, "grad_norm": 1.6230923484554836, "learning_rate": 7.157409896933662e-07, "loss": 0.513, "step": 5136 }, { "epoch": 0.47394764156383345, "grad_norm": 2.2480729691934465, "learning_rate": 7.155548327410589e-07, "loss": 0.7338, "step": 5137 }, { "epoch": 0.4740399031253604, "grad_norm": 2.0887636152064255, "learning_rate": 7.153686675825303e-07, "loss": 0.8269, "step": 5138 }, { "epoch": 0.47413216468688735, "grad_norm": 1.745936403040148, "learning_rate": 7.151824942346506e-07, "loss": 0.7087, "step": 5139 }, { "epoch": 0.47422442624841427, "grad_norm": 2.0170746844200753, "learning_rate": 7.149963127142916e-07, "loss": 0.7581, "step": 5140 }, { "epoch": 0.47422442624841427, "eval_GEN Loss": 0.454622745513916, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3961091935634613, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8699519038200378, "eval_runtime": 57.3264, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 5140 }, { "epoch": 0.4743166878099412, "grad_norm": 2.3863603030959357, "learning_rate": 7.148101230383249e-07, "loss": 0.7058, "step": 5141 }, { "epoch": 0.4744089493714681, "grad_norm": 1.9004999377579204, "learning_rate": 7.146239252236236e-07, "loss": 0.7619, "step": 5142 }, { "epoch": 0.474501210932995, "grad_norm": 3.6732319229582657, "learning_rate": 7.144377192870611e-07, "loss": 0.9118, "step": 5143 }, { "epoch": 0.474593472494522, "grad_norm": 1.7264576270023173, "learning_rate": 7.142515052455115e-07, "loss": 0.6357, "step": 5144 }, { "epoch": 0.4746857340560489, "grad_norm": 2.359619777938543, "learning_rate": 7.140652831158502e-07, "loss": 0.5823, "step": 5145 }, { "epoch": 0.4746857340560489, "eval_GEN Loss": 0.45397472381591797, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3940119743347168, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8619591593742371, "eval_runtime": 57.0116, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5145 }, { "epoch": 0.47477799561757583, "grad_norm": 1.6106076421255604, "learning_rate": 7.138790529149527e-07, "loss": 0.7212, "step": 5146 }, { "epoch": 0.47487025717910275, "grad_norm": 2.0259306344925423, "learning_rate": 7.136928146596955e-07, "loss": 0.6053, "step": 5147 }, { "epoch": 0.47496251874062967, "grad_norm": 1.6065960512544113, "learning_rate": 7.135065683669559e-07, "loss": 0.6733, "step": 5148 }, { "epoch": 0.4750547803021566, "grad_norm": 1.444029212159895, "learning_rate": 7.133203140536119e-07, "loss": 0.5625, "step": 5149 }, { "epoch": 0.47514704186368356, "grad_norm": 1.4843418653644926, "learning_rate": 7.131340517365416e-07, "loss": 0.5783, "step": 5150 }, { "epoch": 0.47514704186368356, "eval_GEN Loss": 0.4531204104423523, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38726702332496643, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8589242696762085, "eval_runtime": 56.9574, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5150 }, { "epoch": 0.4752393034252105, "grad_norm": 1.5817808742086008, "learning_rate": 7.129477814326252e-07, "loss": 0.5946, "step": 5151 }, { "epoch": 0.4753315649867374, "grad_norm": 1.460580481807368, "learning_rate": 7.127615031587422e-07, "loss": 0.4786, "step": 5152 }, { "epoch": 0.4754238265482643, "grad_norm": 1.3479219163336957, "learning_rate": 7.125752169317738e-07, "loss": 0.6951, "step": 5153 }, { "epoch": 0.47551608810979124, "grad_norm": 2.3794729109811437, "learning_rate": 7.123889227686012e-07, "loss": 0.5835, "step": 5154 }, { "epoch": 0.4756083496713182, "grad_norm": 1.442657015355961, "learning_rate": 7.122026206861071e-07, "loss": 0.642, "step": 5155 }, { "epoch": 0.4756083496713182, "eval_GEN Loss": 0.4528181850910187, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38641172647476196, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8630709052085876, "eval_runtime": 57.1138, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 5155 }, { "epoch": 0.4757006112328451, "grad_norm": 2.7190006837188876, "learning_rate": 7.120163107011742e-07, "loss": 0.6531, "step": 5156 }, { "epoch": 0.47579287279437205, "grad_norm": 1.9709544623185276, "learning_rate": 7.118299928306861e-07, "loss": 0.7453, "step": 5157 }, { "epoch": 0.47588513435589896, "grad_norm": 2.6801911887485454, "learning_rate": 7.116436670915275e-07, "loss": 0.8869, "step": 5158 }, { "epoch": 0.4759773959174259, "grad_norm": 1.7750062814924263, "learning_rate": 7.114573335005833e-07, "loss": 0.652, "step": 5159 }, { "epoch": 0.47606965747895286, "grad_norm": 2.3567181828796664, "learning_rate": 7.112709920747396e-07, "loss": 0.9111, "step": 5160 }, { "epoch": 0.47606965747895286, "eval_GEN Loss": 0.45227521657943726, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3909215033054352, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8601862788200378, "eval_runtime": 56.9395, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5160 }, { "epoch": 0.4761619190404798, "grad_norm": 2.194198177977186, "learning_rate": 7.110846428308827e-07, "loss": 0.7354, "step": 5161 }, { "epoch": 0.4762541806020067, "grad_norm": 2.187742195631896, "learning_rate": 7.108982857858999e-07, "loss": 0.6999, "step": 5162 }, { "epoch": 0.4763464421635336, "grad_norm": 2.587428140092144, "learning_rate": 7.107119209566795e-07, "loss": 0.7428, "step": 5163 }, { "epoch": 0.47643870372506053, "grad_norm": 2.19618091416778, "learning_rate": 7.105255483601096e-07, "loss": 0.6541, "step": 5164 }, { "epoch": 0.47653096528658745, "grad_norm": 2.531905122440746, "learning_rate": 7.103391680130802e-07, "loss": 0.5322, "step": 5165 }, { "epoch": 0.47653096528658745, "eval_GEN Loss": 0.4539846181869507, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3947306275367737, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8542067408561707, "eval_runtime": 57.1469, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 5165 }, { "epoch": 0.4766232268481144, "grad_norm": 1.3711006996310622, "learning_rate": 7.10152779932481e-07, "loss": 0.5025, "step": 5166 }, { "epoch": 0.47671548840964134, "grad_norm": 1.8268291181931455, "learning_rate": 7.099663841352028e-07, "loss": 0.7869, "step": 5167 }, { "epoch": 0.47680774997116826, "grad_norm": 1.4220976902649436, "learning_rate": 7.097799806381369e-07, "loss": 0.691, "step": 5168 }, { "epoch": 0.4769000115326952, "grad_norm": 1.463257449346647, "learning_rate": 7.09593569458176e-07, "loss": 0.484, "step": 5169 }, { "epoch": 0.4769922730942221, "grad_norm": 1.6085475289980447, "learning_rate": 7.094071506122126e-07, "loss": 0.694, "step": 5170 }, { "epoch": 0.4769922730942221, "eval_GEN Loss": 0.45384788513183594, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.400400310754776, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.852734386920929, "eval_runtime": 57.029, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5170 }, { "epoch": 0.47708453465574907, "grad_norm": 1.4325758806418858, "learning_rate": 7.092207241171403e-07, "loss": 0.4627, "step": 5171 }, { "epoch": 0.477176796217276, "grad_norm": 2.492623663285177, "learning_rate": 7.090342899898535e-07, "loss": 0.7547, "step": 5172 }, { "epoch": 0.4772690577788029, "grad_norm": 2.29572195626681, "learning_rate": 7.088478482472469e-07, "loss": 0.7318, "step": 5173 }, { "epoch": 0.4773613193403298, "grad_norm": 2.010808233941498, "learning_rate": 7.086613989062166e-07, "loss": 0.7228, "step": 5174 }, { "epoch": 0.47745358090185674, "grad_norm": 2.1544330380469705, "learning_rate": 7.084749419836584e-07, "loss": 0.7485, "step": 5175 }, { "epoch": 0.47745358090185674, "eval_GEN Loss": 0.4545189440250397, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.40309926867485046, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8510516881942749, "eval_runtime": 56.8987, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5175 }, { "epoch": 0.4775458424633837, "grad_norm": 2.6601106642280774, "learning_rate": 7.082884774964695e-07, "loss": 0.8032, "step": 5176 }, { "epoch": 0.47763810402491064, "grad_norm": 2.007433127821485, "learning_rate": 7.08102005461548e-07, "loss": 0.5858, "step": 5177 }, { "epoch": 0.47773036558643756, "grad_norm": 1.4918198081790441, "learning_rate": 7.079155258957918e-07, "loss": 0.5138, "step": 5178 }, { "epoch": 0.4778226271479645, "grad_norm": 2.163007234531863, "learning_rate": 7.077290388161002e-07, "loss": 0.6594, "step": 5179 }, { "epoch": 0.4779148887094914, "grad_norm": 1.4897017291948196, "learning_rate": 7.075425442393726e-07, "loss": 0.4628, "step": 5180 }, { "epoch": 0.4779148887094914, "eval_GEN Loss": 0.4547669291496277, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.4033930003643036, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8590144515037537, "eval_runtime": 57.2548, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 5180 }, { "epoch": 0.4780071502710183, "grad_norm": 1.9258626212556063, "learning_rate": 7.0735604218251e-07, "loss": 0.6087, "step": 5181 }, { "epoch": 0.4780994118325453, "grad_norm": 2.28974034251776, "learning_rate": 7.071695326624131e-07, "loss": 0.8241, "step": 5182 }, { "epoch": 0.4781916733940722, "grad_norm": 1.9451768134183076, "learning_rate": 7.06983015695984e-07, "loss": 0.6111, "step": 5183 }, { "epoch": 0.4782839349555991, "grad_norm": 1.7855982553106744, "learning_rate": 7.067964913001248e-07, "loss": 0.6938, "step": 5184 }, { "epoch": 0.47837619651712604, "grad_norm": 2.647037022700238, "learning_rate": 7.066099594917386e-07, "loss": 0.7507, "step": 5185 }, { "epoch": 0.47837619651712604, "eval_GEN Loss": 0.45579272508621216, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.39723771810531616, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8635216355323792, "eval_runtime": 57.1465, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 5185 }, { "epoch": 0.47846845807865296, "grad_norm": 1.776777841316948, "learning_rate": 7.064234202877299e-07, "loss": 0.5116, "step": 5186 }, { "epoch": 0.47856071964017993, "grad_norm": 2.620251845163259, "learning_rate": 7.062368737050023e-07, "loss": 0.7962, "step": 5187 }, { "epoch": 0.47865298120170685, "grad_norm": 2.2445756250721667, "learning_rate": 7.060503197604615e-07, "loss": 0.8248, "step": 5188 }, { "epoch": 0.47874524276323377, "grad_norm": 1.4831656885723061, "learning_rate": 7.058637584710132e-07, "loss": 0.5301, "step": 5189 }, { "epoch": 0.4788375043247607, "grad_norm": 1.779821887123542, "learning_rate": 7.056771898535637e-07, "loss": 0.6972, "step": 5190 }, { "epoch": 0.4788375043247607, "eval_GEN Loss": 0.45584121346473694, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3892309069633484, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.864182710647583, "eval_runtime": 56.393, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 5190 }, { "epoch": 0.4789297658862876, "grad_norm": 2.492927688323933, "learning_rate": 7.054906139250203e-07, "loss": 0.8204, "step": 5191 }, { "epoch": 0.4790220274478146, "grad_norm": 1.7765893379252926, "learning_rate": 7.053040307022908e-07, "loss": 0.6122, "step": 5192 }, { "epoch": 0.4791142890093415, "grad_norm": 1.9918833157583509, "learning_rate": 7.051174402022836e-07, "loss": 0.8381, "step": 5193 }, { "epoch": 0.4792065505708684, "grad_norm": 2.711561464201588, "learning_rate": 7.04930842441908e-07, "loss": 0.8139, "step": 5194 }, { "epoch": 0.47929881213239534, "grad_norm": 1.9574358701621304, "learning_rate": 7.047442374380735e-07, "loss": 0.9135, "step": 5195 }, { "epoch": 0.47929881213239534, "eval_GEN Loss": 0.45503878593444824, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3805941045284271, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8561298251152039, "eval_runtime": 57.2169, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 5195 }, { "epoch": 0.47939107369392225, "grad_norm": 1.6285532549314672, "learning_rate": 7.045576252076906e-07, "loss": 0.5365, "step": 5196 }, { "epoch": 0.4794833352554492, "grad_norm": 1.9037082434030226, "learning_rate": 7.043710057676708e-07, "loss": 0.7226, "step": 5197 }, { "epoch": 0.47957559681697615, "grad_norm": 2.9557749614441087, "learning_rate": 7.041843791349252e-07, "loss": 0.7866, "step": 5198 }, { "epoch": 0.47966785837850306, "grad_norm": 2.0333084216099566, "learning_rate": 7.039977453263668e-07, "loss": 0.7874, "step": 5199 }, { "epoch": 0.47976011994003, "grad_norm": 2.424506833445163, "learning_rate": 7.038111043589082e-07, "loss": 0.6121, "step": 5200 }, { "epoch": 0.47976011994003, "eval_GEN Loss": 0.4545009434223175, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3824561834335327, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8465144038200378, "eval_runtime": 55.9585, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5200 }, { "epoch": 0.4798523815015569, "grad_norm": 2.5559351598451663, "learning_rate": 7.036244562494632e-07, "loss": 0.7845, "step": 5201 }, { "epoch": 0.4799446430630838, "grad_norm": 2.2314949555685524, "learning_rate": 7.034378010149464e-07, "loss": 0.8598, "step": 5202 }, { "epoch": 0.4800369046246108, "grad_norm": 1.771406660320865, "learning_rate": 7.032511386722725e-07, "loss": 0.6033, "step": 5203 }, { "epoch": 0.4801291661861377, "grad_norm": 1.6293935945849385, "learning_rate": 7.030644692383574e-07, "loss": 0.6703, "step": 5204 }, { "epoch": 0.48022142774766463, "grad_norm": 2.3459462350856515, "learning_rate": 7.02877792730117e-07, "loss": 0.7753, "step": 5205 }, { "epoch": 0.48022142774766463, "eval_GEN Loss": 0.45547547936439514, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.38673368096351624, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8392428159713745, "eval_runtime": 56.3321, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 5205 }, { "epoch": 0.48031368930919155, "grad_norm": 2.0476417457635625, "learning_rate": 7.026911091644685e-07, "loss": 0.5857, "step": 5206 }, { "epoch": 0.48040595087071847, "grad_norm": 2.6130898361690718, "learning_rate": 7.025044185583294e-07, "loss": 0.7884, "step": 5207 }, { "epoch": 0.48049821243224544, "grad_norm": 2.7280461669377836, "learning_rate": 7.02317720928618e-07, "loss": 0.8181, "step": 5208 }, { "epoch": 0.48059047399377236, "grad_norm": 1.9592728889141435, "learning_rate": 7.021310162922529e-07, "loss": 0.4972, "step": 5209 }, { "epoch": 0.4806827355552993, "grad_norm": 1.608124517285177, "learning_rate": 7.019443046661536e-07, "loss": 0.704, "step": 5210 }, { "epoch": 0.4806827355552993, "eval_GEN Loss": 0.45613721013069153, "eval_GEN top-5 accuracy": 0.9802718106093818, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3874301612377167, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8382211327552795, "eval_runtime": 56.94, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5210 }, { "epoch": 0.4807749971168262, "grad_norm": 1.5230859080244517, "learning_rate": 7.017575860672405e-07, "loss": 0.7766, "step": 5211 }, { "epoch": 0.4808672586783531, "grad_norm": 1.9267952241297335, "learning_rate": 7.015708605124341e-07, "loss": 0.7211, "step": 5212 }, { "epoch": 0.48095952023988003, "grad_norm": 1.4519094395938636, "learning_rate": 7.013841280186559e-07, "loss": 0.5166, "step": 5213 }, { "epoch": 0.481051781801407, "grad_norm": 2.3445278078078173, "learning_rate": 7.011973886028276e-07, "loss": 0.7989, "step": 5214 }, { "epoch": 0.4811440433629339, "grad_norm": 1.691756769115954, "learning_rate": 7.010106422818721e-07, "loss": 0.5971, "step": 5215 }, { "epoch": 0.4811440433629339, "eval_GEN Loss": 0.4556802809238434, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.38873884081840515, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8487980961799622, "eval_runtime": 56.8543, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5215 }, { "epoch": 0.48123630492446084, "grad_norm": 1.802999799757807, "learning_rate": 7.008238890727126e-07, "loss": 0.5515, "step": 5216 }, { "epoch": 0.48132856648598776, "grad_norm": 1.8219936925582225, "learning_rate": 7.006371289922729e-07, "loss": 0.6504, "step": 5217 }, { "epoch": 0.4814208280475147, "grad_norm": 2.355122805261264, "learning_rate": 7.004503620574774e-07, "loss": 0.5954, "step": 5218 }, { "epoch": 0.48151308960904166, "grad_norm": 2.379794620209546, "learning_rate": 7.002635882852514e-07, "loss": 0.8481, "step": 5219 }, { "epoch": 0.4816053511705686, "grad_norm": 1.90758756145585, "learning_rate": 7.000768076925206e-07, "loss": 0.6619, "step": 5220 }, { "epoch": 0.4816053511705686, "eval_GEN Loss": 0.4542737901210785, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3854510486125946, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8481971025466919, "eval_runtime": 57.0533, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5220 }, { "epoch": 0.4816976127320955, "grad_norm": 3.0051105138458714, "learning_rate": 6.998900202962112e-07, "loss": 1.0516, "step": 5221 }, { "epoch": 0.4817898742936224, "grad_norm": 2.7415948732632804, "learning_rate": 6.997032261132504e-07, "loss": 0.8773, "step": 5222 }, { "epoch": 0.48188213585514933, "grad_norm": 2.258862406169709, "learning_rate": 6.995164251605656e-07, "loss": 0.6689, "step": 5223 }, { "epoch": 0.4819743974166763, "grad_norm": 2.1954831673549444, "learning_rate": 6.993296174550851e-07, "loss": 0.6622, "step": 5224 }, { "epoch": 0.4820666589782032, "grad_norm": 1.8295149116691556, "learning_rate": 6.991428030137378e-07, "loss": 0.635, "step": 5225 }, { "epoch": 0.4820666589782032, "eval_GEN Loss": 0.45466727018356323, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3981640338897705, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8440504670143127, "eval_runtime": 56.9997, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5225 }, { "epoch": 0.48215892053973014, "grad_norm": 2.179482741930736, "learning_rate": 6.989559818534528e-07, "loss": 0.585, "step": 5226 }, { "epoch": 0.48225118210125706, "grad_norm": 2.275504388013781, "learning_rate": 6.987691539911604e-07, "loss": 0.8416, "step": 5227 }, { "epoch": 0.482343443662784, "grad_norm": 4.377120183949515, "learning_rate": 6.98582319443791e-07, "loss": 0.828, "step": 5228 }, { "epoch": 0.4824357052243109, "grad_norm": 2.358082474145734, "learning_rate": 6.983954782282762e-07, "loss": 0.7529, "step": 5229 }, { "epoch": 0.48252796678583787, "grad_norm": 1.837887386840773, "learning_rate": 6.982086303615474e-07, "loss": 0.6731, "step": 5230 }, { "epoch": 0.48252796678583787, "eval_GEN Loss": 0.4544956088066101, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.41106152534484863, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8397235870361328, "eval_runtime": 56.972, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5230 }, { "epoch": 0.4826202283473648, "grad_norm": 2.1499456058806854, "learning_rate": 6.980217758605376e-07, "loss": 0.67, "step": 5231 }, { "epoch": 0.4827124899088917, "grad_norm": 1.9579157896174768, "learning_rate": 6.978349147421792e-07, "loss": 0.517, "step": 5232 }, { "epoch": 0.4828047514704186, "grad_norm": 1.593411874212292, "learning_rate": 6.976480470234064e-07, "loss": 0.6599, "step": 5233 }, { "epoch": 0.48289701303194554, "grad_norm": 2.4090608036087646, "learning_rate": 6.974611727211532e-07, "loss": 0.7177, "step": 5234 }, { "epoch": 0.4829892745934725, "grad_norm": 1.8910307830148436, "learning_rate": 6.972742918523543e-07, "loss": 0.6528, "step": 5235 }, { "epoch": 0.4829892745934725, "eval_GEN Loss": 0.45305076241493225, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.4001941382884979, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8360576629638672, "eval_runtime": 57.0692, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5235 }, { "epoch": 0.48308153615499944, "grad_norm": 1.6775285133926343, "learning_rate": 6.970874044339456e-07, "loss": 0.6113, "step": 5236 }, { "epoch": 0.48317379771652635, "grad_norm": 1.7670550664090225, "learning_rate": 6.969005104828628e-07, "loss": 0.6992, "step": 5237 }, { "epoch": 0.4832660592780533, "grad_norm": 2.3591351876350544, "learning_rate": 6.967136100160423e-07, "loss": 0.8459, "step": 5238 }, { "epoch": 0.4833583208395802, "grad_norm": 1.7154889733433574, "learning_rate": 6.965267030504218e-07, "loss": 0.6989, "step": 5239 }, { "epoch": 0.48345058240110717, "grad_norm": 1.7899312131087537, "learning_rate": 6.963397896029389e-07, "loss": 0.7776, "step": 5240 }, { "epoch": 0.48345058240110717, "eval_GEN Loss": 0.45219671726226807, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3848111629486084, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.825901448726654, "eval_runtime": 57.3464, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 5240 }, { "epoch": 0.4835428439626341, "grad_norm": 1.6626219442429087, "learning_rate": 6.961528696905319e-07, "loss": 0.4935, "step": 5241 }, { "epoch": 0.483635105524161, "grad_norm": 1.9741679459119226, "learning_rate": 6.959659433301398e-07, "loss": 0.7495, "step": 5242 }, { "epoch": 0.4837273670856879, "grad_norm": 2.0565465955960684, "learning_rate": 6.957790105387023e-07, "loss": 0.768, "step": 5243 }, { "epoch": 0.48381962864721484, "grad_norm": 1.6202149805079193, "learning_rate": 6.955920713331593e-07, "loss": 0.5754, "step": 5244 }, { "epoch": 0.48391189020874176, "grad_norm": 2.096721738680497, "learning_rate": 6.95405125730452e-07, "loss": 0.6087, "step": 5245 }, { "epoch": 0.48391189020874176, "eval_GEN Loss": 0.44955992698669434, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36730650067329407, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8174278736114502, "eval_runtime": 56.8954, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5245 }, { "epoch": 0.48400415177026873, "grad_norm": 2.068915987831929, "learning_rate": 6.952181737475211e-07, "loss": 0.7889, "step": 5246 }, { "epoch": 0.48409641333179565, "grad_norm": 3.8325826876473013, "learning_rate": 6.950312154013089e-07, "loss": 1.0302, "step": 5247 }, { "epoch": 0.48418867489332257, "grad_norm": 1.9637459727397324, "learning_rate": 6.948442507087576e-07, "loss": 0.6689, "step": 5248 }, { "epoch": 0.4842809364548495, "grad_norm": 2.762891364446571, "learning_rate": 6.946572796868104e-07, "loss": 0.8855, "step": 5249 }, { "epoch": 0.4843731980163764, "grad_norm": 2.1530391528433257, "learning_rate": 6.944703023524112e-07, "loss": 0.6426, "step": 5250 }, { "epoch": 0.4843731980163764, "eval_GEN Loss": 0.4485835134983063, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36420589685440063, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8185096383094788, "eval_runtime": 56.9424, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5250 }, { "epoch": 0.4844654595779034, "grad_norm": 2.0008509803524825, "learning_rate": 6.942833187225034e-07, "loss": 0.824, "step": 5251 }, { "epoch": 0.4845577211394303, "grad_norm": 1.960311753148518, "learning_rate": 6.940963288140325e-07, "loss": 0.7545, "step": 5252 }, { "epoch": 0.4846499827009572, "grad_norm": 1.3413756549474434, "learning_rate": 6.939093326439434e-07, "loss": 0.5284, "step": 5253 }, { "epoch": 0.48474224426248413, "grad_norm": 1.9894747202957694, "learning_rate": 6.937223302291822e-07, "loss": 0.7973, "step": 5254 }, { "epoch": 0.48483450582401105, "grad_norm": 1.759063512480689, "learning_rate": 6.935353215866951e-07, "loss": 0.6741, "step": 5255 }, { "epoch": 0.48483450582401105, "eval_GEN Loss": 0.4480225443840027, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36728835105895996, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8156850934028625, "eval_runtime": 57.2178, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 5255 }, { "epoch": 0.484926767385538, "grad_norm": 1.491915891124898, "learning_rate": 6.933483067334294e-07, "loss": 0.5801, "step": 5256 }, { "epoch": 0.48501902894706495, "grad_norm": 2.0845843025329245, "learning_rate": 6.931612856863325e-07, "loss": 0.6767, "step": 5257 }, { "epoch": 0.48511129050859186, "grad_norm": 1.5642273161958855, "learning_rate": 6.929742584623525e-07, "loss": 0.5683, "step": 5258 }, { "epoch": 0.4852035520701188, "grad_norm": 2.5893263445624237, "learning_rate": 6.927872250784384e-07, "loss": 0.6369, "step": 5259 }, { "epoch": 0.4852958136316457, "grad_norm": 1.2458234380785356, "learning_rate": 6.926001855515393e-07, "loss": 0.5813, "step": 5260 }, { "epoch": 0.4852958136316457, "eval_GEN Loss": 0.4472184181213379, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3686789274215698, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8165264129638672, "eval_runtime": 56.9367, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5260 }, { "epoch": 0.4853880751931726, "grad_norm": 1.581440521752215, "learning_rate": 6.92413139898605e-07, "loss": 0.786, "step": 5261 }, { "epoch": 0.4854803367546996, "grad_norm": 1.5327262570013092, "learning_rate": 6.922260881365856e-07, "loss": 0.5722, "step": 5262 }, { "epoch": 0.4855725983162265, "grad_norm": 1.4168198725177674, "learning_rate": 6.920390302824326e-07, "loss": 0.6875, "step": 5263 }, { "epoch": 0.48566485987775343, "grad_norm": 2.422176650756517, "learning_rate": 6.918519663530969e-07, "loss": 0.6631, "step": 5264 }, { "epoch": 0.48575712143928035, "grad_norm": 1.7701288755458642, "learning_rate": 6.916648963655307e-07, "loss": 0.7341, "step": 5265 }, { "epoch": 0.48575712143928035, "eval_GEN Loss": 0.4470852017402649, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3640540540218353, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8079326748847961, "eval_runtime": 56.8738, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5265 }, { "epoch": 0.48584938300080727, "grad_norm": 1.7090349597529397, "learning_rate": 6.914778203366869e-07, "loss": 0.7307, "step": 5266 }, { "epoch": 0.48594164456233424, "grad_norm": 2.779896632306925, "learning_rate": 6.912907382835183e-07, "loss": 0.8955, "step": 5267 }, { "epoch": 0.48603390612386116, "grad_norm": 2.20005024888692, "learning_rate": 6.911036502229787e-07, "loss": 0.5906, "step": 5268 }, { "epoch": 0.4861261676853881, "grad_norm": 2.1280670399395465, "learning_rate": 6.909165561720222e-07, "loss": 0.8027, "step": 5269 }, { "epoch": 0.486218429246915, "grad_norm": 1.6687512000626807, "learning_rate": 6.907294561476037e-07, "loss": 0.6215, "step": 5270 }, { "epoch": 0.486218429246915, "eval_GEN Loss": 0.4470643103122711, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3521527647972107, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8014423251152039, "eval_runtime": 56.7835, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 5270 }, { "epoch": 0.4863106908084419, "grad_norm": 2.2499979855580134, "learning_rate": 6.905423501666783e-07, "loss": 0.7928, "step": 5271 }, { "epoch": 0.4864029523699689, "grad_norm": 1.992079898857959, "learning_rate": 6.90355238246202e-07, "loss": 0.6365, "step": 5272 }, { "epoch": 0.4864952139314958, "grad_norm": 1.4559410529854675, "learning_rate": 6.901681204031313e-07, "loss": 0.7427, "step": 5273 }, { "epoch": 0.4865874754930227, "grad_norm": 2.067170454428522, "learning_rate": 6.899809966544227e-07, "loss": 0.7457, "step": 5274 }, { "epoch": 0.48667973705454964, "grad_norm": 1.6369716772006289, "learning_rate": 6.897938670170341e-07, "loss": 0.7078, "step": 5275 }, { "epoch": 0.48667973705454964, "eval_GEN Loss": 0.4474409520626068, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34140706062316895, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7974759340286255, "eval_runtime": 56.8206, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 5275 }, { "epoch": 0.48677199861607656, "grad_norm": 1.4788365121185179, "learning_rate": 6.896067315079232e-07, "loss": 0.6799, "step": 5276 }, { "epoch": 0.4868642601776035, "grad_norm": 2.1363573710573203, "learning_rate": 6.894195901440487e-07, "loss": 0.5151, "step": 5277 }, { "epoch": 0.48695652173913045, "grad_norm": 1.8554383469279967, "learning_rate": 6.892324429423693e-07, "loss": 0.7398, "step": 5278 }, { "epoch": 0.4870487833006574, "grad_norm": 1.6473985297077354, "learning_rate": 6.890452899198451e-07, "loss": 0.6842, "step": 5279 }, { "epoch": 0.4871410448621843, "grad_norm": 3.1026351804226437, "learning_rate": 6.888581310934357e-07, "loss": 0.7763, "step": 5280 }, { "epoch": 0.4871410448621843, "eval_GEN Loss": 0.4462141692638397, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34138959646224976, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7909255027770996, "eval_runtime": 56.9441, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5280 }, { "epoch": 0.4872333064237112, "grad_norm": 1.6365805040511665, "learning_rate": 6.88670966480102e-07, "loss": 0.7779, "step": 5281 }, { "epoch": 0.48732556798523813, "grad_norm": 2.12076730473845, "learning_rate": 6.884837960968052e-07, "loss": 0.7995, "step": 5282 }, { "epoch": 0.4874178295467651, "grad_norm": 2.363166860900109, "learning_rate": 6.882966199605068e-07, "loss": 0.5774, "step": 5283 }, { "epoch": 0.487510091108292, "grad_norm": 1.6241267104316373, "learning_rate": 6.881094380881691e-07, "loss": 0.6776, "step": 5284 }, { "epoch": 0.48760235266981894, "grad_norm": 2.0364138614679925, "learning_rate": 6.879222504967548e-07, "loss": 0.576, "step": 5285 }, { "epoch": 0.48760235266981894, "eval_GEN Loss": 0.44705772399902344, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.35496506094932556, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7960336804389954, "eval_runtime": 56.9523, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5285 }, { "epoch": 0.48769461423134586, "grad_norm": 2.635721145838595, "learning_rate": 6.877350572032271e-07, "loss": 0.7694, "step": 5286 }, { "epoch": 0.4877868757928728, "grad_norm": 1.5140355336761933, "learning_rate": 6.875478582245496e-07, "loss": 0.6093, "step": 5287 }, { "epoch": 0.48787913735439975, "grad_norm": 2.3256957216941037, "learning_rate": 6.873606535776871e-07, "loss": 0.6791, "step": 5288 }, { "epoch": 0.48797139891592667, "grad_norm": 1.7210983351479296, "learning_rate": 6.871734432796038e-07, "loss": 0.7426, "step": 5289 }, { "epoch": 0.4880636604774536, "grad_norm": 1.5890358545413577, "learning_rate": 6.869862273472649e-07, "loss": 0.5699, "step": 5290 }, { "epoch": 0.4880636604774536, "eval_GEN Loss": 0.4460275173187256, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.35815712809562683, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.797656238079071, "eval_runtime": 57.0192, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5290 }, { "epoch": 0.4881559220389805, "grad_norm": 2.5064781849329405, "learning_rate": 6.867990057976371e-07, "loss": 0.8195, "step": 5291 }, { "epoch": 0.4882481836005074, "grad_norm": 1.8625365679955745, "learning_rate": 6.866117786476856e-07, "loss": 0.7233, "step": 5292 }, { "epoch": 0.48834044516203434, "grad_norm": 2.277230977017301, "learning_rate": 6.864245459143781e-07, "loss": 0.7609, "step": 5293 }, { "epoch": 0.4884327067235613, "grad_norm": 1.8683812192306888, "learning_rate": 6.862373076146813e-07, "loss": 0.7193, "step": 5294 }, { "epoch": 0.48852496828508823, "grad_norm": 2.48020799517351, "learning_rate": 6.860500637655636e-07, "loss": 0.7651, "step": 5295 }, { "epoch": 0.48852496828508823, "eval_GEN Loss": 0.4468909502029419, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3436923027038574, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8056490421295166, "eval_runtime": 57.1115, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 5295 }, { "epoch": 0.48861722984661515, "grad_norm": 1.473216831609417, "learning_rate": 6.858628143839929e-07, "loss": 0.5809, "step": 5296 }, { "epoch": 0.48870949140814207, "grad_norm": 1.9755506591841607, "learning_rate": 6.856755594869381e-07, "loss": 0.8222, "step": 5297 }, { "epoch": 0.488801752969669, "grad_norm": 1.5284099930878887, "learning_rate": 6.854882990913687e-07, "loss": 0.5885, "step": 5298 }, { "epoch": 0.48889401453119596, "grad_norm": 1.7758627821233632, "learning_rate": 6.853010332142543e-07, "loss": 0.7167, "step": 5299 }, { "epoch": 0.4889862760927229, "grad_norm": 1.5634232353168074, "learning_rate": 6.851137618725653e-07, "loss": 0.7106, "step": 5300 }, { "epoch": 0.4889862760927229, "eval_GEN Loss": 0.4465012848377228, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3342447578907013, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8126803040504456, "eval_runtime": 56.9877, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5300 }, { "epoch": 0.4890785376542498, "grad_norm": 2.6141711469472466, "learning_rate": 6.849264850832726e-07, "loss": 0.7316, "step": 5301 }, { "epoch": 0.4891707992157767, "grad_norm": 1.2038400856147284, "learning_rate": 6.847392028633477e-07, "loss": 0.5244, "step": 5302 }, { "epoch": 0.48926306077730364, "grad_norm": 1.9171984515197855, "learning_rate": 6.845519152297621e-07, "loss": 0.7391, "step": 5303 }, { "epoch": 0.4893553223388306, "grad_norm": 1.5080920641884723, "learning_rate": 6.843646221994882e-07, "loss": 0.5356, "step": 5304 }, { "epoch": 0.48944758390035753, "grad_norm": 1.9844877480169987, "learning_rate": 6.841773237894987e-07, "loss": 0.7359, "step": 5305 }, { "epoch": 0.48944758390035753, "eval_GEN Loss": 0.44728758931159973, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3298676013946533, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8248196840286255, "eval_runtime": 56.1483, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5305 }, { "epoch": 0.48953984546188445, "grad_norm": 1.4518058936310503, "learning_rate": 6.839900200167671e-07, "loss": 0.6502, "step": 5306 }, { "epoch": 0.48963210702341137, "grad_norm": 2.0476658423428478, "learning_rate": 6.83802710898267e-07, "loss": 0.7773, "step": 5307 }, { "epoch": 0.4897243685849383, "grad_norm": 2.0519564629039593, "learning_rate": 6.836153964509727e-07, "loss": 0.8156, "step": 5308 }, { "epoch": 0.4898166301464652, "grad_norm": 1.81761581673439, "learning_rate": 6.83428076691859e-07, "loss": 0.6593, "step": 5309 }, { "epoch": 0.4899088917079922, "grad_norm": 2.672855257437952, "learning_rate": 6.832407516379008e-07, "loss": 0.8058, "step": 5310 }, { "epoch": 0.4899088917079922, "eval_GEN Loss": 0.44662582874298096, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.33568885922431946, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8215144276618958, "eval_runtime": 56.204, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5310 }, { "epoch": 0.4900011532695191, "grad_norm": 1.860207961091584, "learning_rate": 6.830534213060743e-07, "loss": 0.6694, "step": 5311 }, { "epoch": 0.490093414831046, "grad_norm": 2.115848034239761, "learning_rate": 6.82866085713355e-07, "loss": 0.8381, "step": 5312 }, { "epoch": 0.49018567639257293, "grad_norm": 2.64452835030952, "learning_rate": 6.826787448767203e-07, "loss": 0.688, "step": 5313 }, { "epoch": 0.49027793795409985, "grad_norm": 1.6983972816246264, "learning_rate": 6.824913988131466e-07, "loss": 0.6176, "step": 5314 }, { "epoch": 0.4903701995156268, "grad_norm": 1.6903718140001671, "learning_rate": 6.82304047539612e-07, "loss": 0.6261, "step": 5315 }, { "epoch": 0.4903701995156268, "eval_GEN Loss": 0.44688019156455994, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.342485636472702, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8103365302085876, "eval_runtime": 56.2325, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 5315 }, { "epoch": 0.49046246107715374, "grad_norm": 1.421827599988636, "learning_rate": 6.821166910730945e-07, "loss": 0.5952, "step": 5316 }, { "epoch": 0.49055472263868066, "grad_norm": 2.755023399008064, "learning_rate": 6.819293294305724e-07, "loss": 0.7919, "step": 5317 }, { "epoch": 0.4906469842002076, "grad_norm": 1.6907977088060233, "learning_rate": 6.81741962629025e-07, "loss": 0.6388, "step": 5318 }, { "epoch": 0.4907392457617345, "grad_norm": 1.6207587284030915, "learning_rate": 6.815545906854318e-07, "loss": 0.7324, "step": 5319 }, { "epoch": 0.4908315073232615, "grad_norm": 2.225927847159523, "learning_rate": 6.813672136167721e-07, "loss": 0.7203, "step": 5320 }, { "epoch": 0.4908315073232615, "eval_GEN Loss": 0.4494723081588745, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.36387911438941956, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8150240182876587, "eval_runtime": 56.0469, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5320 }, { "epoch": 0.4909237688847884, "grad_norm": 2.2015135179171783, "learning_rate": 6.811798314400273e-07, "loss": 0.6268, "step": 5321 }, { "epoch": 0.4910160304463153, "grad_norm": 2.2393102380882226, "learning_rate": 6.809924441721774e-07, "loss": 0.6547, "step": 5322 }, { "epoch": 0.49110829200784223, "grad_norm": 1.7537161098600234, "learning_rate": 6.808050518302042e-07, "loss": 0.5325, "step": 5323 }, { "epoch": 0.49120055356936915, "grad_norm": 1.2906021116491815, "learning_rate": 6.806176544310892e-07, "loss": 0.6426, "step": 5324 }, { "epoch": 0.49129281513089607, "grad_norm": 1.9974792960826502, "learning_rate": 6.80430251991815e-07, "loss": 0.679, "step": 5325 }, { "epoch": 0.49129281513089607, "eval_GEN Loss": 0.4499535858631134, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.36459141969680786, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8209735751152039, "eval_runtime": 57.0593, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5325 }, { "epoch": 0.49138507669242304, "grad_norm": 1.1443403678356325, "learning_rate": 6.802428445293641e-07, "loss": 0.4434, "step": 5326 }, { "epoch": 0.49147733825394996, "grad_norm": 2.731626540661461, "learning_rate": 6.800554320607197e-07, "loss": 0.8061, "step": 5327 }, { "epoch": 0.4915695998154769, "grad_norm": 2.5640268822139842, "learning_rate": 6.798680146028652e-07, "loss": 0.7692, "step": 5328 }, { "epoch": 0.4916618613770038, "grad_norm": 1.8352041128013685, "learning_rate": 6.79680592172785e-07, "loss": 0.7452, "step": 5329 }, { "epoch": 0.4917541229385307, "grad_norm": 3.0560220596924625, "learning_rate": 6.794931647874633e-07, "loss": 0.7506, "step": 5330 }, { "epoch": 0.4917541229385307, "eval_GEN Loss": 0.450395405292511, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.36391282081604004, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8243990540504456, "eval_runtime": 56.9449, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5330 }, { "epoch": 0.4918463845000577, "grad_norm": 2.152776686633733, "learning_rate": 6.793057324638856e-07, "loss": 0.6401, "step": 5331 }, { "epoch": 0.4919386460615846, "grad_norm": 2.5168826209881043, "learning_rate": 6.791182952190368e-07, "loss": 0.8717, "step": 5332 }, { "epoch": 0.4920309076231115, "grad_norm": 2.3676226383038066, "learning_rate": 6.789308530699027e-07, "loss": 0.7366, "step": 5333 }, { "epoch": 0.49212316918463844, "grad_norm": 1.9040576623375032, "learning_rate": 6.787434060334699e-07, "loss": 0.4843, "step": 5334 }, { "epoch": 0.49221543074616536, "grad_norm": 2.8890583792703532, "learning_rate": 6.785559541267252e-07, "loss": 0.7706, "step": 5335 }, { "epoch": 0.49221543074616536, "eval_GEN Loss": 0.45038849115371704, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.3705781102180481, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8191706538200378, "eval_runtime": 57.0635, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5335 }, { "epoch": 0.49230769230769234, "grad_norm": 2.041391306641227, "learning_rate": 6.783684973666556e-07, "loss": 0.778, "step": 5336 }, { "epoch": 0.49239995386921925, "grad_norm": 1.9756797188732005, "learning_rate": 6.781810357702485e-07, "loss": 0.6249, "step": 5337 }, { "epoch": 0.49249221543074617, "grad_norm": 1.7579491473289928, "learning_rate": 6.779935693544925e-07, "loss": 0.6769, "step": 5338 }, { "epoch": 0.4925844769922731, "grad_norm": 2.13608671854341, "learning_rate": 6.778060981363757e-07, "loss": 0.6017, "step": 5339 }, { "epoch": 0.4926767385538, "grad_norm": 2.0925763268408892, "learning_rate": 6.776186221328872e-07, "loss": 0.7173, "step": 5340 }, { "epoch": 0.4926767385538, "eval_GEN Loss": 0.4509439468383789, "eval_GEN top-5 accuracy": 0.9811486190267427, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.36796844005584717, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8223557472229004, "eval_runtime": 57.1216, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 5340 }, { "epoch": 0.4927690001153269, "grad_norm": 2.0678768149898046, "learning_rate": 6.774311413610164e-07, "loss": 0.5205, "step": 5341 }, { "epoch": 0.4928612616768539, "grad_norm": 1.5818730639382448, "learning_rate": 6.772436558377529e-07, "loss": 0.5392, "step": 5342 }, { "epoch": 0.4929535232383808, "grad_norm": 1.578573842014058, "learning_rate": 6.770561655800872e-07, "loss": 0.5474, "step": 5343 }, { "epoch": 0.49304578479990774, "grad_norm": 1.4540592075319834, "learning_rate": 6.7686867060501e-07, "loss": 0.6563, "step": 5344 }, { "epoch": 0.49313804636143466, "grad_norm": 2.1491498180359008, "learning_rate": 6.76681170929512e-07, "loss": 0.7054, "step": 5345 }, { "epoch": 0.49313804636143466, "eval_GEN Loss": 0.4497039318084717, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3457697331905365, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8236778974533081, "eval_runtime": 56.1501, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5345 }, { "epoch": 0.4932303079229616, "grad_norm": 2.0504780862670384, "learning_rate": 6.76493666570585e-07, "loss": 0.704, "step": 5346 }, { "epoch": 0.49332256948448855, "grad_norm": 1.7484850342032314, "learning_rate": 6.763061575452208e-07, "loss": 0.6603, "step": 5347 }, { "epoch": 0.49341483104601547, "grad_norm": 4.827275380694562, "learning_rate": 6.76118643870412e-07, "loss": 0.8325, "step": 5348 }, { "epoch": 0.4935070926075424, "grad_norm": 1.6240631926413094, "learning_rate": 6.759311255631511e-07, "loss": 0.5855, "step": 5349 }, { "epoch": 0.4935993541690693, "grad_norm": 2.1716725231765954, "learning_rate": 6.757436026404316e-07, "loss": 0.7991, "step": 5350 }, { "epoch": 0.4935993541690693, "eval_GEN Loss": 0.450387179851532, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3395482897758484, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8339543342590332, "eval_runtime": 56.1222, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5350 }, { "epoch": 0.4936916157305962, "grad_norm": 2.6442971753578925, "learning_rate": 6.755560751192466e-07, "loss": 0.7841, "step": 5351 }, { "epoch": 0.4937838772921232, "grad_norm": 1.8697794199632625, "learning_rate": 6.753685430165909e-07, "loss": 0.5577, "step": 5352 }, { "epoch": 0.4938761388536501, "grad_norm": 1.7356087440370314, "learning_rate": 6.751810063494582e-07, "loss": 0.6546, "step": 5353 }, { "epoch": 0.49396840041517703, "grad_norm": 1.6895436657503966, "learning_rate": 6.74993465134844e-07, "loss": 0.5187, "step": 5354 }, { "epoch": 0.49406066197670395, "grad_norm": 2.4659194123763784, "learning_rate": 6.748059193897432e-07, "loss": 0.5702, "step": 5355 }, { "epoch": 0.49406066197670395, "eval_GEN Loss": 0.4511547088623047, "eval_GEN top-5 accuracy": 0.9807102148180622, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3382248878479004, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8170071840286255, "eval_runtime": 56.1855, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5355 }, { "epoch": 0.49415292353823087, "grad_norm": 2.1798344295938277, "learning_rate": 6.746183691311515e-07, "loss": 0.6553, "step": 5356 }, { "epoch": 0.4942451850997578, "grad_norm": 1.4630114908439404, "learning_rate": 6.744308143760653e-07, "loss": 0.3919, "step": 5357 }, { "epoch": 0.49433744666128476, "grad_norm": 1.9726959122968153, "learning_rate": 6.742432551414807e-07, "loss": 0.5807, "step": 5358 }, { "epoch": 0.4944297082228117, "grad_norm": 1.911391527182438, "learning_rate": 6.74055691444395e-07, "loss": 0.5738, "step": 5359 }, { "epoch": 0.4945219697843386, "grad_norm": 2.153556167819473, "learning_rate": 6.738681233018052e-07, "loss": 0.7155, "step": 5360 }, { "epoch": 0.4945219697843386, "eval_GEN Loss": 0.45182299613952637, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3424991965293884, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8098557591438293, "eval_runtime": 56.1699, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5360 }, { "epoch": 0.4946142313458655, "grad_norm": 1.3380819161671886, "learning_rate": 6.736805507307091e-07, "loss": 0.4587, "step": 5361 }, { "epoch": 0.49470649290739244, "grad_norm": 1.609264967465174, "learning_rate": 6.734929737481049e-07, "loss": 0.6314, "step": 5362 }, { "epoch": 0.4947987544689194, "grad_norm": 2.1969369378552854, "learning_rate": 6.733053923709911e-07, "loss": 0.6888, "step": 5363 }, { "epoch": 0.49489101603044633, "grad_norm": 2.9079206194035603, "learning_rate": 6.731178066163667e-07, "loss": 0.8226, "step": 5364 }, { "epoch": 0.49498327759197325, "grad_norm": 1.7013706886436466, "learning_rate": 6.729302165012308e-07, "loss": 0.6857, "step": 5365 }, { "epoch": 0.49498327759197325, "eval_GEN Loss": 0.45275840163230896, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3535032868385315, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8089542984962463, "eval_runtime": 57.0212, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5365 }, { "epoch": 0.49507553915350017, "grad_norm": 3.055339057607085, "learning_rate": 6.727426220425833e-07, "loss": 0.6637, "step": 5366 }, { "epoch": 0.4951678007150271, "grad_norm": 3.064071408834588, "learning_rate": 6.725550232574244e-07, "loss": 0.8068, "step": 5367 }, { "epoch": 0.49526006227655406, "grad_norm": 1.9861601957831896, "learning_rate": 6.723674201627542e-07, "loss": 0.5864, "step": 5368 }, { "epoch": 0.495352323838081, "grad_norm": 1.760216195628246, "learning_rate": 6.721798127755738e-07, "loss": 0.5811, "step": 5369 }, { "epoch": 0.4954445853996079, "grad_norm": 1.9234521423271544, "learning_rate": 6.719922011128846e-07, "loss": 0.63, "step": 5370 }, { "epoch": 0.4954445853996079, "eval_GEN Loss": 0.4542452394962311, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3676982820034027, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8007211685180664, "eval_runtime": 56.9076, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5370 }, { "epoch": 0.4955368469611348, "grad_norm": 4.284644481133725, "learning_rate": 6.718045851916882e-07, "loss": 0.7964, "step": 5371 }, { "epoch": 0.49562910852266173, "grad_norm": 2.0028894437463887, "learning_rate": 6.716169650289865e-07, "loss": 0.7363, "step": 5372 }, { "epoch": 0.49572137008418865, "grad_norm": 2.144137154834869, "learning_rate": 6.714293406417822e-07, "loss": 0.5705, "step": 5373 }, { "epoch": 0.4958136316457156, "grad_norm": 2.5817758556092167, "learning_rate": 6.712417120470779e-07, "loss": 0.7776, "step": 5374 }, { "epoch": 0.49590589320724254, "grad_norm": 2.0782714950109806, "learning_rate": 6.71054079261877e-07, "loss": 0.6583, "step": 5375 }, { "epoch": 0.49590589320724254, "eval_GEN Loss": 0.45588478446006775, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.38793742656707764, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.801562488079071, "eval_runtime": 57.4271, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 5375 }, { "epoch": 0.49599815476876946, "grad_norm": 2.001035735329717, "learning_rate": 6.708664423031827e-07, "loss": 0.6731, "step": 5376 }, { "epoch": 0.4960904163302964, "grad_norm": 2.332978069944789, "learning_rate": 6.706788011879995e-07, "loss": 0.785, "step": 5377 }, { "epoch": 0.4961826778918233, "grad_norm": 2.736623131959861, "learning_rate": 6.704911559333311e-07, "loss": 0.8087, "step": 5378 }, { "epoch": 0.4962749394533503, "grad_norm": 2.063822361254413, "learning_rate": 6.703035065561828e-07, "loss": 0.6044, "step": 5379 }, { "epoch": 0.4963672010148772, "grad_norm": 2.317484513119575, "learning_rate": 6.701158530735594e-07, "loss": 0.8709, "step": 5380 }, { "epoch": 0.4963672010148772, "eval_GEN Loss": 0.45652472972869873, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.39784377813339233, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8067908883094788, "eval_runtime": 57.0199, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5380 }, { "epoch": 0.4964594625764041, "grad_norm": 3.112630717948118, "learning_rate": 6.699281955024662e-07, "loss": 0.7308, "step": 5381 }, { "epoch": 0.496551724137931, "grad_norm": 1.987573531136003, "learning_rate": 6.697405338599094e-07, "loss": 0.7909, "step": 5382 }, { "epoch": 0.49664398569945795, "grad_norm": 2.444518663352251, "learning_rate": 6.695528681628948e-07, "loss": 0.5878, "step": 5383 }, { "epoch": 0.49673624726098486, "grad_norm": 2.343245036266173, "learning_rate": 6.693651984284294e-07, "loss": 0.7793, "step": 5384 }, { "epoch": 0.49682850882251184, "grad_norm": 1.5951875386786545, "learning_rate": 6.691775246735198e-07, "loss": 0.5789, "step": 5385 }, { "epoch": 0.49682850882251184, "eval_GEN Loss": 0.4562091827392578, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM Loss": 0.37973442673683167, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8067908883094788, "eval_runtime": 56.9084, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5385 }, { "epoch": 0.49692077038403876, "grad_norm": 2.1124250582811164, "learning_rate": 6.689898469151731e-07, "loss": 0.7686, "step": 5386 }, { "epoch": 0.4970130319455657, "grad_norm": 2.0727756665632997, "learning_rate": 6.688021651703977e-07, "loss": 0.7537, "step": 5387 }, { "epoch": 0.4971052935070926, "grad_norm": 2.616003629661462, "learning_rate": 6.686144794562008e-07, "loss": 0.7142, "step": 5388 }, { "epoch": 0.4971975550686195, "grad_norm": 1.5203767248738134, "learning_rate": 6.684267897895913e-07, "loss": 0.6204, "step": 5389 }, { "epoch": 0.4972898166301465, "grad_norm": 1.9512324385217645, "learning_rate": 6.682390961875778e-07, "loss": 0.5374, "step": 5390 }, { "epoch": 0.4972898166301465, "eval_GEN Loss": 0.45478516817092896, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.36571550369262695, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8127403855323792, "eval_runtime": 57.1449, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 5390 }, { "epoch": 0.4973820781916734, "grad_norm": 1.4738202871144412, "learning_rate": 6.680513986671694e-07, "loss": 0.5949, "step": 5391 }, { "epoch": 0.4974743397532003, "grad_norm": 1.7733729051241283, "learning_rate": 6.678636972453752e-07, "loss": 0.7049, "step": 5392 }, { "epoch": 0.49756660131472724, "grad_norm": 1.939250174031338, "learning_rate": 6.676759919392055e-07, "loss": 0.5788, "step": 5393 }, { "epoch": 0.49765886287625416, "grad_norm": 2.3747288110963685, "learning_rate": 6.6748828276567e-07, "loss": 0.795, "step": 5394 }, { "epoch": 0.49775112443778113, "grad_norm": 2.9061416111132727, "learning_rate": 6.673005697417796e-07, "loss": 0.8745, "step": 5395 }, { "epoch": 0.49775112443778113, "eval_GEN Loss": 0.45501068234443665, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.36809226870536804, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8237980604171753, "eval_runtime": 56.9494, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5395 }, { "epoch": 0.49784338599930805, "grad_norm": 3.1436169531618363, "learning_rate": 6.671128528845451e-07, "loss": 0.8051, "step": 5396 }, { "epoch": 0.49793564756083497, "grad_norm": 1.6992799879594964, "learning_rate": 6.669251322109774e-07, "loss": 0.5165, "step": 5397 }, { "epoch": 0.4980279091223619, "grad_norm": 2.2401723426623024, "learning_rate": 6.667374077380884e-07, "loss": 0.6152, "step": 5398 }, { "epoch": 0.4981201706838888, "grad_norm": 2.2107837788809386, "learning_rate": 6.665496794828897e-07, "loss": 0.5946, "step": 5399 }, { "epoch": 0.4982124322454157, "grad_norm": 1.6727488904202323, "learning_rate": 6.663619474623936e-07, "loss": 0.7889, "step": 5400 }, { "epoch": 0.4982124322454157, "eval_GEN Loss": 0.4545566141605377, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.36905550956726074, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.82421875, "eval_runtime": 57.01, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5400 }, { "epoch": 0.4983046938069427, "grad_norm": 1.8715144924018392, "learning_rate": 6.661742116936127e-07, "loss": 0.7323, "step": 5401 }, { "epoch": 0.4983969553684696, "grad_norm": 1.6604704677527897, "learning_rate": 6.659864721935601e-07, "loss": 0.7212, "step": 5402 }, { "epoch": 0.49848921692999654, "grad_norm": 1.987516402032218, "learning_rate": 6.657987289792487e-07, "loss": 0.669, "step": 5403 }, { "epoch": 0.49858147849152346, "grad_norm": 1.8688347553106244, "learning_rate": 6.656109820676925e-07, "loss": 0.6931, "step": 5404 }, { "epoch": 0.4986737400530504, "grad_norm": 2.034281868142649, "learning_rate": 6.65423231475905e-07, "loss": 0.716, "step": 5405 }, { "epoch": 0.4986737400530504, "eval_GEN Loss": 0.4538855254650116, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.3652361035346985, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8247596025466919, "eval_runtime": 57.0532, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5405 }, { "epoch": 0.49876600161457735, "grad_norm": 1.6288873410610847, "learning_rate": 6.652354772209006e-07, "loss": 0.6637, "step": 5406 }, { "epoch": 0.49885826317610427, "grad_norm": 1.5656643356743964, "learning_rate": 6.65047719319694e-07, "loss": 0.6057, "step": 5407 }, { "epoch": 0.4989505247376312, "grad_norm": 1.6299631948319757, "learning_rate": 6.648599577893e-07, "loss": 0.6127, "step": 5408 }, { "epoch": 0.4990427862991581, "grad_norm": 1.702755699879321, "learning_rate": 6.646721926467339e-07, "loss": 0.5994, "step": 5409 }, { "epoch": 0.499135047860685, "grad_norm": 3.589979624708464, "learning_rate": 6.644844239090112e-07, "loss": 0.9457, "step": 5410 }, { "epoch": 0.499135047860685, "eval_GEN Loss": 0.4547160863876343, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.3665526807308197, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8256610631942749, "eval_runtime": 56.2881, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 5410 }, { "epoch": 0.499227309422212, "grad_norm": 1.6479613828704325, "learning_rate": 6.642966515931479e-07, "loss": 0.6721, "step": 5411 }, { "epoch": 0.4993195709837389, "grad_norm": 1.6721222848404582, "learning_rate": 6.641088757161602e-07, "loss": 0.5791, "step": 5412 }, { "epoch": 0.49941183254526583, "grad_norm": 1.829226217748743, "learning_rate": 6.639210962950648e-07, "loss": 0.5236, "step": 5413 }, { "epoch": 0.49950409410679275, "grad_norm": 2.740195528075589, "learning_rate": 6.63733313346878e-07, "loss": 1.0691, "step": 5414 }, { "epoch": 0.49959635566831967, "grad_norm": 1.655673885608047, "learning_rate": 6.635455268886178e-07, "loss": 0.7143, "step": 5415 }, { "epoch": 0.49959635566831967, "eval_GEN Loss": 0.4547809064388275, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.366292268037796, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8237379789352417, "eval_runtime": 55.9876, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5415 }, { "epoch": 0.4996886172298466, "grad_norm": 1.6264253408039486, "learning_rate": 6.633577369373011e-07, "loss": 0.7096, "step": 5416 }, { "epoch": 0.49978087879137356, "grad_norm": 1.7625467364431346, "learning_rate": 6.631699435099458e-07, "loss": 0.7648, "step": 5417 }, { "epoch": 0.4998731403529005, "grad_norm": 2.074764247398275, "learning_rate": 6.629821466235703e-07, "loss": 0.9023, "step": 5418 }, { "epoch": 0.4999654019144274, "grad_norm": 2.1254888892678334, "learning_rate": 6.627943462951927e-07, "loss": 0.6951, "step": 5419 }, { "epoch": 0.5000576634759544, "grad_norm": 2.6891150492828753, "learning_rate": 6.62606542541832e-07, "loss": 0.802, "step": 5420 }, { "epoch": 0.5000576634759544, "eval_GEN Loss": 0.45398253202438354, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.36442112922668457, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8206129670143127, "eval_runtime": 56.0997, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 5420 }, { "epoch": 0.5001499250374812, "grad_norm": 2.0201184339551874, "learning_rate": 6.624187353805074e-07, "loss": 0.702, "step": 5421 }, { "epoch": 0.5002421865990082, "grad_norm": 2.3399697792985856, "learning_rate": 6.622309248282379e-07, "loss": 0.7101, "step": 5422 }, { "epoch": 0.5003344481605351, "grad_norm": 2.135422838143364, "learning_rate": 6.620431109020435e-07, "loss": 0.7063, "step": 5423 }, { "epoch": 0.500426709722062, "grad_norm": 2.489749782368745, "learning_rate": 6.61855293618944e-07, "loss": 0.7711, "step": 5424 }, { "epoch": 0.500518971283589, "grad_norm": 1.3855730214581048, "learning_rate": 6.616674729959599e-07, "loss": 0.6106, "step": 5425 }, { "epoch": 0.500518971283589, "eval_GEN Loss": 0.45412665605545044, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3666369915008545, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8161057829856873, "eval_runtime": 56.1123, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5425 }, { "epoch": 0.5006112328451159, "grad_norm": 1.3272155925293556, "learning_rate": 6.614796490501115e-07, "loss": 0.6366, "step": 5426 }, { "epoch": 0.5007034944066429, "grad_norm": 2.1145973955106676, "learning_rate": 6.6129182179842e-07, "loss": 0.7024, "step": 5427 }, { "epoch": 0.5007957559681697, "grad_norm": 2.5293290018023358, "learning_rate": 6.611039912579066e-07, "loss": 0.8289, "step": 5428 }, { "epoch": 0.5008880175296967, "grad_norm": 1.5676897344160272, "learning_rate": 6.609161574455924e-07, "loss": 0.5495, "step": 5429 }, { "epoch": 0.5009802790912237, "grad_norm": 3.3303208604994645, "learning_rate": 6.607283203784998e-07, "loss": 0.7964, "step": 5430 }, { "epoch": 0.5009802790912237, "eval_GEN Loss": 0.45513907074928284, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.360712468624115, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8195913434028625, "eval_runtime": 56.9918, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5430 }, { "epoch": 0.5010725406527505, "grad_norm": 3.7595432486827267, "learning_rate": 6.605404800736503e-07, "loss": 0.8711, "step": 5431 }, { "epoch": 0.5011648022142775, "grad_norm": 2.627078265387286, "learning_rate": 6.603526365480668e-07, "loss": 0.6738, "step": 5432 }, { "epoch": 0.5012570637758044, "grad_norm": 2.6429378518009465, "learning_rate": 6.601647898187716e-07, "loss": 0.6676, "step": 5433 }, { "epoch": 0.5013493253373313, "grad_norm": 2.722049499771568, "learning_rate": 6.599769399027878e-07, "loss": 0.6811, "step": 5434 }, { "epoch": 0.5014415868988583, "grad_norm": 1.4470770848772276, "learning_rate": 6.597890868171386e-07, "loss": 0.6866, "step": 5435 }, { "epoch": 0.5014415868988583, "eval_GEN Loss": 0.4540416896343231, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3607963025569916, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8190504908561707, "eval_runtime": 56.9832, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5435 }, { "epoch": 0.5015338484603852, "grad_norm": 1.9127432052001523, "learning_rate": 6.596012305788475e-07, "loss": 0.7095, "step": 5436 }, { "epoch": 0.5016261100219122, "grad_norm": 2.2172935253083663, "learning_rate": 6.594133712049388e-07, "loss": 0.605, "step": 5437 }, { "epoch": 0.501718371583439, "grad_norm": 1.641051612826847, "learning_rate": 6.592255087124359e-07, "loss": 0.6216, "step": 5438 }, { "epoch": 0.501810633144966, "grad_norm": 1.6979544953964563, "learning_rate": 6.590376431183637e-07, "loss": 0.5428, "step": 5439 }, { "epoch": 0.5019028947064929, "grad_norm": 2.1467404588705676, "learning_rate": 6.588497744397466e-07, "loss": 0.7389, "step": 5440 }, { "epoch": 0.5019028947064929, "eval_GEN Loss": 0.45337560772895813, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3668665289878845, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8161057829856873, "eval_runtime": 56.8802, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5440 }, { "epoch": 0.5019951562680198, "grad_norm": 1.4820446537651433, "learning_rate": 6.586619026936098e-07, "loss": 0.4924, "step": 5441 }, { "epoch": 0.5020874178295468, "grad_norm": 2.0683425402986195, "learning_rate": 6.584740278969781e-07, "loss": 0.6854, "step": 5442 }, { "epoch": 0.5021796793910737, "grad_norm": 1.972650996423103, "learning_rate": 6.582861500668774e-07, "loss": 0.6211, "step": 5443 }, { "epoch": 0.5022719409526006, "grad_norm": 1.6768732144416927, "learning_rate": 6.580982692203336e-07, "loss": 0.6594, "step": 5444 }, { "epoch": 0.5023642025141275, "grad_norm": 1.4297668074282555, "learning_rate": 6.579103853743723e-07, "loss": 0.6192, "step": 5445 }, { "epoch": 0.5023642025141275, "eval_GEN Loss": 0.45275557041168213, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.36501815915107727, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.817187488079071, "eval_runtime": 56.8935, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5445 }, { "epoch": 0.5024564640756545, "grad_norm": 2.1662347756102536, "learning_rate": 6.577224985460203e-07, "loss": 0.8818, "step": 5446 }, { "epoch": 0.5025487256371814, "grad_norm": 2.805474911619233, "learning_rate": 6.575346087523038e-07, "loss": 0.6586, "step": 5447 }, { "epoch": 0.5026409871987083, "grad_norm": 2.4613990663451557, "learning_rate": 6.573467160102499e-07, "loss": 0.731, "step": 5448 }, { "epoch": 0.5027332487602353, "grad_norm": 2.672508482952123, "learning_rate": 6.571588203368859e-07, "loss": 0.6714, "step": 5449 }, { "epoch": 0.5028255103217621, "grad_norm": 1.9437550254584974, "learning_rate": 6.569709217492388e-07, "loss": 0.6021, "step": 5450 }, { "epoch": 0.5028255103217621, "eval_GEN Loss": 0.45298442244529724, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 Neg": 0.56, "eval_PRM Loss": 0.3683602809906006, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.814182698726654, "eval_runtime": 56.9659, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5450 }, { "epoch": 0.5029177718832891, "grad_norm": 1.7321248464517225, "learning_rate": 6.567830202643364e-07, "loss": 0.6699, "step": 5451 }, { "epoch": 0.5030100334448161, "grad_norm": 2.4750252339150975, "learning_rate": 6.565951158992066e-07, "loss": 0.9109, "step": 5452 }, { "epoch": 0.503102295006343, "grad_norm": 2.634638626363284, "learning_rate": 6.564072086708778e-07, "loss": 0.7955, "step": 5453 }, { "epoch": 0.5031945565678699, "grad_norm": 1.6395064924775584, "learning_rate": 6.562192985963782e-07, "loss": 0.6858, "step": 5454 }, { "epoch": 0.5032868181293968, "grad_norm": 1.4335354477364892, "learning_rate": 6.560313856927368e-07, "loss": 0.5962, "step": 5455 }, { "epoch": 0.5032868181293968, "eval_GEN Loss": 0.45385411381721497, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.37499240040779114, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8122596144676208, "eval_runtime": 55.8162, "eval_samples_per_second": 1.165, "eval_steps_per_second": 0.09, "step": 5455 }, { "epoch": 0.5033790796909238, "grad_norm": 1.7245348399522396, "learning_rate": 6.558434699769823e-07, "loss": 0.561, "step": 5456 }, { "epoch": 0.5034713412524507, "grad_norm": 1.6520992887483557, "learning_rate": 6.556555514661441e-07, "loss": 0.5182, "step": 5457 }, { "epoch": 0.5035636028139776, "grad_norm": 2.422561033032992, "learning_rate": 6.554676301772513e-07, "loss": 0.8372, "step": 5458 }, { "epoch": 0.5036558643755046, "grad_norm": 2.160409185498644, "learning_rate": 6.55279706127334e-07, "loss": 0.7205, "step": 5459 }, { "epoch": 0.5037481259370314, "grad_norm": 2.3532418096194796, "learning_rate": 6.550917793334222e-07, "loss": 0.8254, "step": 5460 }, { "epoch": 0.5037481259370314, "eval_GEN Loss": 0.45260241627693176, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.37423551082611084, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8088942170143127, "eval_runtime": 57.224, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 5460 }, { "epoch": 0.5038403874985584, "grad_norm": 1.632385273839656, "learning_rate": 6.54903849812546e-07, "loss": 0.718, "step": 5461 }, { "epoch": 0.5039326490600854, "grad_norm": 3.2164196949458637, "learning_rate": 6.547159175817358e-07, "loss": 0.6709, "step": 5462 }, { "epoch": 0.5040249106216123, "grad_norm": 2.539974019144695, "learning_rate": 6.545279826580222e-07, "loss": 0.6778, "step": 5463 }, { "epoch": 0.5041171721831392, "grad_norm": 1.5656824653769785, "learning_rate": 6.543400450584367e-07, "loss": 0.7191, "step": 5464 }, { "epoch": 0.5042094337446661, "grad_norm": 2.996472846432877, "learning_rate": 6.541521048000097e-07, "loss": 0.8314, "step": 5465 }, { "epoch": 0.5042094337446661, "eval_GEN Loss": 0.4532241225242615, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3812357485294342, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8083533644676208, "eval_runtime": 56.9482, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5465 }, { "epoch": 0.5043016953061931, "grad_norm": 1.8805944386335982, "learning_rate": 6.539641618997735e-07, "loss": 0.569, "step": 5466 }, { "epoch": 0.50439395686772, "grad_norm": 1.8413663881340374, "learning_rate": 6.53776216374759e-07, "loss": 0.5572, "step": 5467 }, { "epoch": 0.5044862184292469, "grad_norm": 2.196195960121717, "learning_rate": 6.535882682419986e-07, "loss": 0.6794, "step": 5468 }, { "epoch": 0.5045784799907739, "grad_norm": 2.1369344315377234, "learning_rate": 6.534003175185244e-07, "loss": 0.8377, "step": 5469 }, { "epoch": 0.5046707415523007, "grad_norm": 2.2361857974130404, "learning_rate": 6.532123642213687e-07, "loss": 0.8286, "step": 5470 }, { "epoch": 0.5046707415523007, "eval_GEN Loss": 0.45523300766944885, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8734177215189873, "eval_PRM F1 AUC": 0.785227867993714, "eval_PRM F1 Neg": 0.6296296296296297, "eval_PRM Loss": 0.3966497778892517, "eval_PRM NPV": 0.5483870967741935, "eval_PRM Precision": 0.92, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8161057829856873, "eval_runtime": 57.4002, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 5470 }, { "epoch": 0.5047630031138277, "grad_norm": 1.8081581035357366, "learning_rate": 6.530244083675642e-07, "loss": 0.5698, "step": 5471 }, { "epoch": 0.5048552646753546, "grad_norm": 1.8973859609431274, "learning_rate": 6.528364499741436e-07, "loss": 0.5867, "step": 5472 }, { "epoch": 0.5049475262368815, "grad_norm": 1.8247995373845391, "learning_rate": 6.526484890581402e-07, "loss": 0.6612, "step": 5473 }, { "epoch": 0.5050397877984085, "grad_norm": 1.7687336333132908, "learning_rate": 6.524605256365872e-07, "loss": 0.7571, "step": 5474 }, { "epoch": 0.5051320493599354, "grad_norm": 2.835741446058392, "learning_rate": 6.522725597265179e-07, "loss": 0.5835, "step": 5475 }, { "epoch": 0.5051320493599354, "eval_GEN Loss": 0.4575701057910919, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.39843320846557617, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8258413672447205, "eval_runtime": 56.8904, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5475 }, { "epoch": 0.5052243109214624, "grad_norm": 1.7982453708177557, "learning_rate": 6.520845913449666e-07, "loss": 0.6395, "step": 5476 }, { "epoch": 0.5053165724829892, "grad_norm": 2.1774989082569998, "learning_rate": 6.518966205089669e-07, "loss": 0.5537, "step": 5477 }, { "epoch": 0.5054088340445162, "grad_norm": 1.9577817660335204, "learning_rate": 6.517086472355532e-07, "loss": 0.6773, "step": 5478 }, { "epoch": 0.5055010956060432, "grad_norm": 3.0066836677296336, "learning_rate": 6.515206715417597e-07, "loss": 0.9076, "step": 5479 }, { "epoch": 0.50559335716757, "grad_norm": 2.536593049308347, "learning_rate": 6.513326934446213e-07, "loss": 0.8068, "step": 5480 }, { "epoch": 0.50559335716757, "eval_GEN Loss": 0.4569445550441742, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.39713600277900696, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8334735631942749, "eval_runtime": 56.9846, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5480 }, { "epoch": 0.505685618729097, "grad_norm": 2.5320131234978938, "learning_rate": 6.511447129611725e-07, "loss": 0.7828, "step": 5481 }, { "epoch": 0.5057778802906239, "grad_norm": 1.930681914016267, "learning_rate": 6.509567301084491e-07, "loss": 0.662, "step": 5482 }, { "epoch": 0.5058701418521508, "grad_norm": 2.258211299737169, "learning_rate": 6.507687449034857e-07, "loss": 0.6336, "step": 5483 }, { "epoch": 0.5059624034136778, "grad_norm": 3.0055771316252, "learning_rate": 6.505807573633181e-07, "loss": 0.7621, "step": 5484 }, { "epoch": 0.5060546649752047, "grad_norm": 1.7733831105087055, "learning_rate": 6.503927675049821e-07, "loss": 0.6791, "step": 5485 }, { "epoch": 0.5060546649752047, "eval_GEN Loss": 0.4565430283546448, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM Loss": 0.38648223876953125, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.840624988079071, "eval_runtime": 56.9721, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5485 }, { "epoch": 0.5061469265367317, "grad_norm": 3.21039821225345, "learning_rate": 6.502047753455134e-07, "loss": 0.8295, "step": 5486 }, { "epoch": 0.5062391880982585, "grad_norm": 1.436366776127382, "learning_rate": 6.500167809019483e-07, "loss": 0.6122, "step": 5487 }, { "epoch": 0.5063314496597855, "grad_norm": 2.2757987211183033, "learning_rate": 6.498287841913233e-07, "loss": 0.7719, "step": 5488 }, { "epoch": 0.5064237112213125, "grad_norm": 1.6151257610552796, "learning_rate": 6.496407852306746e-07, "loss": 0.6955, "step": 5489 }, { "epoch": 0.5065159727828393, "grad_norm": 1.4595550849291279, "learning_rate": 6.494527840370392e-07, "loss": 0.7249, "step": 5490 }, { "epoch": 0.5065159727828393, "eval_GEN Loss": 0.45609524846076965, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3838522136211395, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8490985631942749, "eval_runtime": 56.0364, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5490 }, { "epoch": 0.5066082343443663, "grad_norm": 1.525945970259381, "learning_rate": 6.492647806274541e-07, "loss": 0.6406, "step": 5491 }, { "epoch": 0.5067004959058932, "grad_norm": 1.9497357473973373, "learning_rate": 6.490767750189564e-07, "loss": 0.8744, "step": 5492 }, { "epoch": 0.5067927574674201, "grad_norm": 2.2242600973362774, "learning_rate": 6.488887672285833e-07, "loss": 0.8189, "step": 5493 }, { "epoch": 0.5068850190289471, "grad_norm": 2.1181544323594235, "learning_rate": 6.487007572733726e-07, "loss": 0.8144, "step": 5494 }, { "epoch": 0.506977280590474, "grad_norm": 1.3212708314692936, "learning_rate": 6.48512745170362e-07, "loss": 0.6533, "step": 5495 }, { "epoch": 0.506977280590474, "eval_GEN Loss": 0.45553985238075256, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.3746609091758728, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8555889129638672, "eval_runtime": 56.9927, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5495 }, { "epoch": 0.507069542152001, "grad_norm": 2.2156947770219486, "learning_rate": 6.483247309365895e-07, "loss": 0.5527, "step": 5496 }, { "epoch": 0.5071618037135278, "grad_norm": 2.385185561710092, "learning_rate": 6.481367145890931e-07, "loss": 0.7397, "step": 5497 }, { "epoch": 0.5072540652750548, "grad_norm": 2.638685298021261, "learning_rate": 6.479486961449113e-07, "loss": 0.7945, "step": 5498 }, { "epoch": 0.5073463268365818, "grad_norm": 1.683399512240882, "learning_rate": 6.477606756210822e-07, "loss": 0.564, "step": 5499 }, { "epoch": 0.5074385883981086, "grad_norm": 1.783326758103116, "learning_rate": 6.47572653034645e-07, "loss": 0.6544, "step": 5500 }, { "epoch": 0.5074385883981086, "eval_GEN Loss": 0.45632559061050415, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.37432757019996643, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8497596383094788, "eval_runtime": 57.1568, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 5500 }, { "epoch": 0.5075308499596356, "grad_norm": 2.4131150939341666, "learning_rate": 6.473846284026386e-07, "loss": 0.7823, "step": 5501 }, { "epoch": 0.5076231115211625, "grad_norm": 1.4076103690368338, "learning_rate": 6.471966017421017e-07, "loss": 0.6245, "step": 5502 }, { "epoch": 0.5077153730826894, "grad_norm": 1.995452513835266, "learning_rate": 6.470085730700741e-07, "loss": 0.6523, "step": 5503 }, { "epoch": 0.5078076346442163, "grad_norm": 1.6746242191361094, "learning_rate": 6.468205424035948e-07, "loss": 0.5687, "step": 5504 }, { "epoch": 0.5078998962057433, "grad_norm": 1.556116438130549, "learning_rate": 6.466325097597037e-07, "loss": 0.6302, "step": 5505 }, { "epoch": 0.5078998962057433, "eval_GEN Loss": 0.4559377431869507, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM Loss": 0.37578651309013367, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8396033644676208, "eval_runtime": 56.8686, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5505 }, { "epoch": 0.5079921577672702, "grad_norm": 2.320698822635991, "learning_rate": 6.464444751554403e-07, "loss": 0.6611, "step": 5506 }, { "epoch": 0.5080844193287971, "grad_norm": 3.6483612858547656, "learning_rate": 6.462564386078452e-07, "loss": 1.0066, "step": 5507 }, { "epoch": 0.5081766808903241, "grad_norm": 1.6166801555695078, "learning_rate": 6.460684001339577e-07, "loss": 0.7457, "step": 5508 }, { "epoch": 0.508268942451851, "grad_norm": 1.9810460809952564, "learning_rate": 6.458803597508189e-07, "loss": 0.6845, "step": 5509 }, { "epoch": 0.5083612040133779, "grad_norm": 2.052441866063954, "learning_rate": 6.456923174754691e-07, "loss": 0.7485, "step": 5510 }, { "epoch": 0.5083612040133779, "eval_GEN Loss": 0.45434489846229553, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3816729784011841, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8301081657409668, "eval_runtime": 56.852, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5510 }, { "epoch": 0.5084534655749049, "grad_norm": 1.5068141473406207, "learning_rate": 6.455042733249488e-07, "loss": 0.6669, "step": 5511 }, { "epoch": 0.5085457271364318, "grad_norm": 1.8560152834062953, "learning_rate": 6.45316227316299e-07, "loss": 0.692, "step": 5512 }, { "epoch": 0.5086379886979587, "grad_norm": 1.4465512112890548, "learning_rate": 6.451281794665607e-07, "loss": 0.5173, "step": 5513 }, { "epoch": 0.5087302502594856, "grad_norm": 2.4526967715434003, "learning_rate": 6.44940129792775e-07, "loss": 0.7129, "step": 5514 }, { "epoch": 0.5088225118210126, "grad_norm": 1.707265893283639, "learning_rate": 6.447520783119835e-07, "loss": 0.5174, "step": 5515 }, { "epoch": 0.5088225118210126, "eval_GEN Loss": 0.4534631073474884, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3745405077934265, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8234975934028625, "eval_runtime": 56.854, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5515 }, { "epoch": 0.5089147733825395, "grad_norm": 1.8035244358442266, "learning_rate": 6.445640250412273e-07, "loss": 0.7013, "step": 5516 }, { "epoch": 0.5090070349440664, "grad_norm": 1.4472528662083786, "learning_rate": 6.443759699975487e-07, "loss": 0.6886, "step": 5517 }, { "epoch": 0.5090992965055934, "grad_norm": 1.7489648358315126, "learning_rate": 6.441879131979889e-07, "loss": 0.6482, "step": 5518 }, { "epoch": 0.5091915580671202, "grad_norm": 2.4931522723578174, "learning_rate": 6.439998546595905e-07, "loss": 0.8596, "step": 5519 }, { "epoch": 0.5092838196286472, "grad_norm": 2.091727174047805, "learning_rate": 6.438117943993953e-07, "loss": 0.7362, "step": 5520 }, { "epoch": 0.5092838196286472, "eval_GEN Loss": 0.45178496837615967, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM Loss": 0.35584917664527893, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8224759697914124, "eval_runtime": 56.9819, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5520 }, { "epoch": 0.5093760811901742, "grad_norm": 2.082812935274943, "learning_rate": 6.436237324344456e-07, "loss": 0.7064, "step": 5521 }, { "epoch": 0.509468342751701, "grad_norm": 1.4670834757653342, "learning_rate": 6.434356687817838e-07, "loss": 0.5657, "step": 5522 }, { "epoch": 0.509560604313228, "grad_norm": 1.5841282771382648, "learning_rate": 6.432476034584531e-07, "loss": 0.7645, "step": 5523 }, { "epoch": 0.5096528658747549, "grad_norm": 1.9207897058346919, "learning_rate": 6.430595364814956e-07, "loss": 0.8245, "step": 5524 }, { "epoch": 0.5097451274362819, "grad_norm": 2.3186295825573913, "learning_rate": 6.428714678679543e-07, "loss": 0.7439, "step": 5525 }, { "epoch": 0.5097451274362819, "eval_GEN Loss": 0.4499998688697815, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3473503887653351, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8248196840286255, "eval_runtime": 56.9296, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5525 }, { "epoch": 0.5098373889978088, "grad_norm": 1.2970185486302632, "learning_rate": 6.426833976348726e-07, "loss": 0.555, "step": 5526 }, { "epoch": 0.5099296505593357, "grad_norm": 2.334326697141373, "learning_rate": 6.424953257992936e-07, "loss": 0.8017, "step": 5527 }, { "epoch": 0.5100219121208627, "grad_norm": 1.8268949908808656, "learning_rate": 6.423072523782607e-07, "loss": 0.7116, "step": 5528 }, { "epoch": 0.5101141736823895, "grad_norm": 2.2576600789486854, "learning_rate": 6.421191773888172e-07, "loss": 0.6376, "step": 5529 }, { "epoch": 0.5102064352439165, "grad_norm": 2.0860244379790207, "learning_rate": 6.419311008480069e-07, "loss": 0.5722, "step": 5530 }, { "epoch": 0.5102064352439165, "eval_GEN Loss": 0.45018523931503296, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.3397412598133087, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8337740302085876, "eval_runtime": 57.0132, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5530 }, { "epoch": 0.5102986968054435, "grad_norm": 2.3334572012891304, "learning_rate": 6.417430227728737e-07, "loss": 0.6888, "step": 5531 }, { "epoch": 0.5103909583669703, "grad_norm": 2.0782313393850473, "learning_rate": 6.415549431804615e-07, "loss": 0.9178, "step": 5532 }, { "epoch": 0.5104832199284973, "grad_norm": 3.701509730590314, "learning_rate": 6.413668620878142e-07, "loss": 0.9476, "step": 5533 }, { "epoch": 0.5105754814900242, "grad_norm": 2.29123925048228, "learning_rate": 6.41178779511976e-07, "loss": 0.7697, "step": 5534 }, { "epoch": 0.5106677430515512, "grad_norm": 3.85752465322228, "learning_rate": 6.409906954699916e-07, "loss": 0.8389, "step": 5535 }, { "epoch": 0.5106677430515512, "eval_GEN Loss": 0.4487907290458679, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.33559584617614746, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8372595906257629, "eval_runtime": 57.0055, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5535 }, { "epoch": 0.510760004613078, "grad_norm": 1.752149375982018, "learning_rate": 6.408026099789049e-07, "loss": 0.6794, "step": 5536 }, { "epoch": 0.510852266174605, "grad_norm": 1.3790445347795153, "learning_rate": 6.406145230557609e-07, "loss": 0.5255, "step": 5537 }, { "epoch": 0.510944527736132, "grad_norm": 2.39869035304379, "learning_rate": 6.404264347176042e-07, "loss": 0.7979, "step": 5538 }, { "epoch": 0.5110367892976588, "grad_norm": 2.7997027258934155, "learning_rate": 6.402383449814798e-07, "loss": 0.8222, "step": 5539 }, { "epoch": 0.5111290508591858, "grad_norm": 1.4659131805101937, "learning_rate": 6.400502538644327e-07, "loss": 0.7094, "step": 5540 }, { "epoch": 0.5111290508591858, "eval_GEN Loss": 0.4493500292301178, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM Loss": 0.34062618017196655, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.829026460647583, "eval_runtime": 56.8304, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 5540 }, { "epoch": 0.5112213124207127, "grad_norm": 1.2794880839490979, "learning_rate": 6.398621613835077e-07, "loss": 0.5279, "step": 5541 }, { "epoch": 0.5113135739822396, "grad_norm": 2.4163857723185598, "learning_rate": 6.396740675557503e-07, "loss": 0.6321, "step": 5542 }, { "epoch": 0.5114058355437666, "grad_norm": 1.0382322063609388, "learning_rate": 6.394859723982058e-07, "loss": 0.519, "step": 5543 }, { "epoch": 0.5114980971052935, "grad_norm": 1.1752987850621708, "learning_rate": 6.392978759279196e-07, "loss": 0.5174, "step": 5544 }, { "epoch": 0.5115903586668205, "grad_norm": 1.9828130987725483, "learning_rate": 6.391097781619376e-07, "loss": 0.849, "step": 5545 }, { "epoch": 0.5115903586668205, "eval_GEN Loss": 0.44957906007766724, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3486257493495941, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8239783644676208, "eval_runtime": 56.9608, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5545 }, { "epoch": 0.5116826202283473, "grad_norm": 2.438424757564112, "learning_rate": 6.389216791173053e-07, "loss": 0.8026, "step": 5546 }, { "epoch": 0.5117748817898743, "grad_norm": 1.3766106028845146, "learning_rate": 6.387335788110682e-07, "loss": 0.7202, "step": 5547 }, { "epoch": 0.5118671433514013, "grad_norm": 1.2040453164707638, "learning_rate": 6.385454772602728e-07, "loss": 0.4883, "step": 5548 }, { "epoch": 0.5119594049129281, "grad_norm": 2.159949522643694, "learning_rate": 6.383573744819649e-07, "loss": 0.814, "step": 5549 }, { "epoch": 0.5120516664744551, "grad_norm": 1.9671133219107375, "learning_rate": 6.381692704931907e-07, "loss": 0.6271, "step": 5550 }, { "epoch": 0.5120516664744551, "eval_GEN Loss": 0.45020103454589844, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.36207616329193115, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.81640625, "eval_runtime": 56.1098, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5550 }, { "epoch": 0.512143928035982, "grad_norm": 1.6012677752692825, "learning_rate": 6.379811653109964e-07, "loss": 0.6368, "step": 5551 }, { "epoch": 0.5122361895975089, "grad_norm": 2.729328183281446, "learning_rate": 6.377930589524285e-07, "loss": 0.945, "step": 5552 }, { "epoch": 0.5123284511590359, "grad_norm": 1.7024290035892686, "learning_rate": 6.376049514345336e-07, "loss": 0.5968, "step": 5553 }, { "epoch": 0.5124207127205628, "grad_norm": 1.4377785212625305, "learning_rate": 6.374168427743581e-07, "loss": 0.5447, "step": 5554 }, { "epoch": 0.5125129742820898, "grad_norm": 1.800579030235277, "learning_rate": 6.372287329889487e-07, "loss": 0.8086, "step": 5555 }, { "epoch": 0.5125129742820898, "eval_GEN Loss": 0.4504340887069702, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38055768609046936, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8148437738418579, "eval_runtime": 55.9571, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5555 }, { "epoch": 0.5126052358436166, "grad_norm": 2.190949721380559, "learning_rate": 6.370406220953524e-07, "loss": 0.6018, "step": 5556 }, { "epoch": 0.5126974974051436, "grad_norm": 2.997613400308788, "learning_rate": 6.368525101106157e-07, "loss": 0.8371, "step": 5557 }, { "epoch": 0.5127897589666706, "grad_norm": 1.8690606990755332, "learning_rate": 6.366643970517862e-07, "loss": 0.5643, "step": 5558 }, { "epoch": 0.5128820205281974, "grad_norm": 2.0842984372614817, "learning_rate": 6.364762829359104e-07, "loss": 0.5714, "step": 5559 }, { "epoch": 0.5129742820897244, "grad_norm": 1.80907274739727, "learning_rate": 6.36288167780036e-07, "loss": 0.7527, "step": 5560 }, { "epoch": 0.5129742820897244, "eval_GEN Loss": 0.4509964883327484, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.3895706236362457, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8137620091438293, "eval_runtime": 57.2505, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 5560 }, { "epoch": 0.5130665436512513, "grad_norm": 1.7309333813147096, "learning_rate": 6.361000516012099e-07, "loss": 0.7167, "step": 5561 }, { "epoch": 0.5131588052127782, "grad_norm": 2.360577003425649, "learning_rate": 6.359119344164798e-07, "loss": 0.7261, "step": 5562 }, { "epoch": 0.5132510667743052, "grad_norm": 1.5204859027336464, "learning_rate": 6.357238162428928e-07, "loss": 0.7074, "step": 5563 }, { "epoch": 0.5133433283358321, "grad_norm": 2.854270480324611, "learning_rate": 6.355356970974969e-07, "loss": 0.578, "step": 5564 }, { "epoch": 0.513435589897359, "grad_norm": 1.9389416902332974, "learning_rate": 6.353475769973396e-07, "loss": 0.756, "step": 5565 }, { "epoch": 0.513435589897359, "eval_GEN Loss": 0.4517325758934021, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.38177505135536194, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8161057829856873, "eval_runtime": 56.851, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5565 }, { "epoch": 0.5135278514588859, "grad_norm": 3.2059845571223695, "learning_rate": 6.351594559594683e-07, "loss": 0.8137, "step": 5566 }, { "epoch": 0.5136201130204129, "grad_norm": 2.0481359604254643, "learning_rate": 6.349713340009313e-07, "loss": 0.7393, "step": 5567 }, { "epoch": 0.5137123745819397, "grad_norm": 1.8176198630591178, "learning_rate": 6.347832111387764e-07, "loss": 0.6444, "step": 5568 }, { "epoch": 0.5138046361434667, "grad_norm": 1.5082516721554804, "learning_rate": 6.345950873900515e-07, "loss": 0.5779, "step": 5569 }, { "epoch": 0.5138968977049937, "grad_norm": 1.8177616897590998, "learning_rate": 6.344069627718045e-07, "loss": 0.7324, "step": 5570 }, { "epoch": 0.5138968977049937, "eval_GEN Loss": 0.45200106501579285, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3758385181427002, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.823317289352417, "eval_runtime": 56.7775, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 5570 }, { "epoch": 0.5139891592665206, "grad_norm": 1.7628144341053928, "learning_rate": 6.342188373010838e-07, "loss": 0.8149, "step": 5571 }, { "epoch": 0.5140814208280475, "grad_norm": 2.193866448841458, "learning_rate": 6.340307109949376e-07, "loss": 0.6098, "step": 5572 }, { "epoch": 0.5141736823895744, "grad_norm": 2.4931913894128535, "learning_rate": 6.33842583870414e-07, "loss": 0.69, "step": 5573 }, { "epoch": 0.5142659439511014, "grad_norm": 1.279292728085059, "learning_rate": 6.336544559445617e-07, "loss": 0.5862, "step": 5574 }, { "epoch": 0.5143582055126283, "grad_norm": 2.0749796720097287, "learning_rate": 6.33466327234429e-07, "loss": 0.9467, "step": 5575 }, { "epoch": 0.5143582055126283, "eval_GEN Loss": 0.45089322328567505, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.7815610267155579, "eval_PRM F1 Neg": 0.64, "eval_PRM Loss": 0.38205522298812866, "eval_PRM NPV": 0.5925925925925926, "eval_PRM Precision": 0.9113924050632911, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8253004550933838, "eval_runtime": 57.0586, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5575 }, { "epoch": 0.5144504670741552, "grad_norm": 2.0671302699336147, "learning_rate": 6.332781977570643e-07, "loss": 0.6596, "step": 5576 }, { "epoch": 0.5145427286356822, "grad_norm": 1.7768090913429462, "learning_rate": 6.330900675295163e-07, "loss": 0.7754, "step": 5577 }, { "epoch": 0.514634990197209, "grad_norm": 2.146394407793, "learning_rate": 6.329019365688337e-07, "loss": 0.8186, "step": 5578 }, { "epoch": 0.514727251758736, "grad_norm": 1.9415915314086902, "learning_rate": 6.327138048920651e-07, "loss": 0.7821, "step": 5579 }, { "epoch": 0.514819513320263, "grad_norm": 1.8815365723098438, "learning_rate": 6.325256725162594e-07, "loss": 0.6846, "step": 5580 }, { "epoch": 0.514819513320263, "eval_GEN Loss": 0.45208540558815, "eval_GEN top-5 accuracy": 0.981587023235423, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3875800669193268, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8299880027770996, "eval_runtime": 56.3753, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 5580 }, { "epoch": 0.5149117748817899, "grad_norm": 1.7610067241030218, "learning_rate": 6.323375394584655e-07, "loss": 0.5971, "step": 5581 }, { "epoch": 0.5150040364433168, "grad_norm": 3.3762997816149416, "learning_rate": 6.321494057357321e-07, "loss": 0.8156, "step": 5582 }, { "epoch": 0.5150962980048437, "grad_norm": 1.3010184945999592, "learning_rate": 6.319612713651082e-07, "loss": 0.5007, "step": 5583 }, { "epoch": 0.5151885595663707, "grad_norm": 3.0328871210350723, "learning_rate": 6.317731363636431e-07, "loss": 0.6655, "step": 5584 }, { "epoch": 0.5152808211278976, "grad_norm": 2.554672247276849, "learning_rate": 6.315850007483858e-07, "loss": 0.7718, "step": 5585 }, { "epoch": 0.5152808211278976, "eval_GEN Loss": 0.4522760808467865, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.39202845096588135, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8229567408561707, "eval_runtime": 56.0122, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5585 }, { "epoch": 0.5153730826894245, "grad_norm": 2.728341374212986, "learning_rate": 6.31396864536385e-07, "loss": 0.7697, "step": 5586 }, { "epoch": 0.5154653442509515, "grad_norm": 2.995123196624161, "learning_rate": 6.312087277446907e-07, "loss": 0.8681, "step": 5587 }, { "epoch": 0.5155576058124783, "grad_norm": 2.9963151211861554, "learning_rate": 6.310205903903514e-07, "loss": 0.7243, "step": 5588 }, { "epoch": 0.5156498673740053, "grad_norm": 1.5147748073683869, "learning_rate": 6.308324524904169e-07, "loss": 0.6985, "step": 5589 }, { "epoch": 0.5157421289355323, "grad_norm": 1.562184970972822, "learning_rate": 6.306443140619364e-07, "loss": 0.6763, "step": 5590 }, { "epoch": 0.5157421289355323, "eval_GEN Loss": 0.45302218198776245, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.3973682224750519, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8216947317123413, "eval_runtime": 55.873, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 5590 }, { "epoch": 0.5158343904970591, "grad_norm": 2.667370271614254, "learning_rate": 6.304561751219593e-07, "loss": 0.8548, "step": 5591 }, { "epoch": 0.5159266520585861, "grad_norm": 1.919672343966586, "learning_rate": 6.30268035687535e-07, "loss": 0.5, "step": 5592 }, { "epoch": 0.516018913620113, "grad_norm": 2.1326258719293167, "learning_rate": 6.300798957757129e-07, "loss": 0.6637, "step": 5593 }, { "epoch": 0.51611117518164, "grad_norm": 2.265612875007111, "learning_rate": 6.298917554035427e-07, "loss": 0.9586, "step": 5594 }, { "epoch": 0.5162034367431669, "grad_norm": 2.802531573896737, "learning_rate": 6.297036145880739e-07, "loss": 0.931, "step": 5595 }, { "epoch": 0.5162034367431669, "eval_GEN Loss": 0.4515702426433563, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3866071105003357, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.817187488079071, "eval_runtime": 56.0865, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 5595 }, { "epoch": 0.5162956983046938, "grad_norm": 1.7805559675752267, "learning_rate": 6.29515473346356e-07, "loss": 0.7103, "step": 5596 }, { "epoch": 0.5163879598662208, "grad_norm": 1.9536563480469293, "learning_rate": 6.29327331695439e-07, "loss": 0.5279, "step": 5597 }, { "epoch": 0.5164802214277476, "grad_norm": 2.045673286570409, "learning_rate": 6.291391896523723e-07, "loss": 0.7896, "step": 5598 }, { "epoch": 0.5165724829892746, "grad_norm": 2.018521118836675, "learning_rate": 6.289510472342059e-07, "loss": 0.6618, "step": 5599 }, { "epoch": 0.5166647445508015, "grad_norm": 1.6652476826743248, "learning_rate": 6.287629044579892e-07, "loss": 0.6751, "step": 5600 }, { "epoch": 0.5166647445508015, "eval_GEN Loss": 0.4510137736797333, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3820176124572754, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8142427802085876, "eval_runtime": 56.8185, "eval_samples_per_second": 1.144, "eval_steps_per_second": 0.088, "step": 5600 }, { "epoch": 0.5167570061123284, "grad_norm": 1.9637216730577067, "learning_rate": 6.285747613407722e-07, "loss": 0.5877, "step": 5601 }, { "epoch": 0.5168492676738554, "grad_norm": 1.7493501165465766, "learning_rate": 6.283866178996047e-07, "loss": 0.6261, "step": 5602 }, { "epoch": 0.5169415292353823, "grad_norm": 3.2223265324930694, "learning_rate": 6.281984741515367e-07, "loss": 0.7098, "step": 5603 }, { "epoch": 0.5170337907969093, "grad_norm": 2.2542153967230476, "learning_rate": 6.280103301136179e-07, "loss": 0.8691, "step": 5604 }, { "epoch": 0.5171260523584361, "grad_norm": 2.017571352226846, "learning_rate": 6.27822185802898e-07, "loss": 0.6609, "step": 5605 }, { "epoch": 0.5171260523584361, "eval_GEN Loss": 0.44986197352409363, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3664259910583496, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8082332015037537, "eval_runtime": 55.9941, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5605 }, { "epoch": 0.5172183139199631, "grad_norm": 1.653332353687636, "learning_rate": 6.276340412364275e-07, "loss": 0.7148, "step": 5606 }, { "epoch": 0.5173105754814901, "grad_norm": 2.1412779132315967, "learning_rate": 6.274458964312558e-07, "loss": 0.6256, "step": 5607 }, { "epoch": 0.5174028370430169, "grad_norm": 1.7865717124097864, "learning_rate": 6.272577514044333e-07, "loss": 0.657, "step": 5608 }, { "epoch": 0.5174950986045439, "grad_norm": 2.3124486455940576, "learning_rate": 6.270696061730096e-07, "loss": 0.6811, "step": 5609 }, { "epoch": 0.5175873601660708, "grad_norm": 1.792394071090575, "learning_rate": 6.26881460754035e-07, "loss": 0.6195, "step": 5610 }, { "epoch": 0.5175873601660708, "eval_GEN Loss": 0.44995149970054626, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3662834167480469, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8077524304389954, "eval_runtime": 57.1931, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 5610 }, { "epoch": 0.5176796217275977, "grad_norm": 1.365850519342223, "learning_rate": 6.266933151645595e-07, "loss": 0.6623, "step": 5611 }, { "epoch": 0.5177718832891247, "grad_norm": 1.9733858679541343, "learning_rate": 6.26505169421633e-07, "loss": 0.5847, "step": 5612 }, { "epoch": 0.5178641448506516, "grad_norm": 2.0408445009975495, "learning_rate": 6.263170235423059e-07, "loss": 0.714, "step": 5613 }, { "epoch": 0.5179564064121785, "grad_norm": 1.8887884959492431, "learning_rate": 6.26128877543628e-07, "loss": 0.7583, "step": 5614 }, { "epoch": 0.5180486679737054, "grad_norm": 2.199651138239929, "learning_rate": 6.259407314426495e-07, "loss": 0.8131, "step": 5615 }, { "epoch": 0.5180486679737054, "eval_GEN Loss": 0.44942745566368103, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3612017333507538, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8056490421295166, "eval_runtime": 56.7628, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 5615 }, { "epoch": 0.5181409295352324, "grad_norm": 1.8224479757920558, "learning_rate": 6.257525852564203e-07, "loss": 0.7793, "step": 5616 }, { "epoch": 0.5182331910967594, "grad_norm": 1.5272115285287886, "learning_rate": 6.255644390019908e-07, "loss": 0.6174, "step": 5617 }, { "epoch": 0.5183254526582862, "grad_norm": 2.104714243058201, "learning_rate": 6.253762926964106e-07, "loss": 0.6269, "step": 5618 }, { "epoch": 0.5184177142198132, "grad_norm": 1.8214137170033353, "learning_rate": 6.251881463567305e-07, "loss": 0.8563, "step": 5619 }, { "epoch": 0.5185099757813401, "grad_norm": 1.811520362916884, "learning_rate": 6.25e-07, "loss": 0.5518, "step": 5620 }, { "epoch": 0.5185099757813401, "eval_GEN Loss": 0.44915929436683655, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3626227378845215, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8056490421295166, "eval_runtime": 56.951, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5620 }, { "epoch": 0.518602237342867, "grad_norm": 2.185563533235991, "learning_rate": 6.248118536432699e-07, "loss": 0.6366, "step": 5621 }, { "epoch": 0.518694498904394, "grad_norm": 2.3601929412699096, "learning_rate": 6.246237073035895e-07, "loss": 0.7442, "step": 5622 }, { "epoch": 0.5187867604659209, "grad_norm": 1.8509913521511683, "learning_rate": 6.244355609980095e-07, "loss": 0.5279, "step": 5623 }, { "epoch": 0.5188790220274478, "grad_norm": 2.1703942248708454, "learning_rate": 6.2424741474358e-07, "loss": 0.5629, "step": 5624 }, { "epoch": 0.5189712835889747, "grad_norm": 1.5511299349136545, "learning_rate": 6.240592685573508e-07, "loss": 0.5111, "step": 5625 }, { "epoch": 0.5189712835889747, "eval_GEN Loss": 0.44853806495666504, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3579433858394623, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8096754550933838, "eval_runtime": 56.7337, "eval_samples_per_second": 1.146, "eval_steps_per_second": 0.088, "step": 5625 }, { "epoch": 0.5190635451505017, "grad_norm": 2.1764307988952774, "learning_rate": 6.238711224563721e-07, "loss": 0.6212, "step": 5626 }, { "epoch": 0.5191558067120287, "grad_norm": 3.0229395596908453, "learning_rate": 6.236829764576943e-07, "loss": 0.8748, "step": 5627 }, { "epoch": 0.5192480682735555, "grad_norm": 2.193575348479619, "learning_rate": 6.234948305783672e-07, "loss": 0.7321, "step": 5628 }, { "epoch": 0.5193403298350825, "grad_norm": 1.9159845463482639, "learning_rate": 6.233066848354406e-07, "loss": 0.714, "step": 5629 }, { "epoch": 0.5194325913966094, "grad_norm": 2.515014387627152, "learning_rate": 6.231185392459651e-07, "loss": 0.5745, "step": 5630 }, { "epoch": 0.5194325913966094, "eval_GEN Loss": 0.44816461205482483, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35256242752075195, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.813401460647583, "eval_runtime": 55.9386, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5630 }, { "epoch": 0.5195248529581363, "grad_norm": 2.353312659769086, "learning_rate": 6.229303938269906e-07, "loss": 0.7254, "step": 5631 }, { "epoch": 0.5196171145196632, "grad_norm": 3.0887371073165943, "learning_rate": 6.227422485955671e-07, "loss": 0.9305, "step": 5632 }, { "epoch": 0.5197093760811902, "grad_norm": 1.545183715123463, "learning_rate": 6.225541035687443e-07, "loss": 0.5989, "step": 5633 }, { "epoch": 0.5198016376427171, "grad_norm": 3.7002351126092563, "learning_rate": 6.223659587635727e-07, "loss": 0.8593, "step": 5634 }, { "epoch": 0.519893899204244, "grad_norm": 2.1868744891461276, "learning_rate": 6.221778141971022e-07, "loss": 0.8368, "step": 5635 }, { "epoch": 0.519893899204244, "eval_GEN Loss": 0.4479001760482788, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36158040165901184, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8096754550933838, "eval_runtime": 56.2073, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 5635 }, { "epoch": 0.519986160765771, "grad_norm": 3.491455969898752, "learning_rate": 6.219896698863824e-07, "loss": 1.0132, "step": 5636 }, { "epoch": 0.5200784223272978, "grad_norm": 1.4675490135707177, "learning_rate": 6.218015258484635e-07, "loss": 0.534, "step": 5637 }, { "epoch": 0.5201706838888248, "grad_norm": 1.3803056017483728, "learning_rate": 6.216133821003955e-07, "loss": 0.5972, "step": 5638 }, { "epoch": 0.5202629454503518, "grad_norm": 1.8219956732593308, "learning_rate": 6.214252386592279e-07, "loss": 0.7104, "step": 5639 }, { "epoch": 0.5203552070118787, "grad_norm": 1.705236224217243, "learning_rate": 6.21237095542011e-07, "loss": 0.6711, "step": 5640 }, { "epoch": 0.5203552070118787, "eval_GEN Loss": 0.44925791025161743, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3730471134185791, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8040865659713745, "eval_runtime": 55.9342, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5640 }, { "epoch": 0.5204474685734056, "grad_norm": 2.1894682341475895, "learning_rate": 6.210489527657943e-07, "loss": 0.6393, "step": 5641 }, { "epoch": 0.5205397301349325, "grad_norm": 1.8566644172680138, "learning_rate": 6.208608103476278e-07, "loss": 0.7625, "step": 5642 }, { "epoch": 0.5206319916964595, "grad_norm": 1.885313165199742, "learning_rate": 6.206726683045613e-07, "loss": 0.7362, "step": 5643 }, { "epoch": 0.5207242532579864, "grad_norm": 2.5670410461913256, "learning_rate": 6.20484526653644e-07, "loss": 0.5812, "step": 5644 }, { "epoch": 0.5208165148195133, "grad_norm": 2.155499238579875, "learning_rate": 6.202963854119263e-07, "loss": 0.7161, "step": 5645 }, { "epoch": 0.5208165148195133, "eval_GEN Loss": 0.44908007979393005, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.37322524189949036, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8021033406257629, "eval_runtime": 56.1309, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5645 }, { "epoch": 0.5209087763810403, "grad_norm": 1.8939059464587926, "learning_rate": 6.201082445964577e-07, "loss": 0.6238, "step": 5646 }, { "epoch": 0.5210010379425671, "grad_norm": 2.4029122565745595, "learning_rate": 6.199201042242872e-07, "loss": 0.6503, "step": 5647 }, { "epoch": 0.5210932995040941, "grad_norm": 1.841557252613327, "learning_rate": 6.197319643124652e-07, "loss": 0.6496, "step": 5648 }, { "epoch": 0.5211855610656211, "grad_norm": 1.759475031946073, "learning_rate": 6.195438248780409e-07, "loss": 0.6527, "step": 5649 }, { "epoch": 0.521277822627148, "grad_norm": 1.425641427875087, "learning_rate": 6.193556859380638e-07, "loss": 0.7285, "step": 5650 }, { "epoch": 0.521277822627148, "eval_GEN Loss": 0.44821837544441223, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3667643666267395, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8025240302085876, "eval_runtime": 55.8903, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 5650 }, { "epoch": 0.5213700841886749, "grad_norm": 2.1144584333435703, "learning_rate": 6.191675475095832e-07, "loss": 0.65, "step": 5651 }, { "epoch": 0.5214623457502018, "grad_norm": 1.5532272471346928, "learning_rate": 6.189794096096487e-07, "loss": 0.7759, "step": 5652 }, { "epoch": 0.5215546073117288, "grad_norm": 2.1058550625144554, "learning_rate": 6.187912722553096e-07, "loss": 0.6219, "step": 5653 }, { "epoch": 0.5216468688732557, "grad_norm": 1.9280558301189363, "learning_rate": 6.186031354636148e-07, "loss": 0.6299, "step": 5654 }, { "epoch": 0.5217391304347826, "grad_norm": 1.4535604894387755, "learning_rate": 6.184149992516144e-07, "loss": 0.6155, "step": 5655 }, { "epoch": 0.5217391304347826, "eval_GEN Loss": 0.44713133573532104, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3629145324230194, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8063101172447205, "eval_runtime": 56.1262, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5655 }, { "epoch": 0.5218313919963096, "grad_norm": 1.718167358485877, "learning_rate": 6.18226863636357e-07, "loss": 0.6541, "step": 5656 }, { "epoch": 0.5219236535578364, "grad_norm": 1.7420718281463405, "learning_rate": 6.18038728634892e-07, "loss": 0.672, "step": 5657 }, { "epoch": 0.5220159151193634, "grad_norm": 1.5743813410790881, "learning_rate": 6.17850594264268e-07, "loss": 0.6781, "step": 5658 }, { "epoch": 0.5221081766808904, "grad_norm": 2.0629198192353186, "learning_rate": 6.176624605415346e-07, "loss": 0.8087, "step": 5659 }, { "epoch": 0.5222004382424172, "grad_norm": 1.518011852171398, "learning_rate": 6.174743274837408e-07, "loss": 0.521, "step": 5660 }, { "epoch": 0.5222004382424172, "eval_GEN Loss": 0.4462627172470093, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3691242039203644, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8099759817123413, "eval_runtime": 56.1218, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5660 }, { "epoch": 0.5222926998039442, "grad_norm": 3.0851803218641813, "learning_rate": 6.17286195107935e-07, "loss": 0.6455, "step": 5661 }, { "epoch": 0.5223849613654711, "grad_norm": 1.6520356086691528, "learning_rate": 6.170980634311665e-07, "loss": 0.5738, "step": 5662 }, { "epoch": 0.522477222926998, "grad_norm": 1.7262882819182959, "learning_rate": 6.169099324704839e-07, "loss": 0.6839, "step": 5663 }, { "epoch": 0.5225694844885249, "grad_norm": 1.5900572390812744, "learning_rate": 6.16721802242936e-07, "loss": 0.6047, "step": 5664 }, { "epoch": 0.5226617460500519, "grad_norm": 2.0680992014279544, "learning_rate": 6.165336727655712e-07, "loss": 0.7454, "step": 5665 }, { "epoch": 0.5226617460500519, "eval_GEN Loss": 0.44633716344833374, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3699776530265808, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.80859375, "eval_runtime": 56.1143, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5665 }, { "epoch": 0.5227540076115789, "grad_norm": 2.060159878919546, "learning_rate": 6.163455440554385e-07, "loss": 0.5928, "step": 5666 }, { "epoch": 0.5228462691731057, "grad_norm": 3.415195227167983, "learning_rate": 6.161574161295861e-07, "loss": 0.7743, "step": 5667 }, { "epoch": 0.5229385307346327, "grad_norm": 1.4975987624650748, "learning_rate": 6.159692890050627e-07, "loss": 0.6378, "step": 5668 }, { "epoch": 0.5230307922961596, "grad_norm": 2.0273831365645836, "learning_rate": 6.157811626989163e-07, "loss": 0.6232, "step": 5669 }, { "epoch": 0.5231230538576865, "grad_norm": 2.2838012374139804, "learning_rate": 6.155930372281957e-07, "loss": 0.655, "step": 5670 }, { "epoch": 0.5231230538576865, "eval_GEN Loss": 0.4472615420818329, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.377178817987442, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.810276448726654, "eval_runtime": 56.1176, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5670 }, { "epoch": 0.5232153154192135, "grad_norm": 1.9160831330236083, "learning_rate": 6.154049126099488e-07, "loss": 0.5451, "step": 5671 }, { "epoch": 0.5233075769807404, "grad_norm": 2.0863378990869386, "learning_rate": 6.152167888612238e-07, "loss": 0.6438, "step": 5672 }, { "epoch": 0.5233998385422673, "grad_norm": 2.0256805825490933, "learning_rate": 6.150286659990688e-07, "loss": 0.6444, "step": 5673 }, { "epoch": 0.5234921001037942, "grad_norm": 2.0354097336710306, "learning_rate": 6.148405440405318e-07, "loss": 0.7875, "step": 5674 }, { "epoch": 0.5235843616653212, "grad_norm": 2.4234383493080487, "learning_rate": 6.146524230026607e-07, "loss": 0.7264, "step": 5675 }, { "epoch": 0.5235843616653212, "eval_GEN Loss": 0.4476272463798523, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37628740072250366, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8101261854171753, "eval_runtime": 57.107, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 5675 }, { "epoch": 0.5236766232268482, "grad_norm": 2.1739976963407726, "learning_rate": 6.144643029025032e-07, "loss": 0.5038, "step": 5676 }, { "epoch": 0.523768884788375, "grad_norm": 1.4638454884411112, "learning_rate": 6.142761837571074e-07, "loss": 0.5827, "step": 5677 }, { "epoch": 0.523861146349902, "grad_norm": 1.7031683469742596, "learning_rate": 6.140880655835206e-07, "loss": 0.7357, "step": 5678 }, { "epoch": 0.5239534079114289, "grad_norm": 1.3880413738333226, "learning_rate": 6.138999483987902e-07, "loss": 0.5763, "step": 5679 }, { "epoch": 0.5240456694729558, "grad_norm": 1.6944410741069569, "learning_rate": 6.137118322199642e-07, "loss": 0.7959, "step": 5680 }, { "epoch": 0.5240456694729558, "eval_GEN Loss": 0.4470641314983368, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3699677884578705, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8081730604171753, "eval_runtime": 56.9587, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5680 }, { "epoch": 0.5241379310344828, "grad_norm": 2.597280137950061, "learning_rate": 6.135237170640898e-07, "loss": 0.7004, "step": 5681 }, { "epoch": 0.5242301925960097, "grad_norm": 1.6785736449467181, "learning_rate": 6.133356029482141e-07, "loss": 0.7781, "step": 5682 }, { "epoch": 0.5243224541575366, "grad_norm": 1.9801822068209523, "learning_rate": 6.131474898893843e-07, "loss": 0.685, "step": 5683 }, { "epoch": 0.5244147157190635, "grad_norm": 1.7547107652923057, "learning_rate": 6.129593779046477e-07, "loss": 0.6499, "step": 5684 }, { "epoch": 0.5245069772805905, "grad_norm": 1.8841228991424999, "learning_rate": 6.127712670110515e-07, "loss": 0.658, "step": 5685 }, { "epoch": 0.5245069772805905, "eval_GEN Loss": 0.44818422198295593, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3633226752281189, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8136418461799622, "eval_runtime": 56.9391, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5685 }, { "epoch": 0.5245992388421175, "grad_norm": 1.458544269333822, "learning_rate": 6.12583157225642e-07, "loss": 0.6392, "step": 5686 }, { "epoch": 0.5246915004036443, "grad_norm": 2.4680354675994245, "learning_rate": 6.123950485654665e-07, "loss": 0.8198, "step": 5687 }, { "epoch": 0.5247837619651713, "grad_norm": 1.8455498008931657, "learning_rate": 6.122069410475716e-07, "loss": 0.8543, "step": 5688 }, { "epoch": 0.5248760235266982, "grad_norm": 2.6066753507019307, "learning_rate": 6.120188346890038e-07, "loss": 0.6644, "step": 5689 }, { "epoch": 0.5249682850882251, "grad_norm": 2.523782400474924, "learning_rate": 6.118307295068094e-07, "loss": 0.7155, "step": 5690 }, { "epoch": 0.5249682850882251, "eval_GEN Loss": 0.4477595388889313, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3545914888381958, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8121394515037537, "eval_runtime": 57.1749, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 5690 }, { "epoch": 0.5250605466497521, "grad_norm": 2.6921047352467165, "learning_rate": 6.116426255180352e-07, "loss": 0.7442, "step": 5691 }, { "epoch": 0.525152808211279, "grad_norm": 2.3867617250654933, "learning_rate": 6.114545227397274e-07, "loss": 0.7456, "step": 5692 }, { "epoch": 0.5252450697728059, "grad_norm": 1.5068535640348422, "learning_rate": 6.112664211889317e-07, "loss": 0.748, "step": 5693 }, { "epoch": 0.5253373313343328, "grad_norm": 2.324481744054839, "learning_rate": 6.110783208826949e-07, "loss": 0.7767, "step": 5694 }, { "epoch": 0.5254295928958598, "grad_norm": 3.725689281452816, "learning_rate": 6.108902218380625e-07, "loss": 0.9249, "step": 5695 }, { "epoch": 0.5254295928958598, "eval_GEN Loss": 0.44682958722114563, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34877315163612366, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8144230842590332, "eval_runtime": 57.5302, "eval_samples_per_second": 1.13, "eval_steps_per_second": 0.087, "step": 5695 }, { "epoch": 0.5255218544573866, "grad_norm": 1.8643512445831143, "learning_rate": 6.107021240720805e-07, "loss": 0.6782, "step": 5696 }, { "epoch": 0.5256141160189136, "grad_norm": 1.9355564664553877, "learning_rate": 6.105140276017943e-07, "loss": 0.7423, "step": 5697 }, { "epoch": 0.5257063775804406, "grad_norm": 2.0297188562063018, "learning_rate": 6.103259324442499e-07, "loss": 0.6299, "step": 5698 }, { "epoch": 0.5257986391419674, "grad_norm": 1.3524175387190998, "learning_rate": 6.101378386164926e-07, "loss": 0.6033, "step": 5699 }, { "epoch": 0.5258909007034944, "grad_norm": 1.7317991457456778, "learning_rate": 6.099497461355677e-07, "loss": 0.6756, "step": 5700 }, { "epoch": 0.5258909007034944, "eval_GEN Loss": 0.446855366230011, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3471384346485138, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8129807710647583, "eval_runtime": 56.8702, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5700 }, { "epoch": 0.5259831622650213, "grad_norm": 1.4107373642524215, "learning_rate": 6.097616550185203e-07, "loss": 0.7203, "step": 5701 }, { "epoch": 0.5260754238265483, "grad_norm": 1.7527544574193301, "learning_rate": 6.095735652823959e-07, "loss": 0.6839, "step": 5702 }, { "epoch": 0.5261676853880752, "grad_norm": 2.1407508007180254, "learning_rate": 6.093854769442394e-07, "loss": 0.6025, "step": 5703 }, { "epoch": 0.5262599469496021, "grad_norm": 2.5755348338338675, "learning_rate": 6.091973900210952e-07, "loss": 0.6072, "step": 5704 }, { "epoch": 0.5263522085111291, "grad_norm": 1.8491515696407166, "learning_rate": 6.090093045300087e-07, "loss": 0.6197, "step": 5705 }, { "epoch": 0.5263522085111291, "eval_GEN Loss": 0.4474896490573883, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3507747948169708, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8189904093742371, "eval_runtime": 56.9436, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5705 }, { "epoch": 0.5264444700726559, "grad_norm": 1.7322922104778524, "learning_rate": 6.088212204880242e-07, "loss": 0.655, "step": 5706 }, { "epoch": 0.5265367316341829, "grad_norm": 1.6643030458236585, "learning_rate": 6.086331379121861e-07, "loss": 0.6515, "step": 5707 }, { "epoch": 0.5266289931957099, "grad_norm": 1.497882866835344, "learning_rate": 6.084450568195387e-07, "loss": 0.6781, "step": 5708 }, { "epoch": 0.5267212547572367, "grad_norm": 1.955309052085084, "learning_rate": 6.082569772271264e-07, "loss": 0.6326, "step": 5709 }, { "epoch": 0.5268135163187637, "grad_norm": 2.345963826523206, "learning_rate": 6.080688991519933e-07, "loss": 0.7732, "step": 5710 }, { "epoch": 0.5268135163187637, "eval_GEN Loss": 0.44751062989234924, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35443076491355896, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8213341236114502, "eval_runtime": 56.8726, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5710 }, { "epoch": 0.5269057778802906, "grad_norm": 1.8182150813100464, "learning_rate": 6.078808226111829e-07, "loss": 0.6896, "step": 5711 }, { "epoch": 0.5269980394418176, "grad_norm": 1.8641763624767973, "learning_rate": 6.076927476217395e-07, "loss": 0.6248, "step": 5712 }, { "epoch": 0.5270903010033445, "grad_norm": 1.789839136246562, "learning_rate": 6.075046742007066e-07, "loss": 0.5831, "step": 5713 }, { "epoch": 0.5271825625648714, "grad_norm": 2.096662235467083, "learning_rate": 6.073166023651276e-07, "loss": 0.7889, "step": 5714 }, { "epoch": 0.5272748241263984, "grad_norm": 1.621292778138727, "learning_rate": 6.071285321320458e-07, "loss": 0.5716, "step": 5715 }, { "epoch": 0.5272748241263984, "eval_GEN Loss": 0.4473215639591217, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35942983627319336, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8171274065971375, "eval_runtime": 56.9846, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5715 }, { "epoch": 0.5273670856879252, "grad_norm": 1.9315921302226176, "learning_rate": 6.069404635185048e-07, "loss": 0.6666, "step": 5716 }, { "epoch": 0.5274593472494522, "grad_norm": 1.8199996052074006, "learning_rate": 6.067523965415473e-07, "loss": 0.754, "step": 5717 }, { "epoch": 0.5275516088109792, "grad_norm": 1.6836661886246906, "learning_rate": 6.065643312182163e-07, "loss": 0.7647, "step": 5718 }, { "epoch": 0.527643870372506, "grad_norm": 1.9268351900170428, "learning_rate": 6.063762675655546e-07, "loss": 0.7624, "step": 5719 }, { "epoch": 0.527736131934033, "grad_norm": 1.849418438677574, "learning_rate": 6.061882056006049e-07, "loss": 0.4525, "step": 5720 }, { "epoch": 0.527736131934033, "eval_GEN Loss": 0.44771870970726013, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36347728967666626, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8135216236114502, "eval_runtime": 57.2839, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 5720 }, { "epoch": 0.5278283934955599, "grad_norm": 1.7320491791104387, "learning_rate": 6.060001453404097e-07, "loss": 0.548, "step": 5721 }, { "epoch": 0.5279206550570869, "grad_norm": 1.9951754225076337, "learning_rate": 6.05812086802011e-07, "loss": 0.5727, "step": 5722 }, { "epoch": 0.5280129166186137, "grad_norm": 2.4438215882413323, "learning_rate": 6.056240300024515e-07, "loss": 0.7372, "step": 5723 }, { "epoch": 0.5281051781801407, "grad_norm": 1.939363484317739, "learning_rate": 6.054359749587729e-07, "loss": 0.718, "step": 5724 }, { "epoch": 0.5281974397416677, "grad_norm": 1.4720336140490862, "learning_rate": 6.052479216880169e-07, "loss": 0.54, "step": 5725 }, { "epoch": 0.5281974397416677, "eval_GEN Loss": 0.4486754834651947, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36356741189956665, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8061898946762085, "eval_runtime": 57.0205, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5725 }, { "epoch": 0.5282897013031945, "grad_norm": 1.7398843619257718, "learning_rate": 6.050598702072251e-07, "loss": 0.8212, "step": 5726 }, { "epoch": 0.5283819628647215, "grad_norm": 1.817823087540096, "learning_rate": 6.048718205334396e-07, "loss": 0.758, "step": 5727 }, { "epoch": 0.5284742244262484, "grad_norm": 1.6718176931202637, "learning_rate": 6.046837726837013e-07, "loss": 0.591, "step": 5728 }, { "epoch": 0.5285664859877753, "grad_norm": 2.2194718659056907, "learning_rate": 6.044957266750512e-07, "loss": 0.7563, "step": 5729 }, { "epoch": 0.5286587475493023, "grad_norm": 1.998589536082279, "learning_rate": 6.043076825245311e-07, "loss": 0.7235, "step": 5730 }, { "epoch": 0.5286587475493023, "eval_GEN Loss": 0.45001405477523804, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3605497479438782, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8070913553237915, "eval_runtime": 56.9351, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5730 }, { "epoch": 0.5287510091108292, "grad_norm": 1.5797622514308651, "learning_rate": 6.041196402491812e-07, "loss": 0.708, "step": 5731 }, { "epoch": 0.5288432706723561, "grad_norm": 1.7767464724482345, "learning_rate": 6.039315998660424e-07, "loss": 0.5511, "step": 5732 }, { "epoch": 0.528935532233883, "grad_norm": 1.4635738878862588, "learning_rate": 6.037435613921551e-07, "loss": 0.5709, "step": 5733 }, { "epoch": 0.52902779379541, "grad_norm": 1.7949522091167387, "learning_rate": 6.035555248445598e-07, "loss": 0.7175, "step": 5734 }, { "epoch": 0.529120055356937, "grad_norm": 1.8406474172508283, "learning_rate": 6.033674902402966e-07, "loss": 0.7284, "step": 5735 }, { "epoch": 0.529120055356937, "eval_GEN Loss": 0.4490952789783478, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.35529235005378723, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8025841116905212, "eval_runtime": 56.8543, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5735 }, { "epoch": 0.5292123169184638, "grad_norm": 2.381266353220206, "learning_rate": 6.031794575964052e-07, "loss": 0.5777, "step": 5736 }, { "epoch": 0.5293045784799908, "grad_norm": 1.3720134317235824, "learning_rate": 6.02991426929926e-07, "loss": 0.6821, "step": 5737 }, { "epoch": 0.5293968400415177, "grad_norm": 1.5182484460625396, "learning_rate": 6.028033982578984e-07, "loss": 0.5962, "step": 5738 }, { "epoch": 0.5294891016030446, "grad_norm": 3.0145687543454853, "learning_rate": 6.026153715973617e-07, "loss": 0.9278, "step": 5739 }, { "epoch": 0.5295813631645716, "grad_norm": 2.241435558193642, "learning_rate": 6.02427346965355e-07, "loss": 0.8217, "step": 5740 }, { "epoch": 0.5295813631645716, "eval_GEN Loss": 0.44902342557907104, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3520326018333435, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8015024065971375, "eval_runtime": 56.7576, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 5740 }, { "epoch": 0.5296736247260985, "grad_norm": 1.7420505960143153, "learning_rate": 6.022393243789179e-07, "loss": 0.596, "step": 5741 }, { "epoch": 0.5297658862876254, "grad_norm": 1.869893808868276, "learning_rate": 6.020513038550891e-07, "loss": 0.7341, "step": 5742 }, { "epoch": 0.5298581478491523, "grad_norm": 2.184481031946633, "learning_rate": 6.018632854109071e-07, "loss": 0.7259, "step": 5743 }, { "epoch": 0.5299504094106793, "grad_norm": 2.145416557903291, "learning_rate": 6.016752690634108e-07, "loss": 0.87, "step": 5744 }, { "epoch": 0.5300426709722063, "grad_norm": 2.169942648649425, "learning_rate": 6.014872548296382e-07, "loss": 0.8805, "step": 5745 }, { "epoch": 0.5300426709722063, "eval_GEN Loss": 0.4486738443374634, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3462068438529968, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8054086565971375, "eval_runtime": 56.9367, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5745 }, { "epoch": 0.5301349325337331, "grad_norm": 2.236037089142614, "learning_rate": 6.012992427266277e-07, "loss": 0.5588, "step": 5746 }, { "epoch": 0.5302271940952601, "grad_norm": 2.2147227169813246, "learning_rate": 6.011112327714168e-07, "loss": 0.6948, "step": 5747 }, { "epoch": 0.530319455656787, "grad_norm": 2.366155149816648, "learning_rate": 6.009232249810438e-07, "loss": 0.7951, "step": 5748 }, { "epoch": 0.5304117172183139, "grad_norm": 1.8560775159357397, "learning_rate": 6.007352193725461e-07, "loss": 0.6911, "step": 5749 }, { "epoch": 0.5305039787798409, "grad_norm": 3.2970550887055214, "learning_rate": 6.005472159629608e-07, "loss": 0.7461, "step": 5750 }, { "epoch": 0.5305039787798409, "eval_GEN Loss": 0.44901928305625916, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3462573289871216, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8114783763885498, "eval_runtime": 56.9881, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5750 }, { "epoch": 0.5305962403413678, "grad_norm": 1.7451012039764036, "learning_rate": 6.003592147693256e-07, "loss": 0.615, "step": 5751 }, { "epoch": 0.5306885019028947, "grad_norm": 2.26977785962814, "learning_rate": 6.00171215808677e-07, "loss": 0.895, "step": 5752 }, { "epoch": 0.5307807634644216, "grad_norm": 1.8594729806756736, "learning_rate": 5.999832190980519e-07, "loss": 0.7118, "step": 5753 }, { "epoch": 0.5308730250259486, "grad_norm": 2.2452222393231547, "learning_rate": 5.997952246544868e-07, "loss": 0.854, "step": 5754 }, { "epoch": 0.5309652865874754, "grad_norm": 1.9422433751007169, "learning_rate": 5.99607232495018e-07, "loss": 0.8577, "step": 5755 }, { "epoch": 0.5309652865874754, "eval_GEN Loss": 0.4490140378475189, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3522162139415741, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8158053159713745, "eval_runtime": 56.0704, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 5755 }, { "epoch": 0.5310575481490024, "grad_norm": 2.1212442160734217, "learning_rate": 5.99419242636682e-07, "loss": 0.7612, "step": 5756 }, { "epoch": 0.5311498097105294, "grad_norm": 2.608307663900946, "learning_rate": 5.992312550965145e-07, "loss": 0.7052, "step": 5757 }, { "epoch": 0.5312420712720562, "grad_norm": 2.01757353480641, "learning_rate": 5.990432698915511e-07, "loss": 0.6016, "step": 5758 }, { "epoch": 0.5313343328335832, "grad_norm": 2.051557517331167, "learning_rate": 5.988552870388276e-07, "loss": 0.7515, "step": 5759 }, { "epoch": 0.5314265943951101, "grad_norm": 2.0332137873504013, "learning_rate": 5.98667306555379e-07, "loss": 0.805, "step": 5760 }, { "epoch": 0.5314265943951101, "eval_GEN Loss": 0.44901716709136963, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3614150583744049, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8185096383094788, "eval_runtime": 56.8916, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5760 }, { "epoch": 0.5315188559566371, "grad_norm": 2.2849396580872896, "learning_rate": 5.984793284582404e-07, "loss": 0.6798, "step": 5761 }, { "epoch": 0.531611117518164, "grad_norm": 2.5956538204201545, "learning_rate": 5.98291352764447e-07, "loss": 0.737, "step": 5762 }, { "epoch": 0.5317033790796909, "grad_norm": 2.2958503043273604, "learning_rate": 5.981033794910334e-07, "loss": 0.7191, "step": 5763 }, { "epoch": 0.5317956406412179, "grad_norm": 2.0912968822548006, "learning_rate": 5.979154086550337e-07, "loss": 0.7131, "step": 5764 }, { "epoch": 0.5318879022027447, "grad_norm": 2.125094082732696, "learning_rate": 5.977274402734821e-07, "loss": 0.7405, "step": 5765 }, { "epoch": 0.5318879022027447, "eval_GEN Loss": 0.4495677947998047, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3589363396167755, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8227163553237915, "eval_runtime": 57.2607, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 5765 }, { "epoch": 0.5319801637642717, "grad_norm": 1.8986306783248967, "learning_rate": 5.97539474363413e-07, "loss": 0.7002, "step": 5766 }, { "epoch": 0.5320724253257987, "grad_norm": 2.173992977723716, "learning_rate": 5.973515109418599e-07, "loss": 0.798, "step": 5767 }, { "epoch": 0.5321646868873255, "grad_norm": 1.8995688328563411, "learning_rate": 5.971635500258564e-07, "loss": 0.5261, "step": 5768 }, { "epoch": 0.5322569484488525, "grad_norm": 3.116547203142588, "learning_rate": 5.969755916324359e-07, "loss": 0.6428, "step": 5769 }, { "epoch": 0.5323492100103794, "grad_norm": 1.6361694388606847, "learning_rate": 5.967876357786314e-07, "loss": 0.6034, "step": 5770 }, { "epoch": 0.5323492100103794, "eval_GEN Loss": 0.44854357838630676, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3534570634365082, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8248798251152039, "eval_runtime": 56.7899, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 5770 }, { "epoch": 0.5324414715719064, "grad_norm": 1.929079671069441, "learning_rate": 5.965996824814758e-07, "loss": 0.7486, "step": 5771 }, { "epoch": 0.5325337331334333, "grad_norm": 1.5037176039710862, "learning_rate": 5.964117317580014e-07, "loss": 0.4946, "step": 5772 }, { "epoch": 0.5326259946949602, "grad_norm": 2.0500265756050102, "learning_rate": 5.962237836252411e-07, "loss": 0.6373, "step": 5773 }, { "epoch": 0.5327182562564872, "grad_norm": 2.4155659808586383, "learning_rate": 5.960358381002268e-07, "loss": 0.6248, "step": 5774 }, { "epoch": 0.532810517818014, "grad_norm": 1.8259090943507035, "learning_rate": 5.958478951999903e-07, "loss": 0.4787, "step": 5775 }, { "epoch": 0.532810517818014, "eval_GEN Loss": 0.44915181398391724, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3575804829597473, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8309495449066162, "eval_runtime": 56.9522, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5775 }, { "epoch": 0.532902779379541, "grad_norm": 1.6688503695343222, "learning_rate": 5.956599549415636e-07, "loss": 0.6134, "step": 5776 }, { "epoch": 0.532995040941068, "grad_norm": 2.0285070799644607, "learning_rate": 5.954720173419779e-07, "loss": 0.8709, "step": 5777 }, { "epoch": 0.5330873025025948, "grad_norm": 2.286646154745885, "learning_rate": 5.952840824182646e-07, "loss": 0.5603, "step": 5778 }, { "epoch": 0.5331795640641218, "grad_norm": 2.5920431651317513, "learning_rate": 5.950961501874543e-07, "loss": 0.7312, "step": 5779 }, { "epoch": 0.5332718256256487, "grad_norm": 3.253211621068001, "learning_rate": 5.949082206665781e-07, "loss": 0.847, "step": 5780 }, { "epoch": 0.5332718256256487, "eval_GEN Loss": 0.4495263695716858, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35761889815330505, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8329627513885498, "eval_runtime": 56.9995, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5780 }, { "epoch": 0.5333640871871757, "grad_norm": 2.0171212678412522, "learning_rate": 5.947202938726662e-07, "loss": 0.6431, "step": 5781 }, { "epoch": 0.5334563487487026, "grad_norm": 3.884293815529922, "learning_rate": 5.945323698227488e-07, "loss": 0.9653, "step": 5782 }, { "epoch": 0.5335486103102295, "grad_norm": 3.069901926038726, "learning_rate": 5.943444485338562e-07, "loss": 0.8231, "step": 5783 }, { "epoch": 0.5336408718717565, "grad_norm": 1.6477164883371354, "learning_rate": 5.941565300230179e-07, "loss": 0.5645, "step": 5784 }, { "epoch": 0.5337331334332833, "grad_norm": 1.5732401708174348, "learning_rate": 5.939686143072635e-07, "loss": 0.4792, "step": 5785 }, { "epoch": 0.5337331334332833, "eval_GEN Loss": 0.4496711790561676, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36491459608078003, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.834885835647583, "eval_runtime": 57.124, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 5785 }, { "epoch": 0.5338253949948103, "grad_norm": 2.159350343234668, "learning_rate": 5.937807014036218e-07, "loss": 0.8087, "step": 5786 }, { "epoch": 0.5339176565563372, "grad_norm": 2.022540201729159, "learning_rate": 5.935927913291224e-07, "loss": 0.8175, "step": 5787 }, { "epoch": 0.5340099181178641, "grad_norm": 1.3657427602450478, "learning_rate": 5.934048841007936e-07, "loss": 0.506, "step": 5788 }, { "epoch": 0.5341021796793911, "grad_norm": 2.1907507235085335, "learning_rate": 5.93216979735664e-07, "loss": 0.7051, "step": 5789 }, { "epoch": 0.534194441240918, "grad_norm": 2.2315676549144308, "learning_rate": 5.930290782507616e-07, "loss": 0.7174, "step": 5790 }, { "epoch": 0.534194441240918, "eval_GEN Loss": 0.45041510462760925, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3696982264518738, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8388521671295166, "eval_runtime": 57.3495, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 5790 }, { "epoch": 0.534286702802445, "grad_norm": 1.8697648374865585, "learning_rate": 5.928411796631144e-07, "loss": 0.6783, "step": 5791 }, { "epoch": 0.5343789643639718, "grad_norm": 1.8503514910690493, "learning_rate": 5.926532839897502e-07, "loss": 0.6207, "step": 5792 }, { "epoch": 0.5344712259254988, "grad_norm": 2.6801405588766625, "learning_rate": 5.924653912476962e-07, "loss": 0.627, "step": 5793 }, { "epoch": 0.5345634874870258, "grad_norm": 3.1825256763236434, "learning_rate": 5.922775014539798e-07, "loss": 0.9072, "step": 5794 }, { "epoch": 0.5346557490485526, "grad_norm": 1.7219506544124317, "learning_rate": 5.920896146256278e-07, "loss": 0.6279, "step": 5795 }, { "epoch": 0.5346557490485526, "eval_GEN Loss": 0.4500353932380676, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3650282025337219, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8369591236114502, "eval_runtime": 57.0276, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 5795 }, { "epoch": 0.5347480106100796, "grad_norm": 2.0997850867493573, "learning_rate": 5.919017307796668e-07, "loss": 0.8179, "step": 5796 }, { "epoch": 0.5348402721716065, "grad_norm": 1.7155024057468957, "learning_rate": 5.917138499331226e-07, "loss": 0.682, "step": 5797 }, { "epoch": 0.5349325337331334, "grad_norm": 3.369350292484986, "learning_rate": 5.91525972103022e-07, "loss": 0.6307, "step": 5798 }, { "epoch": 0.5350247952946604, "grad_norm": 1.9060662169378466, "learning_rate": 5.913380973063905e-07, "loss": 0.8015, "step": 5799 }, { "epoch": 0.5351170568561873, "grad_norm": 1.3823874118563797, "learning_rate": 5.911502255602534e-07, "loss": 0.6224, "step": 5800 }, { "epoch": 0.5351170568561873, "eval_GEN Loss": 0.44995418190956116, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35996726155281067, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8368690013885498, "eval_runtime": 57.0841, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 5800 }, { "epoch": 0.5352093184177142, "grad_norm": 2.35608433866281, "learning_rate": 5.909623568816364e-07, "loss": 0.8382, "step": 5801 }, { "epoch": 0.5353015799792411, "grad_norm": 2.178332508287671, "learning_rate": 5.907744912875642e-07, "loss": 0.8333, "step": 5802 }, { "epoch": 0.5353938415407681, "grad_norm": 1.6363865875793884, "learning_rate": 5.905866287950615e-07, "loss": 0.6602, "step": 5803 }, { "epoch": 0.535486103102295, "grad_norm": 2.3679194535164663, "learning_rate": 5.903987694211525e-07, "loss": 0.5324, "step": 5804 }, { "epoch": 0.5355783646638219, "grad_norm": 1.4269772285775357, "learning_rate": 5.902109131828617e-07, "loss": 0.6942, "step": 5805 }, { "epoch": 0.5355783646638219, "eval_GEN Loss": 0.44862109422683716, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35410743951797485, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8402644395828247, "eval_runtime": 56.7546, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 5805 }, { "epoch": 0.5356706262253489, "grad_norm": 1.187229197901674, "learning_rate": 5.900230600972126e-07, "loss": 0.5, "step": 5806 }, { "epoch": 0.5357628877868758, "grad_norm": 2.6126308852165097, "learning_rate": 5.898352101812285e-07, "loss": 0.6575, "step": 5807 }, { "epoch": 0.5358551493484027, "grad_norm": 1.6207106668131552, "learning_rate": 5.896473634519334e-07, "loss": 0.6805, "step": 5808 }, { "epoch": 0.5359474109099297, "grad_norm": 3.4763261574642286, "learning_rate": 5.894595199263498e-07, "loss": 0.9343, "step": 5809 }, { "epoch": 0.5360396724714566, "grad_norm": 1.2154843556272092, "learning_rate": 5.892716796215005e-07, "loss": 0.5521, "step": 5810 }, { "epoch": 0.5360396724714566, "eval_GEN Loss": 0.4492841958999634, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3497515320777893, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8439303040504456, "eval_runtime": 56.88, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5810 }, { "epoch": 0.5361319340329835, "grad_norm": 2.0362083042463692, "learning_rate": 5.890838425544075e-07, "loss": 0.6058, "step": 5811 }, { "epoch": 0.5362241955945104, "grad_norm": 1.7922271102877259, "learning_rate": 5.888960087420935e-07, "loss": 0.794, "step": 5812 }, { "epoch": 0.5363164571560374, "grad_norm": 1.8033143585973566, "learning_rate": 5.887081782015801e-07, "loss": 0.6826, "step": 5813 }, { "epoch": 0.5364087187175643, "grad_norm": 3.465484882624158, "learning_rate": 5.885203509498886e-07, "loss": 0.8785, "step": 5814 }, { "epoch": 0.5365009802790912, "grad_norm": 1.2213065199221158, "learning_rate": 5.883325270040403e-07, "loss": 0.5525, "step": 5815 }, { "epoch": 0.5365009802790912, "eval_GEN Loss": 0.44950050115585327, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3496865928173065, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8412860631942749, "eval_runtime": 55.8233, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 5815 }, { "epoch": 0.5365932418406182, "grad_norm": 1.5078621356177477, "learning_rate": 5.881447063810562e-07, "loss": 0.6141, "step": 5816 }, { "epoch": 0.536685503402145, "grad_norm": 2.6540051968823186, "learning_rate": 5.879568890979568e-07, "loss": 0.8905, "step": 5817 }, { "epoch": 0.536777764963672, "grad_norm": 2.1017076090499756, "learning_rate": 5.877690751717622e-07, "loss": 0.7689, "step": 5818 }, { "epoch": 0.5368700265251989, "grad_norm": 2.5676515796809367, "learning_rate": 5.875812646194928e-07, "loss": 0.628, "step": 5819 }, { "epoch": 0.5369622880867259, "grad_norm": 2.558700944854717, "learning_rate": 5.873934574581681e-07, "loss": 0.8597, "step": 5820 }, { "epoch": 0.5369622880867259, "eval_GEN Loss": 0.4488917291164398, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3573242723941803, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8333232998847961, "eval_runtime": 56.2035, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5820 }, { "epoch": 0.5370545496482528, "grad_norm": 1.7296060586377249, "learning_rate": 5.872056537048076e-07, "loss": 0.7032, "step": 5821 }, { "epoch": 0.5371468112097797, "grad_norm": 2.042982232597957, "learning_rate": 5.870178533764298e-07, "loss": 0.6008, "step": 5822 }, { "epoch": 0.5372390727713067, "grad_norm": 1.8460714169958954, "learning_rate": 5.868300564900543e-07, "loss": 0.5413, "step": 5823 }, { "epoch": 0.5373313343328335, "grad_norm": 1.7553498878978515, "learning_rate": 5.866422630626992e-07, "loss": 0.513, "step": 5824 }, { "epoch": 0.5374235958943605, "grad_norm": 1.3498959361152614, "learning_rate": 5.864544731113824e-07, "loss": 0.5685, "step": 5825 }, { "epoch": 0.5374235958943605, "eval_GEN Loss": 0.4513486921787262, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36338549852371216, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.833984375, "eval_runtime": 56.0366, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5825 }, { "epoch": 0.5375158574558875, "grad_norm": 2.2869505167957227, "learning_rate": 5.862666866531221e-07, "loss": 0.6126, "step": 5826 }, { "epoch": 0.5376081190174143, "grad_norm": 1.5968139007917215, "learning_rate": 5.860789037049353e-07, "loss": 0.3845, "step": 5827 }, { "epoch": 0.5377003805789413, "grad_norm": 1.91353585550136, "learning_rate": 5.8589112428384e-07, "loss": 0.6511, "step": 5828 }, { "epoch": 0.5377926421404682, "grad_norm": 1.891338556897087, "learning_rate": 5.857033484068522e-07, "loss": 0.6921, "step": 5829 }, { "epoch": 0.5378849037019952, "grad_norm": 1.8616492129304043, "learning_rate": 5.855155760909889e-07, "loss": 0.8368, "step": 5830 }, { "epoch": 0.5378849037019952, "eval_GEN Loss": 0.4492308497428894, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3625842034816742, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8289362788200378, "eval_runtime": 56.1258, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 5830 }, { "epoch": 0.5379771652635221, "grad_norm": 2.571094152999237, "learning_rate": 5.853278073532664e-07, "loss": 0.8579, "step": 5831 }, { "epoch": 0.538069426825049, "grad_norm": 1.8896006678672719, "learning_rate": 5.851400422107001e-07, "loss": 0.6966, "step": 5832 }, { "epoch": 0.538161688386576, "grad_norm": 3.5021742978510044, "learning_rate": 5.849522806803062e-07, "loss": 0.9696, "step": 5833 }, { "epoch": 0.5382539499481028, "grad_norm": 1.741130386831645, "learning_rate": 5.847645227790996e-07, "loss": 0.7425, "step": 5834 }, { "epoch": 0.5383462115096298, "grad_norm": 1.8924611515179963, "learning_rate": 5.845767685240953e-07, "loss": 0.6614, "step": 5835 }, { "epoch": 0.5383462115096298, "eval_GEN Loss": 0.4495334327220917, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3609731197357178, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8343148827552795, "eval_runtime": 56.0003, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5835 }, { "epoch": 0.5384384730711568, "grad_norm": 2.168234072325096, "learning_rate": 5.843890179323076e-07, "loss": 0.7116, "step": 5836 }, { "epoch": 0.5385307346326836, "grad_norm": 2.0574000005009156, "learning_rate": 5.842012710207514e-07, "loss": 0.6794, "step": 5837 }, { "epoch": 0.5386229961942106, "grad_norm": 1.4600699649291664, "learning_rate": 5.8401352780644e-07, "loss": 0.5891, "step": 5838 }, { "epoch": 0.5387152577557375, "grad_norm": 2.8078433257444084, "learning_rate": 5.838257883063874e-07, "loss": 0.8644, "step": 5839 }, { "epoch": 0.5388075193172644, "grad_norm": 2.8492107997215825, "learning_rate": 5.836380525376066e-07, "loss": 0.8936, "step": 5840 }, { "epoch": 0.5388075193172644, "eval_GEN Loss": 0.44970762729644775, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36723437905311584, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8362680077552795, "eval_runtime": 55.8671, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 5840 }, { "epoch": 0.5388997808787914, "grad_norm": 1.7903759914514972, "learning_rate": 5.834503205171106e-07, "loss": 0.6512, "step": 5841 }, { "epoch": 0.5389920424403183, "grad_norm": 2.2846497136013304, "learning_rate": 5.83262592261912e-07, "loss": 0.6903, "step": 5842 }, { "epoch": 0.5390843040018453, "grad_norm": 1.4552474440027527, "learning_rate": 5.830748677890227e-07, "loss": 0.5684, "step": 5843 }, { "epoch": 0.5391765655633721, "grad_norm": 2.246475236276283, "learning_rate": 5.828871471154552e-07, "loss": 0.6462, "step": 5844 }, { "epoch": 0.5392688271248991, "grad_norm": 2.1444854072494937, "learning_rate": 5.826994302582205e-07, "loss": 0.8818, "step": 5845 }, { "epoch": 0.5392688271248991, "eval_GEN Loss": 0.4487519860267639, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3712630271911621, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8394230604171753, "eval_runtime": 55.756, "eval_samples_per_second": 1.166, "eval_steps_per_second": 0.09, "step": 5845 }, { "epoch": 0.5393610886864261, "grad_norm": 1.9498300362717798, "learning_rate": 5.825117172343303e-07, "loss": 0.5679, "step": 5846 }, { "epoch": 0.5394533502479529, "grad_norm": 2.801527726289478, "learning_rate": 5.823240080607947e-07, "loss": 1.0734, "step": 5847 }, { "epoch": 0.5395456118094799, "grad_norm": 1.6007312373121423, "learning_rate": 5.82136302754625e-07, "loss": 0.5516, "step": 5848 }, { "epoch": 0.5396378733710068, "grad_norm": 1.8295705655773762, "learning_rate": 5.81948601332831e-07, "loss": 0.7105, "step": 5849 }, { "epoch": 0.5397301349325337, "grad_norm": 1.832811874605488, "learning_rate": 5.817609038124224e-07, "loss": 0.6583, "step": 5850 }, { "epoch": 0.5397301349325337, "eval_GEN Loss": 0.4473370313644409, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3632742464542389, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8364182710647583, "eval_runtime": 56.0348, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5850 }, { "epoch": 0.5398223964940606, "grad_norm": 1.6692405513644966, "learning_rate": 5.815732102104088e-07, "loss": 0.5819, "step": 5851 }, { "epoch": 0.5399146580555876, "grad_norm": 1.8658434414049225, "learning_rate": 5.813855205437993e-07, "loss": 0.4917, "step": 5852 }, { "epoch": 0.5400069196171146, "grad_norm": 1.7207831733650945, "learning_rate": 5.811978348296027e-07, "loss": 0.6201, "step": 5853 }, { "epoch": 0.5400991811786414, "grad_norm": 2.8815873517511426, "learning_rate": 5.810101530848268e-07, "loss": 0.9138, "step": 5854 }, { "epoch": 0.5401914427401684, "grad_norm": 2.2257714769161487, "learning_rate": 5.808224753264805e-07, "loss": 0.8249, "step": 5855 }, { "epoch": 0.5401914427401684, "eval_GEN Loss": 0.44589003920555115, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35213279724121094, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8349759578704834, "eval_runtime": 55.9731, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5855 }, { "epoch": 0.5402837043016953, "grad_norm": 1.2100988984440277, "learning_rate": 5.806348015715709e-07, "loss": 0.706, "step": 5856 }, { "epoch": 0.5403759658632222, "grad_norm": 1.698129884245249, "learning_rate": 5.804471318371051e-07, "loss": 0.7055, "step": 5857 }, { "epoch": 0.5404682274247492, "grad_norm": 2.619703535217051, "learning_rate": 5.802594661400907e-07, "loss": 0.6769, "step": 5858 }, { "epoch": 0.5405604889862761, "grad_norm": 1.7699485900799037, "learning_rate": 5.80071804497534e-07, "loss": 0.6622, "step": 5859 }, { "epoch": 0.540652750547803, "grad_norm": 2.309559162457744, "learning_rate": 5.798841469264409e-07, "loss": 0.5949, "step": 5860 }, { "epoch": 0.540652750547803, "eval_GEN Loss": 0.44504597783088684, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3445006012916565, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8394832015037537, "eval_runtime": 55.9423, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5860 }, { "epoch": 0.5407450121093299, "grad_norm": 1.6542999443104147, "learning_rate": 5.796964934438174e-07, "loss": 0.5125, "step": 5861 }, { "epoch": 0.5408372736708569, "grad_norm": 1.5294429308461062, "learning_rate": 5.79508844066669e-07, "loss": 0.5527, "step": 5862 }, { "epoch": 0.5409295352323839, "grad_norm": 1.7583389186282403, "learning_rate": 5.793211988120008e-07, "loss": 0.4997, "step": 5863 }, { "epoch": 0.5410217967939107, "grad_norm": 2.306804594803944, "learning_rate": 5.791335576968173e-07, "loss": 0.8097, "step": 5864 }, { "epoch": 0.5411140583554377, "grad_norm": 2.457145396180528, "learning_rate": 5.789459207381233e-07, "loss": 0.8116, "step": 5865 }, { "epoch": 0.5411140583554377, "eval_GEN Loss": 0.4447591304779053, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34254494309425354, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8518930077552795, "eval_runtime": 56.0103, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5865 }, { "epoch": 0.5412063199169646, "grad_norm": 2.077934589800638, "learning_rate": 5.787582879529223e-07, "loss": 0.7785, "step": 5866 }, { "epoch": 0.5412985814784915, "grad_norm": 1.730693960858954, "learning_rate": 5.785706593582181e-07, "loss": 0.7028, "step": 5867 }, { "epoch": 0.5413908430400185, "grad_norm": 2.3960705665100015, "learning_rate": 5.783830349710135e-07, "loss": 0.6702, "step": 5868 }, { "epoch": 0.5414831046015454, "grad_norm": 1.1834348125804082, "learning_rate": 5.781954148083119e-07, "loss": 0.4839, "step": 5869 }, { "epoch": 0.5415753661630723, "grad_norm": 2.2348809628726416, "learning_rate": 5.780077988871155e-07, "loss": 0.6838, "step": 5870 }, { "epoch": 0.5415753661630723, "eval_GEN Loss": 0.44599902629852295, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3459123969078064, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8465144038200378, "eval_runtime": 56.2024, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5870 }, { "epoch": 0.5416676277245992, "grad_norm": 1.4430423251394537, "learning_rate": 5.778201872244261e-07, "loss": 0.6564, "step": 5871 }, { "epoch": 0.5417598892861262, "grad_norm": 2.2144189461984745, "learning_rate": 5.776325798372459e-07, "loss": 0.7379, "step": 5872 }, { "epoch": 0.5418521508476531, "grad_norm": 1.9048207532471055, "learning_rate": 5.77444976742576e-07, "loss": 0.7886, "step": 5873 }, { "epoch": 0.54194441240918, "grad_norm": 1.3655512990609937, "learning_rate": 5.772573779574168e-07, "loss": 0.529, "step": 5874 }, { "epoch": 0.542036673970707, "grad_norm": 3.32815742817519, "learning_rate": 5.770697834987693e-07, "loss": 0.7706, "step": 5875 }, { "epoch": 0.542036673970707, "eval_GEN Loss": 0.4469482898712158, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3520021140575409, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.838161051273346, "eval_runtime": 55.9422, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5875 }, { "epoch": 0.5421289355322338, "grad_norm": 1.9093630248157234, "learning_rate": 5.768821933836335e-07, "loss": 0.7118, "step": 5876 }, { "epoch": 0.5422211970937608, "grad_norm": 2.242118986881792, "learning_rate": 5.766946076290091e-07, "loss": 0.6852, "step": 5877 }, { "epoch": 0.5423134586552878, "grad_norm": 1.5933188808348442, "learning_rate": 5.765070262518954e-07, "loss": 0.8524, "step": 5878 }, { "epoch": 0.5424057202168147, "grad_norm": 1.6438611105854315, "learning_rate": 5.76319449269291e-07, "loss": 0.3954, "step": 5879 }, { "epoch": 0.5424979817783416, "grad_norm": 1.830068719330009, "learning_rate": 5.761318766981951e-07, "loss": 0.5091, "step": 5880 }, { "epoch": 0.5424979817783416, "eval_GEN Loss": 0.44753319025039673, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.37153053283691406, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8378005027770996, "eval_runtime": 56.18, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5880 }, { "epoch": 0.5425902433398685, "grad_norm": 2.041701874548551, "learning_rate": 5.759443085556053e-07, "loss": 0.7693, "step": 5881 }, { "epoch": 0.5426825049013955, "grad_norm": 1.7611823619981535, "learning_rate": 5.757567448585193e-07, "loss": 0.5624, "step": 5882 }, { "epoch": 0.5427747664629223, "grad_norm": 2.0587695602270566, "learning_rate": 5.755691856239348e-07, "loss": 0.7191, "step": 5883 }, { "epoch": 0.5428670280244493, "grad_norm": 1.7069660611813369, "learning_rate": 5.753816308688486e-07, "loss": 0.6198, "step": 5884 }, { "epoch": 0.5429592895859763, "grad_norm": 1.7941907591026522, "learning_rate": 5.75194080610257e-07, "loss": 0.781, "step": 5885 }, { "epoch": 0.5429592895859763, "eval_GEN Loss": 0.44858518242836, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.38808637857437134, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8452824354171753, "eval_runtime": 56.0376, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5885 }, { "epoch": 0.5430515511475031, "grad_norm": 2.2689765690278403, "learning_rate": 5.750065348651562e-07, "loss": 0.805, "step": 5886 }, { "epoch": 0.5431438127090301, "grad_norm": 3.278457817746423, "learning_rate": 5.74818993650542e-07, "loss": 0.5718, "step": 5887 }, { "epoch": 0.543236074270557, "grad_norm": 2.4166789642472986, "learning_rate": 5.746314569834094e-07, "loss": 0.7728, "step": 5888 }, { "epoch": 0.543328335832084, "grad_norm": 2.1436619101488734, "learning_rate": 5.744439248807534e-07, "loss": 0.7365, "step": 5889 }, { "epoch": 0.5434205973936109, "grad_norm": 2.18272910823413, "learning_rate": 5.742563973595687e-07, "loss": 0.7512, "step": 5890 }, { "epoch": 0.5434205973936109, "eval_GEN Loss": 0.4484110176563263, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.393480509519577, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8490685224533081, "eval_runtime": 55.9868, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5890 }, { "epoch": 0.5435128589551378, "grad_norm": 3.2015430040906003, "learning_rate": 5.740688744368492e-07, "loss": 0.7141, "step": 5891 }, { "epoch": 0.5436051205166648, "grad_norm": 1.7128664378571286, "learning_rate": 5.738813561295884e-07, "loss": 0.8139, "step": 5892 }, { "epoch": 0.5436973820781916, "grad_norm": 2.4040058954259362, "learning_rate": 5.736938424547793e-07, "loss": 0.6409, "step": 5893 }, { "epoch": 0.5437896436397186, "grad_norm": 1.4792311094040151, "learning_rate": 5.735063334294152e-07, "loss": 0.4885, "step": 5894 }, { "epoch": 0.5438819052012456, "grad_norm": 2.0374759322125473, "learning_rate": 5.733188290704883e-07, "loss": 0.9515, "step": 5895 }, { "epoch": 0.5438819052012456, "eval_GEN Loss": 0.44808119535446167, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.3932257294654846, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8500300645828247, "eval_runtime": 56.0933, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 5895 }, { "epoch": 0.5439741667627724, "grad_norm": 3.381129966694147, "learning_rate": 5.731313293949902e-07, "loss": 0.948, "step": 5896 }, { "epoch": 0.5440664283242994, "grad_norm": 2.7614117380323604, "learning_rate": 5.729438344199129e-07, "loss": 0.9092, "step": 5897 }, { "epoch": 0.5441586898858263, "grad_norm": 1.973666722799482, "learning_rate": 5.727563441622472e-07, "loss": 0.6649, "step": 5898 }, { "epoch": 0.5442509514473532, "grad_norm": 2.043219743131938, "learning_rate": 5.725688586389838e-07, "loss": 0.5562, "step": 5899 }, { "epoch": 0.5443432130088802, "grad_norm": 2.4122978384708955, "learning_rate": 5.723813778671128e-07, "loss": 0.7516, "step": 5900 }, { "epoch": 0.5443432130088802, "eval_GEN Loss": 0.44781965017318726, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.36976659297943115, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8394832015037537, "eval_runtime": 56.0757, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 5900 }, { "epoch": 0.5444354745704071, "grad_norm": 2.374421554894921, "learning_rate": 5.721939018636244e-07, "loss": 0.9465, "step": 5901 }, { "epoch": 0.5445277361319341, "grad_norm": 2.339227461952067, "learning_rate": 5.720064306455078e-07, "loss": 0.6834, "step": 5902 }, { "epoch": 0.5446199976934609, "grad_norm": 1.8784667042528662, "learning_rate": 5.718189642297515e-07, "loss": 0.6775, "step": 5903 }, { "epoch": 0.5447122592549879, "grad_norm": 1.6559652186582885, "learning_rate": 5.716315026333446e-07, "loss": 0.6507, "step": 5904 }, { "epoch": 0.5448045208165149, "grad_norm": 1.887604593672403, "learning_rate": 5.71444045873275e-07, "loss": 0.6071, "step": 5905 }, { "epoch": 0.5448045208165149, "eval_GEN Loss": 0.44712576270103455, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3517681658267975, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8367487788200378, "eval_runtime": 55.9933, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5905 }, { "epoch": 0.5448967823780417, "grad_norm": 1.6813905041198745, "learning_rate": 5.712565939665303e-07, "loss": 0.4468, "step": 5906 }, { "epoch": 0.5449890439395687, "grad_norm": 1.5723308832344287, "learning_rate": 5.710691469300974e-07, "loss": 0.5918, "step": 5907 }, { "epoch": 0.5450813055010956, "grad_norm": 2.3579866883057403, "learning_rate": 5.708817047809633e-07, "loss": 0.8553, "step": 5908 }, { "epoch": 0.5451735670626225, "grad_norm": 1.3807209312330326, "learning_rate": 5.706942675361146e-07, "loss": 0.662, "step": 5909 }, { "epoch": 0.5452658286241495, "grad_norm": 1.9656511128933696, "learning_rate": 5.705068352125368e-07, "loss": 0.7186, "step": 5910 }, { "epoch": 0.5452658286241495, "eval_GEN Loss": 0.4472618103027344, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33864954113960266, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8422476053237915, "eval_runtime": 55.9862, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5910 }, { "epoch": 0.5453580901856764, "grad_norm": 2.0814156481361756, "learning_rate": 5.703194078272151e-07, "loss": 0.6847, "step": 5911 }, { "epoch": 0.5454503517472034, "grad_norm": 1.3684798761856496, "learning_rate": 5.701319853971349e-07, "loss": 0.6962, "step": 5912 }, { "epoch": 0.5455426133087302, "grad_norm": 1.8381859440718178, "learning_rate": 5.699445679392807e-07, "loss": 0.7173, "step": 5913 }, { "epoch": 0.5456348748702572, "grad_norm": 2.4182662626836153, "learning_rate": 5.69757155470636e-07, "loss": 0.6502, "step": 5914 }, { "epoch": 0.545727136431784, "grad_norm": 1.9404722611797978, "learning_rate": 5.695697480081852e-07, "loss": 0.7367, "step": 5915 }, { "epoch": 0.545727136431784, "eval_GEN Loss": 0.4479016959667206, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3343588709831238, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8481370210647583, "eval_runtime": 56.9626, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 5915 }, { "epoch": 0.545819397993311, "grad_norm": 3.0723257564109594, "learning_rate": 5.693823455689109e-07, "loss": 0.8472, "step": 5916 }, { "epoch": 0.545911659554838, "grad_norm": 1.9411256025651027, "learning_rate": 5.691949481697961e-07, "loss": 0.5828, "step": 5917 }, { "epoch": 0.5460039211163649, "grad_norm": 1.8921361109903005, "learning_rate": 5.690075558278227e-07, "loss": 0.6803, "step": 5918 }, { "epoch": 0.5460961826778918, "grad_norm": 2.2496111337983757, "learning_rate": 5.688201685599729e-07, "loss": 0.793, "step": 5919 }, { "epoch": 0.5461884442394187, "grad_norm": 1.8078423760732314, "learning_rate": 5.68632786383228e-07, "loss": 0.6525, "step": 5920 }, { "epoch": 0.5461884442394187, "eval_GEN Loss": 0.4489862322807312, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.333961546421051, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8525841236114502, "eval_runtime": 56.8479, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5920 }, { "epoch": 0.5462807058009457, "grad_norm": 2.0360558898865846, "learning_rate": 5.684454093145685e-07, "loss": 0.7341, "step": 5921 }, { "epoch": 0.5463729673624727, "grad_norm": 1.1024946210754787, "learning_rate": 5.682580373709751e-07, "loss": 0.4145, "step": 5922 }, { "epoch": 0.5464652289239995, "grad_norm": 1.5037024982579847, "learning_rate": 5.680706705694277e-07, "loss": 0.4828, "step": 5923 }, { "epoch": 0.5465574904855265, "grad_norm": 2.2296616694317986, "learning_rate": 5.678833089269057e-07, "loss": 0.8301, "step": 5924 }, { "epoch": 0.5466497520470533, "grad_norm": 1.9959925646373031, "learning_rate": 5.67695952460388e-07, "loss": 0.7227, "step": 5925 }, { "epoch": 0.5466497520470533, "eval_GEN Loss": 0.44770190119743347, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33407172560691833, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8475360870361328, "eval_runtime": 56.9319, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 5925 }, { "epoch": 0.5467420136085803, "grad_norm": 2.4412682604192164, "learning_rate": 5.675086011868535e-07, "loss": 0.8843, "step": 5926 }, { "epoch": 0.5468342751701073, "grad_norm": 1.9790099098668692, "learning_rate": 5.673212551232801e-07, "loss": 0.6782, "step": 5927 }, { "epoch": 0.5469265367316342, "grad_norm": 2.2539325443867777, "learning_rate": 5.67133914286645e-07, "loss": 0.6641, "step": 5928 }, { "epoch": 0.5470187982931611, "grad_norm": 2.141712247738704, "learning_rate": 5.66946578693926e-07, "loss": 0.7671, "step": 5929 }, { "epoch": 0.547111059854688, "grad_norm": 1.5253266255169893, "learning_rate": 5.667592483620994e-07, "loss": 0.6135, "step": 5930 }, { "epoch": 0.547111059854688, "eval_GEN Loss": 0.4468701481819153, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3375617563724518, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8463942408561707, "eval_runtime": 57.2972, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 5930 }, { "epoch": 0.547203321416215, "grad_norm": 1.7253304046639926, "learning_rate": 5.665719233081413e-07, "loss": 0.6649, "step": 5931 }, { "epoch": 0.547295582977742, "grad_norm": 1.595564373276263, "learning_rate": 5.663846035490274e-07, "loss": 0.5896, "step": 5932 }, { "epoch": 0.5473878445392688, "grad_norm": 2.4702824804649817, "learning_rate": 5.661972891017332e-07, "loss": 0.8518, "step": 5933 }, { "epoch": 0.5474801061007958, "grad_norm": 2.199668788622321, "learning_rate": 5.660099799832331e-07, "loss": 0.7809, "step": 5934 }, { "epoch": 0.5475723676623226, "grad_norm": 1.5215934626891463, "learning_rate": 5.658226762105015e-07, "loss": 0.6241, "step": 5935 }, { "epoch": 0.5475723676623226, "eval_GEN Loss": 0.4466407597064972, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.337177574634552, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8424879908561707, "eval_runtime": 56.8618, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 5935 }, { "epoch": 0.5476646292238496, "grad_norm": 2.748193508265221, "learning_rate": 5.656353778005119e-07, "loss": 0.7088, "step": 5936 }, { "epoch": 0.5477568907853766, "grad_norm": 1.7045158818288686, "learning_rate": 5.65448084770238e-07, "loss": 0.6149, "step": 5937 }, { "epoch": 0.5478491523469035, "grad_norm": 2.458701116183841, "learning_rate": 5.652607971366526e-07, "loss": 0.8346, "step": 5938 }, { "epoch": 0.5479414139084304, "grad_norm": 1.687590522635232, "learning_rate": 5.650735149167273e-07, "loss": 0.5871, "step": 5939 }, { "epoch": 0.5480336754699573, "grad_norm": 1.3873017790874902, "learning_rate": 5.648862381274348e-07, "loss": 0.5166, "step": 5940 }, { "epoch": 0.5480336754699573, "eval_GEN Loss": 0.4463694393634796, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33818763494491577, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8337740302085876, "eval_runtime": 56.0166, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5940 }, { "epoch": 0.5481259370314843, "grad_norm": 1.6942534021175686, "learning_rate": 5.646989667857459e-07, "loss": 0.6408, "step": 5941 }, { "epoch": 0.5482181985930112, "grad_norm": 1.6770076082916041, "learning_rate": 5.645117009086317e-07, "loss": 0.7246, "step": 5942 }, { "epoch": 0.5483104601545381, "grad_norm": 2.434288482782804, "learning_rate": 5.64324440513062e-07, "loss": 0.7541, "step": 5943 }, { "epoch": 0.5484027217160651, "grad_norm": 1.862012350595842, "learning_rate": 5.641371856160073e-07, "loss": 0.6902, "step": 5944 }, { "epoch": 0.5484949832775919, "grad_norm": 2.6184733278917465, "learning_rate": 5.639499362344366e-07, "loss": 0.7438, "step": 5945 }, { "epoch": 0.5484949832775919, "eval_GEN Loss": 0.44770586490631104, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3460562229156494, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8347055315971375, "eval_runtime": 56.1034, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 5945 }, { "epoch": 0.5485872448391189, "grad_norm": 1.2641863896800023, "learning_rate": 5.637626923853187e-07, "loss": 0.5491, "step": 5946 }, { "epoch": 0.5486795064006458, "grad_norm": 1.832971276065754, "learning_rate": 5.635754540856221e-07, "loss": 0.5571, "step": 5947 }, { "epoch": 0.5487717679621728, "grad_norm": 1.6925930309539023, "learning_rate": 5.633882213523145e-07, "loss": 0.5752, "step": 5948 }, { "epoch": 0.5488640295236997, "grad_norm": 2.2162283470213247, "learning_rate": 5.632009942023633e-07, "loss": 0.8185, "step": 5949 }, { "epoch": 0.5489562910852266, "grad_norm": 1.9458069112234833, "learning_rate": 5.630137726527351e-07, "loss": 0.7051, "step": 5950 }, { "epoch": 0.5489562910852266, "eval_GEN Loss": 0.44787561893463135, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3494913578033447, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8350660800933838, "eval_runtime": 55.8792, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 5950 }, { "epoch": 0.5490485526467536, "grad_norm": 3.97667150790683, "learning_rate": 5.628265567203966e-07, "loss": 0.917, "step": 5951 }, { "epoch": 0.5491408142082804, "grad_norm": 1.9835946779925995, "learning_rate": 5.626393464223133e-07, "loss": 0.7354, "step": 5952 }, { "epoch": 0.5492330757698074, "grad_norm": 1.914993458623533, "learning_rate": 5.624521417754505e-07, "loss": 0.6655, "step": 5953 }, { "epoch": 0.5493253373313344, "grad_norm": 2.3714644853168, "learning_rate": 5.622649427967731e-07, "loss": 0.7372, "step": 5954 }, { "epoch": 0.5494175988928612, "grad_norm": 2.9257955003864047, "learning_rate": 5.620777495032454e-07, "loss": 0.6314, "step": 5955 }, { "epoch": 0.5494175988928612, "eval_GEN Loss": 0.4481867551803589, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3522792458534241, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8323917984962463, "eval_runtime": 55.9853, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5955 }, { "epoch": 0.5495098604543882, "grad_norm": 2.1504091296099723, "learning_rate": 5.618905619118312e-07, "loss": 0.767, "step": 5956 }, { "epoch": 0.5496021220159151, "grad_norm": 1.5298848996811598, "learning_rate": 5.617033800394933e-07, "loss": 0.6584, "step": 5957 }, { "epoch": 0.549694383577442, "grad_norm": 1.7270189353856877, "learning_rate": 5.61516203903195e-07, "loss": 0.7849, "step": 5958 }, { "epoch": 0.549786645138969, "grad_norm": 2.247131493587974, "learning_rate": 5.613290335198982e-07, "loss": 0.6498, "step": 5959 }, { "epoch": 0.5498789067004959, "grad_norm": 1.9089982802892862, "learning_rate": 5.611418689065644e-07, "loss": 0.6095, "step": 5960 }, { "epoch": 0.5498789067004959, "eval_GEN Loss": 0.4481411874294281, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35213157534599304, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8327824473381042, "eval_runtime": 56.1699, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5960 }, { "epoch": 0.5499711682620229, "grad_norm": 1.9841491120550447, "learning_rate": 5.609547100801551e-07, "loss": 0.7643, "step": 5961 }, { "epoch": 0.5500634298235497, "grad_norm": 3.313752511013024, "learning_rate": 5.607675570576308e-07, "loss": 0.7517, "step": 5962 }, { "epoch": 0.5501556913850767, "grad_norm": 1.669278162322066, "learning_rate": 5.605804098559517e-07, "loss": 0.6181, "step": 5963 }, { "epoch": 0.5502479529466037, "grad_norm": 1.893737739683359, "learning_rate": 5.603932684920769e-07, "loss": 0.652, "step": 5964 }, { "epoch": 0.5503402145081305, "grad_norm": 1.648867344889991, "learning_rate": 5.60206132982966e-07, "loss": 0.7522, "step": 5965 }, { "epoch": 0.5503402145081305, "eval_GEN Loss": 0.4469587802886963, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34845659136772156, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8331129550933838, "eval_runtime": 55.9964, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5965 }, { "epoch": 0.5504324760696575, "grad_norm": 1.4941922988494802, "learning_rate": 5.600190033455774e-07, "loss": 0.573, "step": 5966 }, { "epoch": 0.5505247376311844, "grad_norm": 2.327149478403429, "learning_rate": 5.59831879596869e-07, "loss": 0.6827, "step": 5967 }, { "epoch": 0.5506169991927113, "grad_norm": 2.47379855992817, "learning_rate": 5.596447617537981e-07, "loss": 0.4307, "step": 5968 }, { "epoch": 0.5507092607542383, "grad_norm": 1.9869216162176155, "learning_rate": 5.594576498333219e-07, "loss": 0.4394, "step": 5969 }, { "epoch": 0.5508015223157652, "grad_norm": 2.490293544377963, "learning_rate": 5.592705438523966e-07, "loss": 0.9697, "step": 5970 }, { "epoch": 0.5508015223157652, "eval_GEN Loss": 0.4461511969566345, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3415340185165405, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8353365659713745, "eval_runtime": 56.1928, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 5970 }, { "epoch": 0.5508937838772922, "grad_norm": 1.8001716082597052, "learning_rate": 5.590834438279779e-07, "loss": 0.6542, "step": 5971 }, { "epoch": 0.550986045438819, "grad_norm": 1.6628754117134685, "learning_rate": 5.588963497770215e-07, "loss": 0.6516, "step": 5972 }, { "epoch": 0.551078307000346, "grad_norm": 1.7496542011974336, "learning_rate": 5.58709261716482e-07, "loss": 0.5979, "step": 5973 }, { "epoch": 0.551170568561873, "grad_norm": 3.055952246945401, "learning_rate": 5.585221796633134e-07, "loss": 0.8571, "step": 5974 }, { "epoch": 0.5512628301233998, "grad_norm": 2.044869200172498, "learning_rate": 5.583351036344694e-07, "loss": 0.7518, "step": 5975 }, { "epoch": 0.5512628301233998, "eval_GEN Loss": 0.4444950819015503, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33646970987319946, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8408052921295166, "eval_runtime": 56.0512, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 5975 }, { "epoch": 0.5513550916849268, "grad_norm": 1.6010524352732722, "learning_rate": 5.581480336469034e-07, "loss": 0.6417, "step": 5976 }, { "epoch": 0.5514473532464537, "grad_norm": 2.7409595338392743, "learning_rate": 5.579609697175677e-07, "loss": 0.7319, "step": 5977 }, { "epoch": 0.5515396148079806, "grad_norm": 2.111517683572759, "learning_rate": 5.577739118634145e-07, "loss": 0.6635, "step": 5978 }, { "epoch": 0.5516318763695075, "grad_norm": 1.3973512083036954, "learning_rate": 5.575868601013952e-07, "loss": 0.6432, "step": 5979 }, { "epoch": 0.5517241379310345, "grad_norm": 2.7586111089443284, "learning_rate": 5.573998144484609e-07, "loss": 0.7924, "step": 5980 }, { "epoch": 0.5517241379310345, "eval_GEN Loss": 0.4438677132129669, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3384241759777069, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8416466116905212, "eval_runtime": 55.8551, "eval_samples_per_second": 1.164, "eval_steps_per_second": 0.09, "step": 5980 }, { "epoch": 0.5518163994925614, "grad_norm": 1.7882990071410962, "learning_rate": 5.572127749215617e-07, "loss": 0.6515, "step": 5981 }, { "epoch": 0.5519086610540883, "grad_norm": 1.451019894858869, "learning_rate": 5.570257415376475e-07, "loss": 0.6688, "step": 5982 }, { "epoch": 0.5520009226156153, "grad_norm": 3.106478733885264, "learning_rate": 5.568387143136677e-07, "loss": 0.9905, "step": 5983 }, { "epoch": 0.5520931841771421, "grad_norm": 1.3427922827012988, "learning_rate": 5.566516932665709e-07, "loss": 0.6454, "step": 5984 }, { "epoch": 0.5521854457386691, "grad_norm": 1.9058539545105901, "learning_rate": 5.564646784133049e-07, "loss": 0.8058, "step": 5985 }, { "epoch": 0.5521854457386691, "eval_GEN Loss": 0.44302743673324585, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34371137619018555, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8403846025466919, "eval_runtime": 55.9248, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 5985 }, { "epoch": 0.5522777073001961, "grad_norm": 1.680154666063775, "learning_rate": 5.56277669770818e-07, "loss": 0.6791, "step": 5986 }, { "epoch": 0.552369968861723, "grad_norm": 2.2196172792106674, "learning_rate": 5.560906673560567e-07, "loss": 0.7418, "step": 5987 }, { "epoch": 0.5524622304232499, "grad_norm": 1.452864479570459, "learning_rate": 5.559036711859678e-07, "loss": 0.668, "step": 5988 }, { "epoch": 0.5525544919847768, "grad_norm": 2.20630029169702, "learning_rate": 5.557166812774965e-07, "loss": 0.7495, "step": 5989 }, { "epoch": 0.5526467535463038, "grad_norm": 1.588108809117061, "learning_rate": 5.55529697647589e-07, "loss": 0.6531, "step": 5990 }, { "epoch": 0.5526467535463038, "eval_GEN Loss": 0.44336459040641785, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3497132360935211, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8376802802085876, "eval_runtime": 55.8728, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 5990 }, { "epoch": 0.5527390151078307, "grad_norm": 1.9071142992819081, "learning_rate": 5.553427203131897e-07, "loss": 0.6705, "step": 5991 }, { "epoch": 0.5528312766693576, "grad_norm": 2.796655967921059, "learning_rate": 5.551557492912424e-07, "loss": 0.7104, "step": 5992 }, { "epoch": 0.5529235382308846, "grad_norm": 2.7681583375322703, "learning_rate": 5.549687845986913e-07, "loss": 0.9129, "step": 5993 }, { "epoch": 0.5530157997924114, "grad_norm": 3.6782294403528657, "learning_rate": 5.547818262524791e-07, "loss": 0.5998, "step": 5994 }, { "epoch": 0.5531080613539384, "grad_norm": 2.401177010102145, "learning_rate": 5.545948742695484e-07, "loss": 0.7559, "step": 5995 }, { "epoch": 0.5531080613539384, "eval_GEN Loss": 0.44440627098083496, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.36248886585235596, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8379206657409668, "eval_runtime": 55.9927, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 5995 }, { "epoch": 0.5532003229154654, "grad_norm": 1.315077852800186, "learning_rate": 5.544079286668408e-07, "loss": 0.6187, "step": 5996 }, { "epoch": 0.5532925844769923, "grad_norm": 1.6366349040992625, "learning_rate": 5.542209894612979e-07, "loss": 0.681, "step": 5997 }, { "epoch": 0.5533848460385192, "grad_norm": 2.108660611248231, "learning_rate": 5.540340566698604e-07, "loss": 0.5855, "step": 5998 }, { "epoch": 0.5534771076000461, "grad_norm": 2.507727759167045, "learning_rate": 5.538471303094685e-07, "loss": 0.7543, "step": 5999 }, { "epoch": 0.5535693691615731, "grad_norm": 2.072884640928673, "learning_rate": 5.536602103970613e-07, "loss": 0.6128, "step": 6000 }, { "epoch": 0.5535693691615731, "eval_GEN Loss": 0.4444344639778137, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3656314015388489, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8364783525466919, "eval_runtime": 56.151, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 6000 }, { "epoch": 0.5535693691615731, "eval_GEN Loss": 0.4444344639778137, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3656314015388489, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8364783525466919, "eval_runtime": 58.4311, "eval_samples_per_second": 1.112, "eval_steps_per_second": 0.086, "step": 6000 }, { "epoch": 0.5536616307231, "grad_norm": 1.6031643643729174, "learning_rate": 5.534732969495783e-07, "loss": 0.6311, "step": 6001 }, { "epoch": 0.5537538922846269, "grad_norm": 1.7794351278911462, "learning_rate": 5.532863899839579e-07, "loss": 0.6065, "step": 6002 }, { "epoch": 0.5538461538461539, "grad_norm": 1.7807496112740777, "learning_rate": 5.530994895171374e-07, "loss": 0.7087, "step": 6003 }, { "epoch": 0.5539384154076807, "grad_norm": 2.622093589336072, "learning_rate": 5.529125955660546e-07, "loss": 0.894, "step": 6004 }, { "epoch": 0.5540306769692077, "grad_norm": 1.5694141483148643, "learning_rate": 5.527257081476459e-07, "loss": 0.532, "step": 6005 }, { "epoch": 0.5540306769692077, "eval_GEN Loss": 0.4440942704677582, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35753506422042847, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8405348658561707, "eval_runtime": 57.2756, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6005 }, { "epoch": 0.5541229385307347, "grad_norm": 1.7742120738231326, "learning_rate": 5.525388272788472e-07, "loss": 0.6483, "step": 6006 }, { "epoch": 0.5542152000922616, "grad_norm": 2.5938472986510996, "learning_rate": 5.523519529765937e-07, "loss": 0.9287, "step": 6007 }, { "epoch": 0.5543074616537885, "grad_norm": 1.998956921764008, "learning_rate": 5.521650852578209e-07, "loss": 0.6681, "step": 6008 }, { "epoch": 0.5543997232153154, "grad_norm": 1.5738473701207076, "learning_rate": 5.519782241394628e-07, "loss": 0.6677, "step": 6009 }, { "epoch": 0.5544919847768424, "grad_norm": 1.7985534269999972, "learning_rate": 5.517913696384527e-07, "loss": 0.6368, "step": 6010 }, { "epoch": 0.5544919847768424, "eval_GEN Loss": 0.44287413358688354, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3565295338630676, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8399038314819336, "eval_runtime": 57.3323, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6010 }, { "epoch": 0.5545842463383692, "grad_norm": 2.342831216551444, "learning_rate": 5.51604521771724e-07, "loss": 0.6594, "step": 6011 }, { "epoch": 0.5546765078998962, "grad_norm": 2.185456544648431, "learning_rate": 5.514176805562092e-07, "loss": 0.6335, "step": 6012 }, { "epoch": 0.5547687694614232, "grad_norm": 3.1587787241035508, "learning_rate": 5.512308460088399e-07, "loss": 0.844, "step": 6013 }, { "epoch": 0.55486103102295, "grad_norm": 4.012089675546207, "learning_rate": 5.510440181465474e-07, "loss": 1.0717, "step": 6014 }, { "epoch": 0.554953292584477, "grad_norm": 1.3730953957238945, "learning_rate": 5.508571969862624e-07, "loss": 0.4715, "step": 6015 }, { "epoch": 0.554953292584477, "eval_GEN Loss": 0.44279107451438904, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3585335314273834, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8472355604171753, "eval_runtime": 57.0108, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6015 }, { "epoch": 0.5550455541460039, "grad_norm": 3.433425605642012, "learning_rate": 5.50670382544915e-07, "loss": 0.6432, "step": 6016 }, { "epoch": 0.5551378157075308, "grad_norm": 3.3046227757593845, "learning_rate": 5.504835748394344e-07, "loss": 0.7054, "step": 6017 }, { "epoch": 0.5552300772690578, "grad_norm": 2.307954100587407, "learning_rate": 5.502967738867498e-07, "loss": 0.7432, "step": 6018 }, { "epoch": 0.5553223388305847, "grad_norm": 3.6848133739914033, "learning_rate": 5.50109979703789e-07, "loss": 0.9906, "step": 6019 }, { "epoch": 0.5554146003921117, "grad_norm": 2.0882914204999117, "learning_rate": 5.499231923074797e-07, "loss": 0.6647, "step": 6020 }, { "epoch": 0.5554146003921117, "eval_GEN Loss": 0.44406092166900635, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3607516288757324, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8451322317123413, "eval_runtime": 57.27, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6020 }, { "epoch": 0.5555068619536385, "grad_norm": 3.3744975261730987, "learning_rate": 5.497364117147487e-07, "loss": 0.7071, "step": 6021 }, { "epoch": 0.5555991235151655, "grad_norm": 2.0210413394949738, "learning_rate": 5.495496379425227e-07, "loss": 0.7879, "step": 6022 }, { "epoch": 0.5556913850766925, "grad_norm": 2.377189263909455, "learning_rate": 5.493628710077275e-07, "loss": 0.7347, "step": 6023 }, { "epoch": 0.5557836466382193, "grad_norm": 2.5940103552788347, "learning_rate": 5.491761109272874e-07, "loss": 0.7611, "step": 6024 }, { "epoch": 0.5558759081997463, "grad_norm": 3.567129081517511, "learning_rate": 5.48989357718128e-07, "loss": 0.8317, "step": 6025 }, { "epoch": 0.5558759081997463, "eval_GEN Loss": 0.44379958510398865, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3647468388080597, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8437199592590332, "eval_runtime": 57.3495, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6025 }, { "epoch": 0.5559681697612732, "grad_norm": 2.0016781028031363, "learning_rate": 5.488026113971725e-07, "loss": 0.6968, "step": 6026 }, { "epoch": 0.5560604313228001, "grad_norm": 2.076297823455995, "learning_rate": 5.486158719813443e-07, "loss": 0.4838, "step": 6027 }, { "epoch": 0.5561526928843271, "grad_norm": 2.1421910987297474, "learning_rate": 5.484291394875659e-07, "loss": 0.8799, "step": 6028 }, { "epoch": 0.556244954445854, "grad_norm": 2.177592901547279, "learning_rate": 5.482424139327596e-07, "loss": 0.6627, "step": 6029 }, { "epoch": 0.556337216007381, "grad_norm": 1.800778826114008, "learning_rate": 5.480556953338465e-07, "loss": 0.67, "step": 6030 }, { "epoch": 0.556337216007381, "eval_GEN Loss": 0.44419172406196594, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3788146674633026, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8489783406257629, "eval_runtime": 57.277, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6030 }, { "epoch": 0.5564294775689078, "grad_norm": 1.4436387830618151, "learning_rate": 5.478689837077474e-07, "loss": 0.6105, "step": 6031 }, { "epoch": 0.5565217391304348, "grad_norm": 2.575774992825141, "learning_rate": 5.476822790713822e-07, "loss": 0.7822, "step": 6032 }, { "epoch": 0.5566140006919618, "grad_norm": 2.4842600998794375, "learning_rate": 5.474955814416707e-07, "loss": 0.6878, "step": 6033 }, { "epoch": 0.5567062622534886, "grad_norm": 2.022336573065477, "learning_rate": 5.473088908355318e-07, "loss": 0.726, "step": 6034 }, { "epoch": 0.5567985238150156, "grad_norm": 1.4545209792278082, "learning_rate": 5.471222072698831e-07, "loss": 0.5624, "step": 6035 }, { "epoch": 0.5567985238150156, "eval_GEN Loss": 0.4425466060638428, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3767794370651245, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8492788672447205, "eval_runtime": 57.1559, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6035 }, { "epoch": 0.5568907853765425, "grad_norm": 1.8979758698518996, "learning_rate": 5.469355307616429e-07, "loss": 0.6648, "step": 6036 }, { "epoch": 0.5569830469380694, "grad_norm": 2.4514133266429767, "learning_rate": 5.467488613277277e-07, "loss": 0.7218, "step": 6037 }, { "epoch": 0.5570753084995964, "grad_norm": 2.308728951701348, "learning_rate": 5.465621989850539e-07, "loss": 0.8342, "step": 6038 }, { "epoch": 0.5571675700611233, "grad_norm": 1.8736288022438226, "learning_rate": 5.463755437505369e-07, "loss": 0.6966, "step": 6039 }, { "epoch": 0.5572598316226502, "grad_norm": 1.7018471891436084, "learning_rate": 5.461888956410921e-07, "loss": 0.5853, "step": 6040 }, { "epoch": 0.5572598316226502, "eval_GEN Loss": 0.4426960051059723, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36654287576675415, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8493990302085876, "eval_runtime": 57.262, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6040 }, { "epoch": 0.5573520931841771, "grad_norm": 1.772931308474006, "learning_rate": 5.460022546736336e-07, "loss": 0.6825, "step": 6041 }, { "epoch": 0.5574443547457041, "grad_norm": 1.8117607319920592, "learning_rate": 5.458156208650749e-07, "loss": 0.671, "step": 6042 }, { "epoch": 0.557536616307231, "grad_norm": 1.8618744625006067, "learning_rate": 5.456289942323294e-07, "loss": 0.689, "step": 6043 }, { "epoch": 0.5576288778687579, "grad_norm": 1.8639644549799157, "learning_rate": 5.454423747923095e-07, "loss": 0.709, "step": 6044 }, { "epoch": 0.5577211394302849, "grad_norm": 1.7995675946875946, "learning_rate": 5.452557625619268e-07, "loss": 0.7222, "step": 6045 }, { "epoch": 0.5577211394302849, "eval_GEN Loss": 0.4431593716144562, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3646218776702881, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8492488265037537, "eval_runtime": 57.2779, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6045 }, { "epoch": 0.5578134009918118, "grad_norm": 2.3814671111722645, "learning_rate": 5.450691575580921e-07, "loss": 0.767, "step": 6046 }, { "epoch": 0.5579056625533387, "grad_norm": 1.9545952931158048, "learning_rate": 5.448825597977165e-07, "loss": 0.581, "step": 6047 }, { "epoch": 0.5579979241148656, "grad_norm": 1.528205036373789, "learning_rate": 5.446959692977094e-07, "loss": 0.6909, "step": 6048 }, { "epoch": 0.5580901856763926, "grad_norm": 1.7796182698855962, "learning_rate": 5.445093860749798e-07, "loss": 0.6534, "step": 6049 }, { "epoch": 0.5581824472379195, "grad_norm": 1.9208921358726816, "learning_rate": 5.443228101464365e-07, "loss": 0.7369, "step": 6050 }, { "epoch": 0.5581824472379195, "eval_GEN Loss": 0.4433639943599701, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36594533920288086, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8494892120361328, "eval_runtime": 57.1445, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6050 }, { "epoch": 0.5582747087994464, "grad_norm": 1.4856925726487455, "learning_rate": 5.44136241528987e-07, "loss": 0.732, "step": 6051 }, { "epoch": 0.5583669703609734, "grad_norm": 2.1356016941552762, "learning_rate": 5.439496802395387e-07, "loss": 0.8022, "step": 6052 }, { "epoch": 0.5584592319225002, "grad_norm": 1.4721841261553976, "learning_rate": 5.437631262949978e-07, "loss": 0.4921, "step": 6053 }, { "epoch": 0.5585514934840272, "grad_norm": 2.6197610068079724, "learning_rate": 5.435765797122704e-07, "loss": 0.8696, "step": 6054 }, { "epoch": 0.5586437550455542, "grad_norm": 1.523218798736045, "learning_rate": 5.433900405082615e-07, "loss": 0.6908, "step": 6055 }, { "epoch": 0.5586437550455542, "eval_GEN Loss": 0.44373270869255066, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36885830760002136, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8506009578704834, "eval_runtime": 57.1478, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6055 }, { "epoch": 0.558736016607081, "grad_norm": 2.0107099387400593, "learning_rate": 5.432035086998757e-07, "loss": 0.6211, "step": 6056 }, { "epoch": 0.558828278168608, "grad_norm": 1.3488593888435445, "learning_rate": 5.430169843040162e-07, "loss": 0.5673, "step": 6057 }, { "epoch": 0.5589205397301349, "grad_norm": 1.740803340646608, "learning_rate": 5.428304673375871e-07, "loss": 0.7719, "step": 6058 }, { "epoch": 0.5590128012916619, "grad_norm": 1.9342027997783982, "learning_rate": 5.426439578174902e-07, "loss": 0.7273, "step": 6059 }, { "epoch": 0.5591050628531888, "grad_norm": 2.016506417314573, "learning_rate": 5.424574557606274e-07, "loss": 0.7594, "step": 6060 }, { "epoch": 0.5591050628531888, "eval_GEN Loss": 0.443193644285202, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36932602524757385, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8531550765037537, "eval_runtime": 57.2643, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6060 }, { "epoch": 0.5591973244147157, "grad_norm": 1.5795993285502758, "learning_rate": 5.422709611839e-07, "loss": 0.6427, "step": 6061 }, { "epoch": 0.5592895859762427, "grad_norm": 1.8021418480154971, "learning_rate": 5.420844741042084e-07, "loss": 0.7967, "step": 6062 }, { "epoch": 0.5593818475377695, "grad_norm": 1.8256085912570994, "learning_rate": 5.418979945384523e-07, "loss": 0.5413, "step": 6063 }, { "epoch": 0.5594741090992965, "grad_norm": 3.327913082376932, "learning_rate": 5.417115225035305e-07, "loss": 0.6846, "step": 6064 }, { "epoch": 0.5595663706608235, "grad_norm": 1.8121306906762618, "learning_rate": 5.415250580163419e-07, "loss": 0.698, "step": 6065 }, { "epoch": 0.5595663706608235, "eval_GEN Loss": 0.4430874288082123, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3676074147224426, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8564002513885498, "eval_runtime": 57.1529, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6065 }, { "epoch": 0.5596586322223503, "grad_norm": 2.019778544318833, "learning_rate": 5.413386010937838e-07, "loss": 0.7622, "step": 6066 }, { "epoch": 0.5597508937838773, "grad_norm": 1.6272247983882702, "learning_rate": 5.411521517527531e-07, "loss": 0.5698, "step": 6067 }, { "epoch": 0.5598431553454042, "grad_norm": 1.7953437572872537, "learning_rate": 5.409657100101467e-07, "loss": 0.8083, "step": 6068 }, { "epoch": 0.5599354169069312, "grad_norm": 1.6472951964477116, "learning_rate": 5.407792758828599e-07, "loss": 0.679, "step": 6069 }, { "epoch": 0.560027678468458, "grad_norm": 1.79596830847061, "learning_rate": 5.405928493877877e-07, "loss": 0.7914, "step": 6070 }, { "epoch": 0.560027678468458, "eval_GEN Loss": 0.4428771436214447, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3641536235809326, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8594050407409668, "eval_runtime": 57.098, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6070 }, { "epoch": 0.560119940029985, "grad_norm": 2.143868710633408, "learning_rate": 5.404064305418241e-07, "loss": 0.6879, "step": 6071 }, { "epoch": 0.560212201591512, "grad_norm": 2.121643059409146, "learning_rate": 5.402200193618632e-07, "loss": 0.667, "step": 6072 }, { "epoch": 0.5603044631530388, "grad_norm": 1.5000740986061276, "learning_rate": 5.400336158647975e-07, "loss": 0.6444, "step": 6073 }, { "epoch": 0.5603967247145658, "grad_norm": 1.8945459770277933, "learning_rate": 5.398472200675192e-07, "loss": 0.4759, "step": 6074 }, { "epoch": 0.5604889862760927, "grad_norm": 2.2070144190507737, "learning_rate": 5.396608319869199e-07, "loss": 0.8163, "step": 6075 }, { "epoch": 0.5604889862760927, "eval_GEN Loss": 0.44367656111717224, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3670448362827301, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8658654093742371, "eval_runtime": 57.049, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6075 }, { "epoch": 0.5605812478376196, "grad_norm": 1.5680832846055872, "learning_rate": 5.394744516398905e-07, "loss": 0.6054, "step": 6076 }, { "epoch": 0.5606735093991466, "grad_norm": 2.105096434324365, "learning_rate": 5.392880790433208e-07, "loss": 0.6445, "step": 6077 }, { "epoch": 0.5607657709606735, "grad_norm": 1.769483895228845, "learning_rate": 5.391017142141e-07, "loss": 0.5708, "step": 6078 }, { "epoch": 0.5608580325222005, "grad_norm": 1.5344183274595646, "learning_rate": 5.389153571691175e-07, "loss": 0.7567, "step": 6079 }, { "epoch": 0.5609502940837273, "grad_norm": 2.1193382014783926, "learning_rate": 5.387290079252607e-07, "loss": 0.8801, "step": 6080 }, { "epoch": 0.5609502940837273, "eval_GEN Loss": 0.4437219798564911, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3750041723251343, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8693810105323792, "eval_runtime": 57.1838, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6080 }, { "epoch": 0.5610425556452543, "grad_norm": 1.3675272563452354, "learning_rate": 5.385426664994166e-07, "loss": 0.5827, "step": 6081 }, { "epoch": 0.5611348172067813, "grad_norm": 2.2153464814397807, "learning_rate": 5.383563329084726e-07, "loss": 0.6841, "step": 6082 }, { "epoch": 0.5612270787683081, "grad_norm": 1.7230999463602303, "learning_rate": 5.381700071693141e-07, "loss": 0.8029, "step": 6083 }, { "epoch": 0.5613193403298351, "grad_norm": 2.1280006519183865, "learning_rate": 5.379836892988261e-07, "loss": 0.6286, "step": 6084 }, { "epoch": 0.561411601891362, "grad_norm": 2.3219225665896865, "learning_rate": 5.377973793138931e-07, "loss": 0.6799, "step": 6085 }, { "epoch": 0.561411601891362, "eval_GEN Loss": 0.4442606270313263, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3753512501716614, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8725661039352417, "eval_runtime": 57.169, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6085 }, { "epoch": 0.5615038634528889, "grad_norm": 1.6790429628068604, "learning_rate": 5.376110772313989e-07, "loss": 0.7098, "step": 6086 }, { "epoch": 0.5615961250144159, "grad_norm": 2.7998290775258385, "learning_rate": 5.374247830682263e-07, "loss": 0.6895, "step": 6087 }, { "epoch": 0.5616883865759428, "grad_norm": 1.8539098969593657, "learning_rate": 5.37238496841258e-07, "loss": 0.655, "step": 6088 }, { "epoch": 0.5617806481374698, "grad_norm": 2.0799089159923434, "learning_rate": 5.370522185673751e-07, "loss": 0.8315, "step": 6089 }, { "epoch": 0.5618729096989966, "grad_norm": 1.9842334081499282, "learning_rate": 5.368659482634585e-07, "loss": 0.621, "step": 6090 }, { "epoch": 0.5618729096989966, "eval_GEN Loss": 0.444583922624588, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3695072531700134, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8797175288200378, "eval_runtime": 57.2989, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6090 }, { "epoch": 0.5619651712605236, "grad_norm": 1.9030064406865195, "learning_rate": 5.366796859463885e-07, "loss": 0.6164, "step": 6091 }, { "epoch": 0.5620574328220506, "grad_norm": 1.9843014117132551, "learning_rate": 5.364934316330442e-07, "loss": 0.457, "step": 6092 }, { "epoch": 0.5621496943835774, "grad_norm": 2.0945648938771506, "learning_rate": 5.363071853403046e-07, "loss": 0.7004, "step": 6093 }, { "epoch": 0.5622419559451044, "grad_norm": 1.6778355431143932, "learning_rate": 5.361209470850475e-07, "loss": 0.6138, "step": 6094 }, { "epoch": 0.5623342175066313, "grad_norm": 1.719113068149742, "learning_rate": 5.359347168841501e-07, "loss": 0.5611, "step": 6095 }, { "epoch": 0.5623342175066313, "eval_GEN Loss": 0.4460788667201996, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37019413709640503, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8838341236114502, "eval_runtime": 57.3961, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 6095 }, { "epoch": 0.5624264790681582, "grad_norm": 2.010235266397851, "learning_rate": 5.357484947544885e-07, "loss": 0.7774, "step": 6096 }, { "epoch": 0.5625187406296852, "grad_norm": 2.3367462298487047, "learning_rate": 5.355622807129391e-07, "loss": 0.686, "step": 6097 }, { "epoch": 0.5626110021912121, "grad_norm": 1.7208946770839701, "learning_rate": 5.353760747763767e-07, "loss": 0.6382, "step": 6098 }, { "epoch": 0.562703263752739, "grad_norm": 2.3559952935085287, "learning_rate": 5.351898769616752e-07, "loss": 0.7186, "step": 6099 }, { "epoch": 0.5627955253142659, "grad_norm": 3.2541779886524056, "learning_rate": 5.350036872857087e-07, "loss": 0.7246, "step": 6100 }, { "epoch": 0.5627955253142659, "eval_GEN Loss": 0.44610080122947693, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37200111150741577, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8849759697914124, "eval_runtime": 57.1181, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6100 }, { "epoch": 0.5628877868757929, "grad_norm": 2.7611738836556556, "learning_rate": 5.348175057653496e-07, "loss": 0.7632, "step": 6101 }, { "epoch": 0.5629800484373197, "grad_norm": 2.3327918265878154, "learning_rate": 5.3463133241747e-07, "loss": 0.9377, "step": 6102 }, { "epoch": 0.5630723099988467, "grad_norm": 1.6218853969021552, "learning_rate": 5.344451672589411e-07, "loss": 0.6568, "step": 6103 }, { "epoch": 0.5631645715603737, "grad_norm": 1.6381885545774464, "learning_rate": 5.34259010306634e-07, "loss": 0.6199, "step": 6104 }, { "epoch": 0.5632568331219006, "grad_norm": 1.441411674822083, "learning_rate": 5.340728615774181e-07, "loss": 0.5568, "step": 6105 }, { "epoch": 0.5632568331219006, "eval_GEN Loss": 0.44724056124687195, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.379880428314209, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8784855604171753, "eval_runtime": 57.3192, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6105 }, { "epoch": 0.5633490946834275, "grad_norm": 2.0017445525203414, "learning_rate": 5.338867210881625e-07, "loss": 0.7631, "step": 6106 }, { "epoch": 0.5634413562449544, "grad_norm": 1.4236004896162777, "learning_rate": 5.337005888557358e-07, "loss": 0.4985, "step": 6107 }, { "epoch": 0.5635336178064814, "grad_norm": 2.6583366691749397, "learning_rate": 5.335144648970056e-07, "loss": 0.6841, "step": 6108 }, { "epoch": 0.5636258793680083, "grad_norm": 1.6091246467932905, "learning_rate": 5.333283492288384e-07, "loss": 0.6184, "step": 6109 }, { "epoch": 0.5637181409295352, "grad_norm": 3.441287531537653, "learning_rate": 5.331422418681004e-07, "loss": 0.9627, "step": 6110 }, { "epoch": 0.5637181409295352, "eval_GEN Loss": 0.4469130039215088, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3916610777378082, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8715444803237915, "eval_runtime": 57.3707, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6110 }, { "epoch": 0.5638104024910622, "grad_norm": 2.459008289743503, "learning_rate": 5.329561428316572e-07, "loss": 0.632, "step": 6111 }, { "epoch": 0.563902664052589, "grad_norm": 2.1061594742903873, "learning_rate": 5.327700521363733e-07, "loss": 0.7561, "step": 6112 }, { "epoch": 0.563994925614116, "grad_norm": 2.323000753314308, "learning_rate": 5.32583969799112e-07, "loss": 0.6079, "step": 6113 }, { "epoch": 0.564087187175643, "grad_norm": 1.7510638490111514, "learning_rate": 5.323978958367371e-07, "loss": 0.6465, "step": 6114 }, { "epoch": 0.5641794487371699, "grad_norm": 2.630766726429942, "learning_rate": 5.322118302661107e-07, "loss": 0.7809, "step": 6115 }, { "epoch": 0.5641794487371699, "eval_GEN Loss": 0.4479348063468933, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3996533453464508, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8708533644676208, "eval_runtime": 57.1276, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6115 }, { "epoch": 0.5642717102986968, "grad_norm": 2.218273520796578, "learning_rate": 5.320257731040944e-07, "loss": 0.7383, "step": 6116 }, { "epoch": 0.5643639718602237, "grad_norm": 1.3378541321119644, "learning_rate": 5.318397243675485e-07, "loss": 0.5772, "step": 6117 }, { "epoch": 0.5644562334217507, "grad_norm": 2.880939922004264, "learning_rate": 5.316536840733337e-07, "loss": 0.6269, "step": 6118 }, { "epoch": 0.5645484949832776, "grad_norm": 2.590496781680865, "learning_rate": 5.314676522383089e-07, "loss": 0.7544, "step": 6119 }, { "epoch": 0.5646407565448045, "grad_norm": 2.3011021239273535, "learning_rate": 5.312816288793328e-07, "loss": 0.4983, "step": 6120 }, { "epoch": 0.5646407565448045, "eval_GEN Loss": 0.44666653871536255, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3953973650932312, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.862500011920929, "eval_runtime": 57.343, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6120 }, { "epoch": 0.5647330181063315, "grad_norm": 1.7077281105576765, "learning_rate": 5.310956140132628e-07, "loss": 0.8193, "step": 6121 }, { "epoch": 0.5648252796678583, "grad_norm": 1.1071698784500625, "learning_rate": 5.309096076569563e-07, "loss": 0.4717, "step": 6122 }, { "epoch": 0.5649175412293853, "grad_norm": 1.8427813728335336, "learning_rate": 5.307236098272691e-07, "loss": 0.5271, "step": 6123 }, { "epoch": 0.5650098027909123, "grad_norm": 1.7010863907637501, "learning_rate": 5.305376205410566e-07, "loss": 0.7703, "step": 6124 }, { "epoch": 0.5651020643524391, "grad_norm": 2.604091552223231, "learning_rate": 5.303516398151739e-07, "loss": 0.8943, "step": 6125 }, { "epoch": 0.5651020643524391, "eval_GEN Loss": 0.44603076577186584, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3899054229259491, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8585336804389954, "eval_runtime": 57.2796, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6125 }, { "epoch": 0.5651943259139661, "grad_norm": 2.108792939332955, "learning_rate": 5.301656676664745e-07, "loss": 0.6478, "step": 6126 }, { "epoch": 0.565286587475493, "grad_norm": 2.1895863857701023, "learning_rate": 5.299797041118117e-07, "loss": 0.6537, "step": 6127 }, { "epoch": 0.56537884903702, "grad_norm": 3.6670059991590094, "learning_rate": 5.297937491680373e-07, "loss": 0.8632, "step": 6128 }, { "epoch": 0.5654711105985469, "grad_norm": 1.8152428165771783, "learning_rate": 5.296078028520035e-07, "loss": 0.8185, "step": 6129 }, { "epoch": 0.5655633721600738, "grad_norm": 2.0333631113850563, "learning_rate": 5.294218651805607e-07, "loss": 0.7835, "step": 6130 }, { "epoch": 0.5655633721600738, "eval_GEN Loss": 0.4469115734100342, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.39168596267700195, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8574519157409668, "eval_runtime": 57.3214, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6130 }, { "epoch": 0.5656556337216008, "grad_norm": 1.6749706763771293, "learning_rate": 5.292359361705587e-07, "loss": 0.6476, "step": 6131 }, { "epoch": 0.5657478952831276, "grad_norm": 1.9170090127683967, "learning_rate": 5.290500158388471e-07, "loss": 0.6313, "step": 6132 }, { "epoch": 0.5658401568446546, "grad_norm": 1.8817047578922965, "learning_rate": 5.288641042022742e-07, "loss": 0.6559, "step": 6133 }, { "epoch": 0.5659324184061815, "grad_norm": 2.211860990077569, "learning_rate": 5.286782012776875e-07, "loss": 0.8811, "step": 6134 }, { "epoch": 0.5660246799677084, "grad_norm": 1.2941898868997248, "learning_rate": 5.284923070819336e-07, "loss": 0.5671, "step": 6135 }, { "epoch": 0.5660246799677084, "eval_GEN Loss": 0.44703465700149536, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38215172290802, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8521033525466919, "eval_runtime": 57.3326, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6135 }, { "epoch": 0.5661169415292354, "grad_norm": 1.9589152314255067, "learning_rate": 5.283064216318589e-07, "loss": 0.4806, "step": 6136 }, { "epoch": 0.5662092030907623, "grad_norm": 1.2643098215233752, "learning_rate": 5.281205449443086e-07, "loss": 0.6277, "step": 6137 }, { "epoch": 0.5663014646522893, "grad_norm": 1.760342146508232, "learning_rate": 5.279346770361266e-07, "loss": 0.642, "step": 6138 }, { "epoch": 0.5663937262138161, "grad_norm": 3.0947950214333417, "learning_rate": 5.277488179241572e-07, "loss": 0.8301, "step": 6139 }, { "epoch": 0.5664859877753431, "grad_norm": 2.066608678522965, "learning_rate": 5.27562967625243e-07, "loss": 0.6947, "step": 6140 }, { "epoch": 0.5664859877753431, "eval_GEN Loss": 0.44731318950653076, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37222999334335327, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8486778736114502, "eval_runtime": 57.0409, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6140 }, { "epoch": 0.5665782493368701, "grad_norm": 2.4489269123059834, "learning_rate": 5.273771261562261e-07, "loss": 0.8638, "step": 6141 }, { "epoch": 0.5666705108983969, "grad_norm": 2.9549763540586715, "learning_rate": 5.271912935339474e-07, "loss": 0.7956, "step": 6142 }, { "epoch": 0.5667627724599239, "grad_norm": 1.5248128591012942, "learning_rate": 5.270054697752479e-07, "loss": 0.702, "step": 6143 }, { "epoch": 0.5668550340214508, "grad_norm": 1.7168258836736479, "learning_rate": 5.268196548969669e-07, "loss": 0.5038, "step": 6144 }, { "epoch": 0.5669472955829777, "grad_norm": 2.2207995833581466, "learning_rate": 5.266338489159435e-07, "loss": 0.7683, "step": 6145 }, { "epoch": 0.5669472955829777, "eval_GEN Loss": 0.4477813243865967, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3679277002811432, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8457632064819336, "eval_runtime": 57.2641, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6145 }, { "epoch": 0.5670395571445047, "grad_norm": 1.878630356189863, "learning_rate": 5.264480518490153e-07, "loss": 0.7269, "step": 6146 }, { "epoch": 0.5671318187060316, "grad_norm": 1.8546867107575418, "learning_rate": 5.262622637130199e-07, "loss": 0.586, "step": 6147 }, { "epoch": 0.5672240802675586, "grad_norm": 1.343978533503116, "learning_rate": 5.260764845247935e-07, "loss": 0.5522, "step": 6148 }, { "epoch": 0.5673163418290854, "grad_norm": 1.8022136333296677, "learning_rate": 5.258907143011716e-07, "loss": 0.7058, "step": 6149 }, { "epoch": 0.5674086033906124, "grad_norm": 1.663079410235386, "learning_rate": 5.257049530589894e-07, "loss": 0.5944, "step": 6150 }, { "epoch": 0.5674086033906124, "eval_GEN Loss": 0.4481658339500427, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3613624572753906, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8456730842590332, "eval_runtime": 57.1466, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6150 }, { "epoch": 0.5675008649521394, "grad_norm": 2.140899834414291, "learning_rate": 5.255192008150806e-07, "loss": 0.8861, "step": 6151 }, { "epoch": 0.5675931265136662, "grad_norm": 1.4867796552324366, "learning_rate": 5.253334575862785e-07, "loss": 0.583, "step": 6152 }, { "epoch": 0.5676853880751932, "grad_norm": 1.5525545827256437, "learning_rate": 5.251477233894151e-07, "loss": 0.6224, "step": 6153 }, { "epoch": 0.5677776496367201, "grad_norm": 1.4309867238998513, "learning_rate": 5.249619982413224e-07, "loss": 0.6531, "step": 6154 }, { "epoch": 0.567869911198247, "grad_norm": 1.3863241087609588, "learning_rate": 5.247762821588308e-07, "loss": 0.6433, "step": 6155 }, { "epoch": 0.567869911198247, "eval_GEN Loss": 0.44783708453178406, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35481974482536316, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.848437488079071, "eval_runtime": 57.234, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6155 }, { "epoch": 0.567962172759774, "grad_norm": 1.691708086866545, "learning_rate": 5.245905751587703e-07, "loss": 0.6018, "step": 6156 }, { "epoch": 0.5680544343213009, "grad_norm": 1.5148224594904718, "learning_rate": 5.244048772579699e-07, "loss": 0.6479, "step": 6157 }, { "epoch": 0.5681466958828278, "grad_norm": 2.469190864495284, "learning_rate": 5.24219188473258e-07, "loss": 0.7766, "step": 6158 }, { "epoch": 0.5682389574443547, "grad_norm": 2.146868630818894, "learning_rate": 5.240335088214616e-07, "loss": 0.7795, "step": 6159 }, { "epoch": 0.5683312190058817, "grad_norm": 2.5537190064162325, "learning_rate": 5.238478383194077e-07, "loss": 0.9488, "step": 6160 }, { "epoch": 0.5683312190058817, "eval_GEN Loss": 0.447154700756073, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35590067505836487, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8420072197914124, "eval_runtime": 57.1427, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6160 }, { "epoch": 0.5684234805674087, "grad_norm": 1.7955989689765957, "learning_rate": 5.236621769839219e-07, "loss": 0.6064, "step": 6161 }, { "epoch": 0.5685157421289355, "grad_norm": 1.1898363461554136, "learning_rate": 5.234765248318293e-07, "loss": 0.4338, "step": 6162 }, { "epoch": 0.5686080036904625, "grad_norm": 1.32247575820924, "learning_rate": 5.232908818799533e-07, "loss": 0.6128, "step": 6163 }, { "epoch": 0.5687002652519894, "grad_norm": 1.800022647161181, "learning_rate": 5.231052481451182e-07, "loss": 0.5995, "step": 6164 }, { "epoch": 0.5687925268135163, "grad_norm": 1.7753933142265066, "learning_rate": 5.229196236441457e-07, "loss": 0.7372, "step": 6165 }, { "epoch": 0.5687925268135163, "eval_GEN Loss": 0.44691330194473267, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36090758442878723, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8399639129638672, "eval_runtime": 57.3339, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6165 }, { "epoch": 0.5688847883750432, "grad_norm": 2.8345615330355587, "learning_rate": 5.227340083938577e-07, "loss": 0.6546, "step": 6166 }, { "epoch": 0.5689770499365702, "grad_norm": 1.835231795802832, "learning_rate": 5.225484024110745e-07, "loss": 0.6786, "step": 6167 }, { "epoch": 0.5690693114980971, "grad_norm": 1.7944115037862123, "learning_rate": 5.223628057126167e-07, "loss": 0.8347, "step": 6168 }, { "epoch": 0.569161573059624, "grad_norm": 1.439465111716869, "learning_rate": 5.221772183153029e-07, "loss": 0.4987, "step": 6169 }, { "epoch": 0.569253834621151, "grad_norm": 3.5505841859413216, "learning_rate": 5.219916402359514e-07, "loss": 0.9236, "step": 6170 }, { "epoch": 0.569253834621151, "eval_GEN Loss": 0.4468501806259155, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3712359368801117, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8360576629638672, "eval_runtime": 57.1796, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6170 }, { "epoch": 0.5693460961826778, "grad_norm": 1.6667541546954812, "learning_rate": 5.218060714913796e-07, "loss": 0.6261, "step": 6171 }, { "epoch": 0.5694383577442048, "grad_norm": 1.503982680211012, "learning_rate": 5.216205120984041e-07, "loss": 0.56, "step": 6172 }, { "epoch": 0.5695306193057318, "grad_norm": 1.256389490809627, "learning_rate": 5.214349620738405e-07, "loss": 0.6269, "step": 6173 }, { "epoch": 0.5696228808672587, "grad_norm": 2.127738128604865, "learning_rate": 5.212494214345034e-07, "loss": 0.5951, "step": 6174 }, { "epoch": 0.5697151424287856, "grad_norm": 2.0984686488423896, "learning_rate": 5.210638901972072e-07, "loss": 0.676, "step": 6175 }, { "epoch": 0.5697151424287856, "eval_GEN Loss": 0.44801753759384155, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37713494896888733, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8355168104171753, "eval_runtime": 57.376, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6175 }, { "epoch": 0.5698074039903125, "grad_norm": 1.5623644429667924, "learning_rate": 5.20878368378765e-07, "loss": 0.6359, "step": 6176 }, { "epoch": 0.5698996655518395, "grad_norm": 2.245924673569924, "learning_rate": 5.20692855995989e-07, "loss": 0.687, "step": 6177 }, { "epoch": 0.5699919271133664, "grad_norm": 1.7802022978044774, "learning_rate": 5.205073530656901e-07, "loss": 0.6259, "step": 6178 }, { "epoch": 0.5700841886748933, "grad_norm": 1.5567258899209426, "learning_rate": 5.203218596046798e-07, "loss": 0.5204, "step": 6179 }, { "epoch": 0.5701764502364203, "grad_norm": 1.464125682044938, "learning_rate": 5.201363756297672e-07, "loss": 0.6038, "step": 6180 }, { "epoch": 0.5701764502364203, "eval_GEN Loss": 0.4488571882247925, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3740454316139221, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8370793461799622, "eval_runtime": 57.128, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6180 }, { "epoch": 0.5702687117979471, "grad_norm": 1.708001043406093, "learning_rate": 5.199509011577612e-07, "loss": 0.609, "step": 6181 }, { "epoch": 0.5703609733594741, "grad_norm": 1.7101422764066867, "learning_rate": 5.1976543620547e-07, "loss": 0.6545, "step": 6182 }, { "epoch": 0.5704532349210011, "grad_norm": 2.321386510253528, "learning_rate": 5.195799807897008e-07, "loss": 0.8314, "step": 6183 }, { "epoch": 0.570545496482528, "grad_norm": 3.018362557622081, "learning_rate": 5.193945349272595e-07, "loss": 0.6273, "step": 6184 }, { "epoch": 0.5706377580440549, "grad_norm": 3.1128825449050868, "learning_rate": 5.192090986349514e-07, "loss": 0.8193, "step": 6185 }, { "epoch": 0.5706377580440549, "eval_GEN Loss": 0.44802117347717285, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3708059787750244, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8387620449066162, "eval_runtime": 57.3052, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6185 }, { "epoch": 0.5707300196055818, "grad_norm": 1.4411742222053687, "learning_rate": 5.190236719295816e-07, "loss": 0.6475, "step": 6186 }, { "epoch": 0.5708222811671088, "grad_norm": 1.5943905804330318, "learning_rate": 5.188382548279535e-07, "loss": 0.7621, "step": 6187 }, { "epoch": 0.5709145427286357, "grad_norm": 1.8112512199900366, "learning_rate": 5.186528473468695e-07, "loss": 0.5684, "step": 6188 }, { "epoch": 0.5710068042901626, "grad_norm": 2.4060558346075083, "learning_rate": 5.184674495031322e-07, "loss": 1.0475, "step": 6189 }, { "epoch": 0.5710990658516896, "grad_norm": 2.276919267330909, "learning_rate": 5.182820613135423e-07, "loss": 0.8138, "step": 6190 }, { "epoch": 0.5710990658516896, "eval_GEN Loss": 0.4486725330352783, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3674919605255127, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8448317050933838, "eval_runtime": 57.2818, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6190 }, { "epoch": 0.5711913274132164, "grad_norm": 1.7339592696728643, "learning_rate": 5.180966827949e-07, "loss": 0.6029, "step": 6191 }, { "epoch": 0.5712835889747434, "grad_norm": 2.4385550845249937, "learning_rate": 5.179113139640044e-07, "loss": 0.7959, "step": 6192 }, { "epoch": 0.5713758505362704, "grad_norm": 2.410520420443738, "learning_rate": 5.177259548376542e-07, "loss": 0.7489, "step": 6193 }, { "epoch": 0.5714681120977972, "grad_norm": 1.6958709432536094, "learning_rate": 5.175406054326469e-07, "loss": 0.6345, "step": 6194 }, { "epoch": 0.5715603736593242, "grad_norm": 3.026204818624776, "learning_rate": 5.173552657657788e-07, "loss": 0.927, "step": 6195 }, { "epoch": 0.5715603736593242, "eval_GEN Loss": 0.4475541114807129, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3630867302417755, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8487379550933838, "eval_runtime": 57.3407, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6195 }, { "epoch": 0.5716526352208511, "grad_norm": 1.542340256435394, "learning_rate": 5.171699358538462e-07, "loss": 0.7088, "step": 6196 }, { "epoch": 0.571744896782378, "grad_norm": 1.7996649592882747, "learning_rate": 5.169846157136437e-07, "loss": 0.7954, "step": 6197 }, { "epoch": 0.5718371583439049, "grad_norm": 1.5767991352721336, "learning_rate": 5.167993053619653e-07, "loss": 0.5993, "step": 6198 }, { "epoch": 0.5719294199054319, "grad_norm": 1.6209888845824885, "learning_rate": 5.16614004815604e-07, "loss": 0.467, "step": 6199 }, { "epoch": 0.5720216814669589, "grad_norm": 1.6499212407902066, "learning_rate": 5.164287140913524e-07, "loss": 0.6617, "step": 6200 }, { "epoch": 0.5720216814669589, "eval_GEN Loss": 0.4485163986682892, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3642854392528534, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8577523827552795, "eval_runtime": 57.3193, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6200 }, { "epoch": 0.5721139430284857, "grad_norm": 1.2500008034993393, "learning_rate": 5.162434332060016e-07, "loss": 0.4662, "step": 6201 }, { "epoch": 0.5722062045900127, "grad_norm": 1.7051528183804858, "learning_rate": 5.160581621763421e-07, "loss": 0.5484, "step": 6202 }, { "epoch": 0.5722984661515396, "grad_norm": 2.3125585276972154, "learning_rate": 5.158729010191632e-07, "loss": 0.7992, "step": 6203 }, { "epoch": 0.5723907277130665, "grad_norm": 2.206468118767554, "learning_rate": 5.15687649751254e-07, "loss": 0.7239, "step": 6204 }, { "epoch": 0.5724829892745935, "grad_norm": 2.380458913050461, "learning_rate": 5.155024083894021e-07, "loss": 0.7647, "step": 6205 }, { "epoch": 0.5724829892745935, "eval_GEN Loss": 0.44868528842926025, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3702375888824463, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.857692301273346, "eval_runtime": 57.2183, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6205 }, { "epoch": 0.5725752508361204, "grad_norm": 1.6461874110616814, "learning_rate": 5.153171769503941e-07, "loss": 0.6555, "step": 6206 }, { "epoch": 0.5726675123976473, "grad_norm": 1.8160444101621238, "learning_rate": 5.151319554510163e-07, "loss": 0.5797, "step": 6207 }, { "epoch": 0.5727597739591742, "grad_norm": 2.227270060004341, "learning_rate": 5.149467439080537e-07, "loss": 0.6876, "step": 6208 }, { "epoch": 0.5728520355207012, "grad_norm": 1.7848689332243686, "learning_rate": 5.147615423382902e-07, "loss": 0.8492, "step": 6209 }, { "epoch": 0.5729442970822282, "grad_norm": 2.8142925458608063, "learning_rate": 5.145763507585092e-07, "loss": 0.6772, "step": 6210 }, { "epoch": 0.5729442970822282, "eval_GEN Loss": 0.448138564825058, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3724932372570038, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8555588722229004, "eval_runtime": 57.1755, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6210 }, { "epoch": 0.573036558643755, "grad_norm": 1.7836752663844049, "learning_rate": 5.143911691854933e-07, "loss": 0.6051, "step": 6211 }, { "epoch": 0.573128820205282, "grad_norm": 2.2766217358855623, "learning_rate": 5.142059976360237e-07, "loss": 0.8162, "step": 6212 }, { "epoch": 0.5732210817668089, "grad_norm": 2.370832110954563, "learning_rate": 5.140208361268808e-07, "loss": 0.722, "step": 6213 }, { "epoch": 0.5733133433283358, "grad_norm": 1.396679711852194, "learning_rate": 5.138356846748446e-07, "loss": 0.4564, "step": 6214 }, { "epoch": 0.5734056048898628, "grad_norm": 1.5360126941360914, "learning_rate": 5.136505432966937e-07, "loss": 0.7661, "step": 6215 }, { "epoch": 0.5734056048898628, "eval_GEN Loss": 0.44859305024147034, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3767581880092621, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8487379550933838, "eval_runtime": 57.2025, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6215 }, { "epoch": 0.5734978664513897, "grad_norm": 1.2484035579758996, "learning_rate": 5.134654120092058e-07, "loss": 0.5262, "step": 6216 }, { "epoch": 0.5735901280129166, "grad_norm": 1.483914027177951, "learning_rate": 5.132802908291577e-07, "loss": 0.5843, "step": 6217 }, { "epoch": 0.5736823895744435, "grad_norm": 2.0681244336544786, "learning_rate": 5.130951797733256e-07, "loss": 0.7169, "step": 6218 }, { "epoch": 0.5737746511359705, "grad_norm": 3.559879071738796, "learning_rate": 5.129100788584845e-07, "loss": 0.874, "step": 6219 }, { "epoch": 0.5738669126974975, "grad_norm": 1.759559768189963, "learning_rate": 5.127249881014083e-07, "loss": 0.6823, "step": 6220 }, { "epoch": 0.5738669126974975, "eval_GEN Loss": 0.4485185742378235, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3839877247810364, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8512620329856873, "eval_runtime": 57.371, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6220 }, { "epoch": 0.5739591742590243, "grad_norm": 1.6711208700745743, "learning_rate": 5.125399075188705e-07, "loss": 0.6009, "step": 6221 }, { "epoch": 0.5740514358205513, "grad_norm": 2.5476573705496715, "learning_rate": 5.123548371276433e-07, "loss": 0.8214, "step": 6222 }, { "epoch": 0.5741436973820782, "grad_norm": 2.3306827635155507, "learning_rate": 5.121697769444982e-07, "loss": 0.6874, "step": 6223 }, { "epoch": 0.5742359589436051, "grad_norm": 3.2129076017573257, "learning_rate": 5.119847269862051e-07, "loss": 0.8815, "step": 6224 }, { "epoch": 0.5743282205051321, "grad_norm": 2.30950632822209, "learning_rate": 5.117996872695343e-07, "loss": 0.6243, "step": 6225 }, { "epoch": 0.5743282205051321, "eval_GEN Loss": 0.44919687509536743, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.39208537340164185, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.85546875, "eval_runtime": 57.3235, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6225 }, { "epoch": 0.574420482066659, "grad_norm": 2.753139448215076, "learning_rate": 5.11614657811254e-07, "loss": 0.8853, "step": 6226 }, { "epoch": 0.5745127436281859, "grad_norm": 3.650423192875443, "learning_rate": 5.114296386281317e-07, "loss": 1.0976, "step": 6227 }, { "epoch": 0.5746050051897128, "grad_norm": 1.7808354335579697, "learning_rate": 5.112446297369345e-07, "loss": 0.6677, "step": 6228 }, { "epoch": 0.5746972667512398, "grad_norm": 1.8502618110215394, "learning_rate": 5.11059631154428e-07, "loss": 0.6783, "step": 6229 }, { "epoch": 0.5747895283127666, "grad_norm": 2.4380896231259856, "learning_rate": 5.108746428973771e-07, "loss": 0.9668, "step": 6230 }, { "epoch": 0.5747895283127666, "eval_GEN Loss": 0.4472537040710449, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3901454508304596, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8471454381942749, "eval_runtime": 57.3268, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6230 }, { "epoch": 0.5748817898742936, "grad_norm": 1.7610658515690787, "learning_rate": 5.106896649825453e-07, "loss": 0.7222, "step": 6231 }, { "epoch": 0.5749740514358206, "grad_norm": 1.796302167953163, "learning_rate": 5.105046974266964e-07, "loss": 0.5969, "step": 6232 }, { "epoch": 0.5750663129973475, "grad_norm": 3.310097208396216, "learning_rate": 5.103197402465919e-07, "loss": 1.0236, "step": 6233 }, { "epoch": 0.5751585745588744, "grad_norm": 2.0031917256681, "learning_rate": 5.101347934589929e-07, "loss": 0.6425, "step": 6234 }, { "epoch": 0.5752508361204013, "grad_norm": 1.669421328953246, "learning_rate": 5.099498570806599e-07, "loss": 0.6156, "step": 6235 }, { "epoch": 0.5752508361204013, "eval_GEN Loss": 0.44629761576652527, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3836534023284912, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8453124761581421, "eval_runtime": 57.3424, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6235 }, { "epoch": 0.5753430976819283, "grad_norm": 1.7075303966703184, "learning_rate": 5.09764931128352e-07, "loss": 0.5507, "step": 6236 }, { "epoch": 0.5754353592434552, "grad_norm": 2.0412386661491895, "learning_rate": 5.095800156188274e-07, "loss": 0.9103, "step": 6237 }, { "epoch": 0.5755276208049821, "grad_norm": 1.9685970693040504, "learning_rate": 5.093951105688433e-07, "loss": 0.6855, "step": 6238 }, { "epoch": 0.5756198823665091, "grad_norm": 1.1805826720932644, "learning_rate": 5.092102159951563e-07, "loss": 0.669, "step": 6239 }, { "epoch": 0.5757121439280359, "grad_norm": 1.8840681972806004, "learning_rate": 5.090253319145219e-07, "loss": 0.7034, "step": 6240 }, { "epoch": 0.5757121439280359, "eval_GEN Loss": 0.4456259608268738, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3735443949699402, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.84765625, "eval_runtime": 57.3844, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6240 }, { "epoch": 0.5758044054895629, "grad_norm": 1.843632281650483, "learning_rate": 5.088404583436944e-07, "loss": 0.5237, "step": 6241 }, { "epoch": 0.5758966670510899, "grad_norm": 1.1925620217158261, "learning_rate": 5.086555952994274e-07, "loss": 0.5959, "step": 6242 }, { "epoch": 0.5759889286126167, "grad_norm": 1.8954381024669165, "learning_rate": 5.084707427984735e-07, "loss": 0.6655, "step": 6243 }, { "epoch": 0.5760811901741437, "grad_norm": 2.8560300470362288, "learning_rate": 5.082859008575844e-07, "loss": 0.9426, "step": 6244 }, { "epoch": 0.5761734517356706, "grad_norm": 2.4007087021532008, "learning_rate": 5.081010694935102e-07, "loss": 0.8362, "step": 6245 }, { "epoch": 0.5761734517356706, "eval_GEN Loss": 0.4449399709701538, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3680694103240967, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8457632064819336, "eval_runtime": 57.4413, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 6245 }, { "epoch": 0.5762657132971976, "grad_norm": 1.8522733425907665, "learning_rate": 5.079162487230016e-07, "loss": 0.592, "step": 6246 }, { "epoch": 0.5763579748587245, "grad_norm": 1.7095599288890162, "learning_rate": 5.077314385628067e-07, "loss": 0.7616, "step": 6247 }, { "epoch": 0.5764502364202514, "grad_norm": 3.2767200775512353, "learning_rate": 5.075466390296735e-07, "loss": 0.7846, "step": 6248 }, { "epoch": 0.5765424979817784, "grad_norm": 1.3149887909056912, "learning_rate": 5.073618501403485e-07, "loss": 0.5795, "step": 6249 }, { "epoch": 0.5766347595433052, "grad_norm": 3.2123919431283485, "learning_rate": 5.07177071911578e-07, "loss": 0.9979, "step": 6250 }, { "epoch": 0.5766347595433052, "eval_GEN Loss": 0.44393929839134216, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36147376894950867, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8466646671295166, "eval_runtime": 57.1671, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6250 }, { "epoch": 0.5767270211048322, "grad_norm": 1.5750175134131081, "learning_rate": 5.069923043601066e-07, "loss": 0.5442, "step": 6251 }, { "epoch": 0.5768192826663592, "grad_norm": 3.1293236809123033, "learning_rate": 5.068075475026784e-07, "loss": 0.8603, "step": 6252 }, { "epoch": 0.576911544227886, "grad_norm": 2.0553066472715593, "learning_rate": 5.066228013560363e-07, "loss": 0.7489, "step": 6253 }, { "epoch": 0.577003805789413, "grad_norm": 2.2145444563581407, "learning_rate": 5.064380659369224e-07, "loss": 0.7646, "step": 6254 }, { "epoch": 0.5770960673509399, "grad_norm": 2.1598061127323747, "learning_rate": 5.062533412620774e-07, "loss": 0.5759, "step": 6255 }, { "epoch": 0.5770960673509399, "eval_GEN Loss": 0.44289496541023254, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3601723313331604, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8483774065971375, "eval_runtime": 57.4472, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 6255 }, { "epoch": 0.5771883289124669, "grad_norm": 2.457290089704898, "learning_rate": 5.060686273482413e-07, "loss": 0.7559, "step": 6256 }, { "epoch": 0.5772805904739938, "grad_norm": 2.650896940737318, "learning_rate": 5.058839242121537e-07, "loss": 0.8371, "step": 6257 }, { "epoch": 0.5773728520355207, "grad_norm": 2.449056681175489, "learning_rate": 5.056992318705524e-07, "loss": 0.7286, "step": 6258 }, { "epoch": 0.5774651135970477, "grad_norm": 1.34394039304556, "learning_rate": 5.055145503401742e-07, "loss": 0.5618, "step": 6259 }, { "epoch": 0.5775573751585745, "grad_norm": 2.1255001658686674, "learning_rate": 5.053298796377558e-07, "loss": 0.6661, "step": 6260 }, { "epoch": 0.5775573751585745, "eval_GEN Loss": 0.44230708479881287, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36031216382980347, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.844531238079071, "eval_runtime": 57.4223, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 6260 }, { "epoch": 0.5776496367201015, "grad_norm": 1.9793485007299743, "learning_rate": 5.051452197800321e-07, "loss": 0.6457, "step": 6261 }, { "epoch": 0.5777418982816284, "grad_norm": 1.6664710909440852, "learning_rate": 5.049605707837371e-07, "loss": 0.6058, "step": 6262 }, { "epoch": 0.5778341598431553, "grad_norm": 1.1550179285404405, "learning_rate": 5.047759326656041e-07, "loss": 0.7131, "step": 6263 }, { "epoch": 0.5779264214046823, "grad_norm": 2.3115722249202504, "learning_rate": 5.045913054423654e-07, "loss": 0.6716, "step": 6264 }, { "epoch": 0.5780186829662092, "grad_norm": 1.6942400930624286, "learning_rate": 5.044066891307521e-07, "loss": 0.7231, "step": 6265 }, { "epoch": 0.5780186829662092, "eval_GEN Loss": 0.44247403740882874, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3615669310092926, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8438401222229004, "eval_runtime": 57.2733, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6265 }, { "epoch": 0.5781109445277361, "grad_norm": 2.3643043527321015, "learning_rate": 5.042220837474945e-07, "loss": 0.6277, "step": 6266 }, { "epoch": 0.578203206089263, "grad_norm": 2.239889924641611, "learning_rate": 5.040374893093216e-07, "loss": 0.7217, "step": 6267 }, { "epoch": 0.57829546765079, "grad_norm": 2.4853813367192, "learning_rate": 5.03852905832962e-07, "loss": 0.6224, "step": 6268 }, { "epoch": 0.578387729212317, "grad_norm": 1.2993049628261604, "learning_rate": 5.036683333351427e-07, "loss": 0.5844, "step": 6269 }, { "epoch": 0.5784799907738438, "grad_norm": 1.7405560383155774, "learning_rate": 5.034837718325898e-07, "loss": 0.7771, "step": 6270 }, { "epoch": 0.5784799907738438, "eval_GEN Loss": 0.44289132952690125, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35844630002975464, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8411959409713745, "eval_runtime": 56.2499, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6270 }, { "epoch": 0.5785722523353708, "grad_norm": 1.4686108293130504, "learning_rate": 5.032992213420291e-07, "loss": 0.544, "step": 6271 }, { "epoch": 0.5786645138968977, "grad_norm": 3.2371706941018754, "learning_rate": 5.031146818801844e-07, "loss": 0.8877, "step": 6272 }, { "epoch": 0.5787567754584246, "grad_norm": 2.4803819605256407, "learning_rate": 5.029301534637792e-07, "loss": 0.8763, "step": 6273 }, { "epoch": 0.5788490370199516, "grad_norm": 1.8970274086804548, "learning_rate": 5.027456361095355e-07, "loss": 0.56, "step": 6274 }, { "epoch": 0.5789412985814785, "grad_norm": 2.455877829542905, "learning_rate": 5.025611298341746e-07, "loss": 0.878, "step": 6275 }, { "epoch": 0.5789412985814785, "eval_GEN Loss": 0.4429391324520111, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3621702492237091, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8396634459495544, "eval_runtime": 57.2951, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6275 }, { "epoch": 0.5790335601430054, "grad_norm": 3.2251583862203934, "learning_rate": 5.023766346544169e-07, "loss": 0.7686, "step": 6276 }, { "epoch": 0.5791258217045323, "grad_norm": 1.9479865836231116, "learning_rate": 5.021921505869816e-07, "loss": 0.7707, "step": 6277 }, { "epoch": 0.5792180832660593, "grad_norm": 1.5524351140581134, "learning_rate": 5.020076776485869e-07, "loss": 0.58, "step": 6278 }, { "epoch": 0.5793103448275863, "grad_norm": 1.519012393718598, "learning_rate": 5.018232158559502e-07, "loss": 0.6036, "step": 6279 }, { "epoch": 0.5794026063891131, "grad_norm": 2.0416936311821448, "learning_rate": 5.016387652257875e-07, "loss": 0.6293, "step": 6280 }, { "epoch": 0.5794026063891131, "eval_GEN Loss": 0.4442954361438751, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3694881498813629, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8370493054389954, "eval_runtime": 57.3396, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6280 }, { "epoch": 0.5794948679506401, "grad_norm": 1.7865320122746156, "learning_rate": 5.014543257748138e-07, "loss": 0.5878, "step": 6281 }, { "epoch": 0.579587129512167, "grad_norm": 2.4777519949035205, "learning_rate": 5.012698975197438e-07, "loss": 0.6083, "step": 6282 }, { "epoch": 0.5796793910736939, "grad_norm": 1.6135418325346162, "learning_rate": 5.010854804772905e-07, "loss": 0.557, "step": 6283 }, { "epoch": 0.5797716526352209, "grad_norm": 1.4613067619218074, "learning_rate": 5.009010746641658e-07, "loss": 0.5939, "step": 6284 }, { "epoch": 0.5798639141967478, "grad_norm": 2.5948786423169676, "learning_rate": 5.007166800970812e-07, "loss": 0.8604, "step": 6285 }, { "epoch": 0.5798639141967478, "eval_GEN Loss": 0.44443362951278687, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37374812364578247, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8397836685180664, "eval_runtime": 57.0403, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6285 }, { "epoch": 0.5799561757582747, "grad_norm": 1.8141132517970568, "learning_rate": 5.005322967927466e-07, "loss": 0.6753, "step": 6286 }, { "epoch": 0.5800484373198016, "grad_norm": 2.108167251244058, "learning_rate": 5.003479247678713e-07, "loss": 0.6162, "step": 6287 }, { "epoch": 0.5801406988813286, "grad_norm": 1.4581910217297223, "learning_rate": 5.001635640391631e-07, "loss": 0.3945, "step": 6288 }, { "epoch": 0.5802329604428555, "grad_norm": 1.6632769325541847, "learning_rate": 4.999792146233293e-07, "loss": 0.7814, "step": 6289 }, { "epoch": 0.5803252220043824, "grad_norm": 2.040496561050976, "learning_rate": 4.99794876537076e-07, "loss": 0.6227, "step": 6290 }, { "epoch": 0.5803252220043824, "eval_GEN Loss": 0.4442143738269806, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37518489360809326, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8455829620361328, "eval_runtime": 57.1761, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6290 }, { "epoch": 0.5804174835659094, "grad_norm": 2.3321307787079606, "learning_rate": 4.996105497971077e-07, "loss": 0.6832, "step": 6291 }, { "epoch": 0.5805097451274362, "grad_norm": 2.368584793838458, "learning_rate": 4.99426234420129e-07, "loss": 0.9353, "step": 6292 }, { "epoch": 0.5806020066889632, "grad_norm": 2.0964144106359015, "learning_rate": 4.992419304228426e-07, "loss": 0.6662, "step": 6293 }, { "epoch": 0.5806942682504901, "grad_norm": 1.5565977721455277, "learning_rate": 4.990576378219504e-07, "loss": 0.5956, "step": 6294 }, { "epoch": 0.5807865298120171, "grad_norm": 2.1614000672122726, "learning_rate": 4.988733566341532e-07, "loss": 0.8804, "step": 6295 }, { "epoch": 0.5807865298120171, "eval_GEN Loss": 0.4442565143108368, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3755781054496765, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8527644276618958, "eval_runtime": 57.1918, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6295 }, { "epoch": 0.580878791373544, "grad_norm": 1.9639742551272548, "learning_rate": 4.98689086876151e-07, "loss": 0.9143, "step": 6296 }, { "epoch": 0.5809710529350709, "grad_norm": 2.597084382572254, "learning_rate": 4.985048285646426e-07, "loss": 0.7808, "step": 6297 }, { "epoch": 0.5810633144965979, "grad_norm": 2.6293191136813134, "learning_rate": 4.983205817163258e-07, "loss": 0.7581, "step": 6298 }, { "epoch": 0.5811555760581247, "grad_norm": 2.046438334957246, "learning_rate": 4.981363463478971e-07, "loss": 0.6627, "step": 6299 }, { "epoch": 0.5812478376196517, "grad_norm": 1.4895247222017614, "learning_rate": 4.979521224760525e-07, "loss": 0.6744, "step": 6300 }, { "epoch": 0.5812478376196517, "eval_GEN Loss": 0.44413647055625916, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3791421353816986, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8539062738418579, "eval_runtime": 56.4142, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6300 }, { "epoch": 0.5813400991811787, "grad_norm": 2.451819491882502, "learning_rate": 4.977679101174866e-07, "loss": 0.8531, "step": 6301 }, { "epoch": 0.5814323607427055, "grad_norm": 1.5795226193015892, "learning_rate": 4.975837092888928e-07, "loss": 0.6306, "step": 6302 }, { "epoch": 0.5815246223042325, "grad_norm": 2.1860492052888403, "learning_rate": 4.973995200069638e-07, "loss": 0.6333, "step": 6303 }, { "epoch": 0.5816168838657594, "grad_norm": 1.4055319141572524, "learning_rate": 4.972153422883913e-07, "loss": 0.5979, "step": 6304 }, { "epoch": 0.5817091454272864, "grad_norm": 1.4755694853048007, "learning_rate": 4.970311761498656e-07, "loss": 0.5261, "step": 6305 }, { "epoch": 0.5817091454272864, "eval_GEN Loss": 0.44374459981918335, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38112762570381165, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.851832926273346, "eval_runtime": 57.259, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6305 }, { "epoch": 0.5818014069888133, "grad_norm": 2.2001000874785404, "learning_rate": 4.968470216080759e-07, "loss": 0.57, "step": 6306 }, { "epoch": 0.5818936685503402, "grad_norm": 2.510790698824779, "learning_rate": 4.966628786797111e-07, "loss": 0.701, "step": 6307 }, { "epoch": 0.5819859301118672, "grad_norm": 1.9789588740976152, "learning_rate": 4.964787473814582e-07, "loss": 0.6007, "step": 6308 }, { "epoch": 0.582078191673394, "grad_norm": 2.5065788086234644, "learning_rate": 4.962946277300034e-07, "loss": 0.7856, "step": 6309 }, { "epoch": 0.582170453234921, "grad_norm": 1.8520981949203834, "learning_rate": 4.961105197420321e-07, "loss": 0.7045, "step": 6310 }, { "epoch": 0.582170453234921, "eval_GEN Loss": 0.44272610545158386, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3802703022956848, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.848437488079071, "eval_runtime": 57.3111, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6310 }, { "epoch": 0.582262714796448, "grad_norm": 2.1157385848926884, "learning_rate": 4.959264234342283e-07, "loss": 0.7055, "step": 6311 }, { "epoch": 0.5823549763579748, "grad_norm": 2.159289235060167, "learning_rate": 4.957423388232753e-07, "loss": 0.5475, "step": 6312 }, { "epoch": 0.5824472379195018, "grad_norm": 2.5108060066041986, "learning_rate": 4.955582659258548e-07, "loss": 0.6717, "step": 6313 }, { "epoch": 0.5825394994810287, "grad_norm": 3.0379103860845826, "learning_rate": 4.953742047586482e-07, "loss": 0.598, "step": 6314 }, { "epoch": 0.5826317610425557, "grad_norm": 1.4903435992595202, "learning_rate": 4.951901553383352e-07, "loss": 0.6608, "step": 6315 }, { "epoch": 0.5826317610425557, "eval_GEN Loss": 0.4429214596748352, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37416115403175354, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8474158644676208, "eval_runtime": 57.4865, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 6315 }, { "epoch": 0.5827240226040826, "grad_norm": 2.0775702547374206, "learning_rate": 4.950061176815945e-07, "loss": 0.773, "step": 6316 }, { "epoch": 0.5828162841656095, "grad_norm": 2.0804216411475998, "learning_rate": 4.94822091805104e-07, "loss": 0.7467, "step": 6317 }, { "epoch": 0.5829085457271365, "grad_norm": 2.0743450504072225, "learning_rate": 4.946380777255406e-07, "loss": 0.4655, "step": 6318 }, { "epoch": 0.5830008072886633, "grad_norm": 1.391862940111571, "learning_rate": 4.944540754595799e-07, "loss": 0.5445, "step": 6319 }, { "epoch": 0.5830930688501903, "grad_norm": 1.3839252587051885, "learning_rate": 4.942700850238959e-07, "loss": 0.5456, "step": 6320 }, { "epoch": 0.5830930688501903, "eval_GEN Loss": 0.44036203622817993, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3720378875732422, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8463341593742371, "eval_runtime": 57.1007, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6320 }, { "epoch": 0.5831853304117173, "grad_norm": 2.7710609014344207, "learning_rate": 4.94086106435163e-07, "loss": 0.7679, "step": 6321 }, { "epoch": 0.5832775919732441, "grad_norm": 1.7834977000149344, "learning_rate": 4.939021397100531e-07, "loss": 0.5372, "step": 6322 }, { "epoch": 0.5833698535347711, "grad_norm": 1.8951693050704401, "learning_rate": 4.937181848652375e-07, "loss": 0.7232, "step": 6323 }, { "epoch": 0.583462115096298, "grad_norm": 2.226408515806397, "learning_rate": 4.935342419173868e-07, "loss": 0.6092, "step": 6324 }, { "epoch": 0.583554376657825, "grad_norm": 2.074179129635041, "learning_rate": 4.933503108831701e-07, "loss": 0.6004, "step": 6325 }, { "epoch": 0.583554376657825, "eval_GEN Loss": 0.4406622052192688, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3691295087337494, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8461538553237915, "eval_runtime": 57.2617, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6325 }, { "epoch": 0.5836466382193518, "grad_norm": 2.1560652496204638, "learning_rate": 4.931663917792553e-07, "loss": 0.673, "step": 6326 }, { "epoch": 0.5837388997808788, "grad_norm": 2.0338475033024586, "learning_rate": 4.929824846223094e-07, "loss": 0.6847, "step": 6327 }, { "epoch": 0.5838311613424058, "grad_norm": 2.299214555895757, "learning_rate": 4.927985894289988e-07, "loss": 0.7344, "step": 6328 }, { "epoch": 0.5839234229039326, "grad_norm": 2.1072673019465085, "learning_rate": 4.926147062159881e-07, "loss": 0.6978, "step": 6329 }, { "epoch": 0.5840156844654596, "grad_norm": 3.4832658474393563, "learning_rate": 4.924308349999411e-07, "loss": 0.7795, "step": 6330 }, { "epoch": 0.5840156844654596, "eval_GEN Loss": 0.4412643611431122, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3700779378414154, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8445011973381042, "eval_runtime": 56.2308, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6330 }, { "epoch": 0.5841079460269865, "grad_norm": 2.041076100289549, "learning_rate": 4.922469757975202e-07, "loss": 0.5703, "step": 6331 }, { "epoch": 0.5842002075885134, "grad_norm": 2.087624595157083, "learning_rate": 4.920631286253877e-07, "loss": 0.7623, "step": 6332 }, { "epoch": 0.5842924691500404, "grad_norm": 1.927244339935134, "learning_rate": 4.918792935002037e-07, "loss": 0.6059, "step": 6333 }, { "epoch": 0.5843847307115673, "grad_norm": 2.1782142807916225, "learning_rate": 4.916954704386274e-07, "loss": 0.7809, "step": 6334 }, { "epoch": 0.5844769922730942, "grad_norm": 3.0772800940299767, "learning_rate": 4.915116594573177e-07, "loss": 0.6957, "step": 6335 }, { "epoch": 0.5844769922730942, "eval_GEN Loss": 0.4407137632369995, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3753919303417206, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8417067527770996, "eval_runtime": 56.4171, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6335 }, { "epoch": 0.5845692538346211, "grad_norm": 1.4363302015534385, "learning_rate": 4.913278605729314e-07, "loss": 0.5564, "step": 6336 }, { "epoch": 0.5846615153961481, "grad_norm": 3.010118973568409, "learning_rate": 4.911440738021248e-07, "loss": 0.986, "step": 6337 }, { "epoch": 0.584753776957675, "grad_norm": 1.578629755208319, "learning_rate": 4.909602991615527e-07, "loss": 0.66, "step": 6338 }, { "epoch": 0.5848460385192019, "grad_norm": 2.1003052352339218, "learning_rate": 4.907765366678695e-07, "loss": 0.6356, "step": 6339 }, { "epoch": 0.5849383000807289, "grad_norm": 1.8445080183027478, "learning_rate": 4.905927863377279e-07, "loss": 0.6926, "step": 6340 }, { "epoch": 0.5849383000807289, "eval_GEN Loss": 0.44224226474761963, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.38645339012145996, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8432692289352417, "eval_runtime": 56.5157, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6340 }, { "epoch": 0.5850305616422558, "grad_norm": 2.311893297779681, "learning_rate": 4.904090481877792e-07, "loss": 0.8451, "step": 6341 }, { "epoch": 0.5851228232037827, "grad_norm": 2.213082397886451, "learning_rate": 4.902253222346746e-07, "loss": 0.8056, "step": 6342 }, { "epoch": 0.5852150847653097, "grad_norm": 2.4697836448702657, "learning_rate": 4.900416084950637e-07, "loss": 0.7727, "step": 6343 }, { "epoch": 0.5853073463268366, "grad_norm": 2.6726922541668525, "learning_rate": 4.898579069855944e-07, "loss": 0.6871, "step": 6344 }, { "epoch": 0.5853996078883635, "grad_norm": 1.776549134004778, "learning_rate": 4.896742177229143e-07, "loss": 0.7941, "step": 6345 }, { "epoch": 0.5853996078883635, "eval_GEN Loss": 0.4420793950557709, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3891884386539459, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8507512211799622, "eval_runtime": 56.6157, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 6345 }, { "epoch": 0.5854918694498904, "grad_norm": 2.3821863663358718, "learning_rate": 4.894905407236696e-07, "loss": 0.9005, "step": 6346 }, { "epoch": 0.5855841310114174, "grad_norm": 1.5916868697808213, "learning_rate": 4.893068760045054e-07, "loss": 0.8775, "step": 6347 }, { "epoch": 0.5856763925729443, "grad_norm": 1.7094582019607243, "learning_rate": 4.891232235820656e-07, "loss": 0.6847, "step": 6348 }, { "epoch": 0.5857686541344712, "grad_norm": 1.955528493131927, "learning_rate": 4.889395834729934e-07, "loss": 0.6795, "step": 6349 }, { "epoch": 0.5858609156959982, "grad_norm": 2.8118427103897137, "learning_rate": 4.887559556939301e-07, "loss": 0.8416, "step": 6350 }, { "epoch": 0.5858609156959982, "eval_GEN Loss": 0.4428744912147522, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3934004306793213, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8495192527770996, "eval_runtime": 56.312, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6350 }, { "epoch": 0.585953177257525, "grad_norm": 1.5413329514594336, "learning_rate": 4.885723402615167e-07, "loss": 0.6495, "step": 6351 }, { "epoch": 0.586045438819052, "grad_norm": 1.4748978707504359, "learning_rate": 4.883887371923923e-07, "loss": 0.6651, "step": 6352 }, { "epoch": 0.586137700380579, "grad_norm": 2.0225482972211193, "learning_rate": 4.882051465031958e-07, "loss": 0.6693, "step": 6353 }, { "epoch": 0.5862299619421059, "grad_norm": 2.104639667350112, "learning_rate": 4.880215682105642e-07, "loss": 0.6866, "step": 6354 }, { "epoch": 0.5863222235036328, "grad_norm": 2.097344814375573, "learning_rate": 4.878380023311337e-07, "loss": 0.6633, "step": 6355 }, { "epoch": 0.5863222235036328, "eval_GEN Loss": 0.4431023597717285, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.38204213976860046, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8510516881942749, "eval_runtime": 56.4405, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6355 }, { "epoch": 0.5864144850651597, "grad_norm": 2.32764207806017, "learning_rate": 4.876544488815391e-07, "loss": 0.6264, "step": 6356 }, { "epoch": 0.5865067466266867, "grad_norm": 2.058804402241401, "learning_rate": 4.874709078784148e-07, "loss": 0.6048, "step": 6357 }, { "epoch": 0.5865990081882135, "grad_norm": 2.056025516621196, "learning_rate": 4.872873793383932e-07, "loss": 0.6682, "step": 6358 }, { "epoch": 0.5866912697497405, "grad_norm": 2.764498621048737, "learning_rate": 4.871038632781061e-07, "loss": 0.6149, "step": 6359 }, { "epoch": 0.5867835313112675, "grad_norm": 2.6725250149700397, "learning_rate": 4.86920359714184e-07, "loss": 0.5839, "step": 6360 }, { "epoch": 0.5867835313112675, "eval_GEN Loss": 0.4418243169784546, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36558327078819275, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8512019515037537, "eval_runtime": 56.4061, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6360 }, { "epoch": 0.5868757928727943, "grad_norm": 1.4678435602088913, "learning_rate": 4.867368686632562e-07, "loss": 0.6793, "step": 6361 }, { "epoch": 0.5869680544343213, "grad_norm": 1.6303672106339337, "learning_rate": 4.86553390141951e-07, "loss": 0.6536, "step": 6362 }, { "epoch": 0.5870603159958482, "grad_norm": 2.3622014557314777, "learning_rate": 4.863699241668953e-07, "loss": 0.6522, "step": 6363 }, { "epoch": 0.5871525775573752, "grad_norm": 1.4522805270109873, "learning_rate": 4.861864707547155e-07, "loss": 0.6952, "step": 6364 }, { "epoch": 0.5872448391189021, "grad_norm": 1.743194882159659, "learning_rate": 4.860030299220363e-07, "loss": 0.5572, "step": 6365 }, { "epoch": 0.5872448391189021, "eval_GEN Loss": 0.44202345609664917, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.354360967874527, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8638821840286255, "eval_runtime": 56.2228, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6365 }, { "epoch": 0.587337100680429, "grad_norm": 1.3703777359892166, "learning_rate": 4.858196016854809e-07, "loss": 0.6615, "step": 6366 }, { "epoch": 0.587429362241956, "grad_norm": 1.970332804009397, "learning_rate": 4.856361860616726e-07, "loss": 0.7595, "step": 6367 }, { "epoch": 0.5875216238034828, "grad_norm": 2.421696323283443, "learning_rate": 4.854527830672325e-07, "loss": 0.7434, "step": 6368 }, { "epoch": 0.5876138853650098, "grad_norm": 3.8773145142819025, "learning_rate": 4.852693927187808e-07, "loss": 0.8145, "step": 6369 }, { "epoch": 0.5877061469265368, "grad_norm": 2.1178770114383623, "learning_rate": 4.850860150329367e-07, "loss": 0.6911, "step": 6370 }, { "epoch": 0.5877061469265368, "eval_GEN Loss": 0.4411100447177887, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35600876808166504, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8661057949066162, "eval_runtime": 56.1708, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6370 }, { "epoch": 0.5877984084880636, "grad_norm": 1.4612553205864607, "learning_rate": 4.84902650026318e-07, "loss": 0.5906, "step": 6371 }, { "epoch": 0.5878906700495906, "grad_norm": 1.7211096838689979, "learning_rate": 4.847192977155419e-07, "loss": 0.6271, "step": 6372 }, { "epoch": 0.5879829316111175, "grad_norm": 2.5860348471763315, "learning_rate": 4.845359581172235e-07, "loss": 0.5875, "step": 6373 }, { "epoch": 0.5880751931726445, "grad_norm": 1.8568817249199407, "learning_rate": 4.84352631247978e-07, "loss": 0.761, "step": 6374 }, { "epoch": 0.5881674547341714, "grad_norm": 2.1615719619733555, "learning_rate": 4.841693171244184e-07, "loss": 0.9243, "step": 6375 }, { "epoch": 0.5881674547341714, "eval_GEN Loss": 0.43982282280921936, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3575236201286316, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8550480604171753, "eval_runtime": 56.2656, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6375 }, { "epoch": 0.5882597162956983, "grad_norm": 1.7830165711878478, "learning_rate": 4.839860157631568e-07, "loss": 0.7258, "step": 6376 }, { "epoch": 0.5883519778572253, "grad_norm": 2.3646416153974847, "learning_rate": 4.838027271808043e-07, "loss": 0.7114, "step": 6377 }, { "epoch": 0.5884442394187521, "grad_norm": 1.5797951957792824, "learning_rate": 4.836194513939712e-07, "loss": 0.6892, "step": 6378 }, { "epoch": 0.5885365009802791, "grad_norm": 2.109488333025438, "learning_rate": 4.834361884192659e-07, "loss": 0.8391, "step": 6379 }, { "epoch": 0.5886287625418061, "grad_norm": 2.064741291650644, "learning_rate": 4.832529382732959e-07, "loss": 0.5245, "step": 6380 }, { "epoch": 0.5886287625418061, "eval_GEN Loss": 0.43987032771110535, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35861408710479736, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8521634340286255, "eval_runtime": 56.5027, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6380 }, { "epoch": 0.5887210241033329, "grad_norm": 2.077270007291993, "learning_rate": 4.830697009726679e-07, "loss": 0.6842, "step": 6381 }, { "epoch": 0.5888132856648599, "grad_norm": 1.4241280098633957, "learning_rate": 4.82886476533987e-07, "loss": 0.5452, "step": 6382 }, { "epoch": 0.5889055472263868, "grad_norm": 1.5333289934109766, "learning_rate": 4.827032649738571e-07, "loss": 0.5641, "step": 6383 }, { "epoch": 0.5889978087879137, "grad_norm": 1.7646132035185702, "learning_rate": 4.825200663088813e-07, "loss": 0.6511, "step": 6384 }, { "epoch": 0.5890900703494407, "grad_norm": 2.1311463084657056, "learning_rate": 4.823368805556616e-07, "loss": 0.6467, "step": 6385 }, { "epoch": 0.5890900703494407, "eval_GEN Loss": 0.439827024936676, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36315295100212097, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8506009578704834, "eval_runtime": 56.3637, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 6385 }, { "epoch": 0.5891823319109676, "grad_norm": 2.5252884288930186, "learning_rate": 4.821537077307982e-07, "loss": 0.5419, "step": 6386 }, { "epoch": 0.5892745934724946, "grad_norm": 1.6149830362805024, "learning_rate": 4.819705478508909e-07, "loss": 0.5706, "step": 6387 }, { "epoch": 0.5893668550340214, "grad_norm": 1.8488946018414398, "learning_rate": 4.817874009325371e-07, "loss": 0.6326, "step": 6388 }, { "epoch": 0.5894591165955484, "grad_norm": 1.8826796251944264, "learning_rate": 4.816042669923349e-07, "loss": 0.5947, "step": 6389 }, { "epoch": 0.5895513781570753, "grad_norm": 2.1680882718335197, "learning_rate": 4.814211460468797e-07, "loss": 0.7838, "step": 6390 }, { "epoch": 0.5895513781570753, "eval_GEN Loss": 0.44034624099731445, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3696105182170868, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8560396432876587, "eval_runtime": 56.3357, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6390 }, { "epoch": 0.5896436397186022, "grad_norm": 2.146358580315923, "learning_rate": 4.81238038112766e-07, "loss": 0.5641, "step": 6391 }, { "epoch": 0.5897359012801292, "grad_norm": 2.1065444958684165, "learning_rate": 4.810549432065877e-07, "loss": 0.7043, "step": 6392 }, { "epoch": 0.5898281628416561, "grad_norm": 1.9644209621161839, "learning_rate": 4.808718613449371e-07, "loss": 0.7328, "step": 6393 }, { "epoch": 0.589920424403183, "grad_norm": 1.7893361484986339, "learning_rate": 4.806887925444053e-07, "loss": 0.8122, "step": 6394 }, { "epoch": 0.5900126859647099, "grad_norm": 2.7973133751411394, "learning_rate": 4.805057368215822e-07, "loss": 0.8761, "step": 6395 }, { "epoch": 0.5900126859647099, "eval_GEN Loss": 0.44051992893218994, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3689947724342346, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8536959290504456, "eval_runtime": 56.4024, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6395 }, { "epoch": 0.5901049475262369, "grad_norm": 1.811831248407308, "learning_rate": 4.803226941930568e-07, "loss": 0.4958, "step": 6396 }, { "epoch": 0.5901972090877639, "grad_norm": 2.0905987011532394, "learning_rate": 4.801396646754165e-07, "loss": 0.687, "step": 6397 }, { "epoch": 0.5902894706492907, "grad_norm": 1.9614263486550298, "learning_rate": 4.799566482852475e-07, "loss": 0.6489, "step": 6398 }, { "epoch": 0.5903817322108177, "grad_norm": 2.3299526202037444, "learning_rate": 4.797736450391357e-07, "loss": 0.828, "step": 6399 }, { "epoch": 0.5904739937723446, "grad_norm": 2.0166873066799273, "learning_rate": 4.795906549536647e-07, "loss": 0.7585, "step": 6400 }, { "epoch": 0.5904739937723446, "eval_GEN Loss": 0.4413924217224121, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3728821277618408, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8537560105323792, "eval_runtime": 56.5532, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 6400 }, { "epoch": 0.5905662553338715, "grad_norm": 2.7344086175348683, "learning_rate": 4.794076780454175e-07, "loss": 0.757, "step": 6401 }, { "epoch": 0.5906585168953985, "grad_norm": 1.8894973906203802, "learning_rate": 4.792247143309753e-07, "loss": 0.6053, "step": 6402 }, { "epoch": 0.5907507784569254, "grad_norm": 1.7211671765975134, "learning_rate": 4.790417638269193e-07, "loss": 0.4439, "step": 6403 }, { "epoch": 0.5908430400184523, "grad_norm": 1.6997807020138318, "learning_rate": 4.788588265498284e-07, "loss": 0.6213, "step": 6404 }, { "epoch": 0.5909353015799792, "grad_norm": 2.5547435112561874, "learning_rate": 4.786759025162805e-07, "loss": 0.5909, "step": 6405 }, { "epoch": 0.5909353015799792, "eval_GEN Loss": 0.4413280785083771, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37154340744018555, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.857151448726654, "eval_runtime": 56.2402, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6405 }, { "epoch": 0.5910275631415062, "grad_norm": 2.368035316622676, "learning_rate": 4.784929917428528e-07, "loss": 0.7115, "step": 6406 }, { "epoch": 0.5911198247030331, "grad_norm": 2.001956057921037, "learning_rate": 4.783100942461208e-07, "loss": 0.6849, "step": 6407 }, { "epoch": 0.59121208626456, "grad_norm": 2.47432020801104, "learning_rate": 4.78127210042659e-07, "loss": 0.8058, "step": 6408 }, { "epoch": 0.591304347826087, "grad_norm": 1.6951619051729707, "learning_rate": 4.779443391490401e-07, "loss": 0.6494, "step": 6409 }, { "epoch": 0.5913966093876138, "grad_norm": 2.1657267717112343, "learning_rate": 4.777614815818371e-07, "loss": 0.7043, "step": 6410 }, { "epoch": 0.5913966093876138, "eval_GEN Loss": 0.44058799743652344, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3643389046192169, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8560396432876587, "eval_runtime": 56.4493, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 6410 }, { "epoch": 0.5914888709491408, "grad_norm": 2.135630789181945, "learning_rate": 4.775786373576205e-07, "loss": 0.7615, "step": 6411 }, { "epoch": 0.5915811325106678, "grad_norm": 2.475879747956815, "learning_rate": 4.773958064929594e-07, "loss": 0.8368, "step": 6412 }, { "epoch": 0.5916733940721947, "grad_norm": 1.7373482518582977, "learning_rate": 4.77212989004423e-07, "loss": 0.5903, "step": 6413 }, { "epoch": 0.5917656556337216, "grad_norm": 1.885625012391937, "learning_rate": 4.770301849085781e-07, "loss": 0.7055, "step": 6414 }, { "epoch": 0.5918579171952485, "grad_norm": 1.8796481682906139, "learning_rate": 4.768473942219907e-07, "loss": 0.6003, "step": 6415 }, { "epoch": 0.5918579171952485, "eval_GEN Loss": 0.44151726365089417, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36554262042045593, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8587139248847961, "eval_runtime": 56.5029, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6415 }, { "epoch": 0.5919501787567755, "grad_norm": 2.136727328194295, "learning_rate": 4.766646169612256e-07, "loss": 0.7684, "step": 6416 }, { "epoch": 0.5920424403183023, "grad_norm": 1.697300819022544, "learning_rate": 4.7648185314284654e-07, "loss": 0.6949, "step": 6417 }, { "epoch": 0.5921347018798293, "grad_norm": 2.7715115403272286, "learning_rate": 4.7629910278341566e-07, "loss": 0.7045, "step": 6418 }, { "epoch": 0.5922269634413563, "grad_norm": 2.9164263132136066, "learning_rate": 4.76116365899494e-07, "loss": 0.6322, "step": 6419 }, { "epoch": 0.5923192250028831, "grad_norm": 2.0269560765475294, "learning_rate": 4.7593364250764165e-07, "loss": 0.5973, "step": 6420 }, { "epoch": 0.5923192250028831, "eval_GEN Loss": 0.4410720467567444, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35991284251213074, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8563100695610046, "eval_runtime": 56.5167, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6420 }, { "epoch": 0.5924114865644101, "grad_norm": 2.735370430449146, "learning_rate": 4.757509326244174e-07, "loss": 0.7976, "step": 6421 }, { "epoch": 0.592503748125937, "grad_norm": 2.0434911280494825, "learning_rate": 4.755682362663785e-07, "loss": 0.7614, "step": 6422 }, { "epoch": 0.592596009687464, "grad_norm": 1.4553768032667422, "learning_rate": 4.75385553450081e-07, "loss": 0.4036, "step": 6423 }, { "epoch": 0.5926882712489909, "grad_norm": 1.467675601861643, "learning_rate": 4.752028841920804e-07, "loss": 0.6869, "step": 6424 }, { "epoch": 0.5927805328105178, "grad_norm": 1.8587339158996627, "learning_rate": 4.750202285089302e-07, "loss": 0.4906, "step": 6425 }, { "epoch": 0.5927805328105178, "eval_GEN Loss": 0.4408237040042877, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35697683691978455, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8539062738418579, "eval_runtime": 56.5281, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6425 }, { "epoch": 0.5928727943720448, "grad_norm": 1.6616590109670193, "learning_rate": 4.74837586417183e-07, "loss": 0.4564, "step": 6426 }, { "epoch": 0.5929650559335716, "grad_norm": 4.441414311181033, "learning_rate": 4.7465495793338977e-07, "loss": 1.1734, "step": 6427 }, { "epoch": 0.5930573174950986, "grad_norm": 2.2661948403823637, "learning_rate": 4.744723430741012e-07, "loss": 0.8081, "step": 6428 }, { "epoch": 0.5931495790566256, "grad_norm": 2.490995028912069, "learning_rate": 4.742897418558659e-07, "loss": 0.8822, "step": 6429 }, { "epoch": 0.5932418406181524, "grad_norm": 2.2736010568551337, "learning_rate": 4.741071542952312e-07, "loss": 0.8079, "step": 6430 }, { "epoch": 0.5932418406181524, "eval_GEN Loss": 0.44084686040878296, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36095044016838074, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8500000238418579, "eval_runtime": 56.4585, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 6430 }, { "epoch": 0.5933341021796794, "grad_norm": 1.6176980926757594, "learning_rate": 4.7392458040874384e-07, "loss": 0.4944, "step": 6431 }, { "epoch": 0.5934263637412063, "grad_norm": 3.3619785789496617, "learning_rate": 4.7374202021294877e-07, "loss": 0.8906, "step": 6432 }, { "epoch": 0.5935186253027332, "grad_norm": 2.298869072932653, "learning_rate": 4.7355947372438994e-07, "loss": 0.688, "step": 6433 }, { "epoch": 0.5936108868642602, "grad_norm": 1.8793452007935396, "learning_rate": 4.7337694095960965e-07, "loss": 0.5888, "step": 6434 }, { "epoch": 0.5937031484257871, "grad_norm": 2.1617683283961284, "learning_rate": 4.7319442193514996e-07, "loss": 0.7854, "step": 6435 }, { "epoch": 0.5937031484257871, "eval_GEN Loss": 0.44120359420776367, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3709085285663605, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8528245091438293, "eval_runtime": 56.2729, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6435 }, { "epoch": 0.5937954099873141, "grad_norm": 1.9382805174607527, "learning_rate": 4.7301191666755073e-07, "loss": 0.6335, "step": 6436 }, { "epoch": 0.5938876715488409, "grad_norm": 1.6030783254302945, "learning_rate": 4.728294251733505e-07, "loss": 0.6108, "step": 6437 }, { "epoch": 0.5939799331103679, "grad_norm": 1.7115048658422194, "learning_rate": 4.7264694746908756e-07, "loss": 0.5921, "step": 6438 }, { "epoch": 0.5940721946718949, "grad_norm": 1.295117419816494, "learning_rate": 4.7246448357129815e-07, "loss": 0.5508, "step": 6439 }, { "epoch": 0.5941644562334217, "grad_norm": 1.3824056190634864, "learning_rate": 4.7228203349651717e-07, "loss": 0.5768, "step": 6440 }, { "epoch": 0.5941644562334217, "eval_GEN Loss": 0.4422346353530884, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37767842411994934, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8572716116905212, "eval_runtime": 56.2548, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6440 }, { "epoch": 0.5942567177949487, "grad_norm": 1.9732800112723954, "learning_rate": 4.7209959726127866e-07, "loss": 0.6701, "step": 6441 }, { "epoch": 0.5943489793564756, "grad_norm": 1.4247227885987437, "learning_rate": 4.7191717488211544e-07, "loss": 0.4858, "step": 6442 }, { "epoch": 0.5944412409180025, "grad_norm": 1.4716726546995955, "learning_rate": 4.7173476637555877e-07, "loss": 0.622, "step": 6443 }, { "epoch": 0.5945335024795295, "grad_norm": 2.6074311333566835, "learning_rate": 4.7155237175813857e-07, "loss": 0.6344, "step": 6444 }, { "epoch": 0.5946257640410564, "grad_norm": 2.286324370503418, "learning_rate": 4.713699910463842e-07, "loss": 0.7415, "step": 6445 }, { "epoch": 0.5946257640410564, "eval_GEN Loss": 0.4428369402885437, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3816942274570465, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8628004789352417, "eval_runtime": 56.3154, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6445 }, { "epoch": 0.5947180256025834, "grad_norm": 1.8257100332726224, "learning_rate": 4.7118762425682307e-07, "loss": 0.7406, "step": 6446 }, { "epoch": 0.5948102871641102, "grad_norm": 2.3548876004911627, "learning_rate": 4.710052714059816e-07, "loss": 0.7278, "step": 6447 }, { "epoch": 0.5949025487256372, "grad_norm": 2.0244416984368265, "learning_rate": 4.708229325103845e-07, "loss": 0.797, "step": 6448 }, { "epoch": 0.594994810287164, "grad_norm": 1.9943694786620234, "learning_rate": 4.706406075865562e-07, "loss": 0.6407, "step": 6449 }, { "epoch": 0.595087071848691, "grad_norm": 1.454188470871012, "learning_rate": 4.70458296651019e-07, "loss": 0.6535, "step": 6450 }, { "epoch": 0.595087071848691, "eval_GEN Loss": 0.44378387928009033, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3770894408226013, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8625901341438293, "eval_runtime": 56.4734, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 6450 }, { "epoch": 0.595179333410218, "grad_norm": 1.6745886950725293, "learning_rate": 4.702759997202942e-07, "loss": 0.651, "step": 6451 }, { "epoch": 0.5952715949717449, "grad_norm": 1.5989023168694987, "learning_rate": 4.700937168109018e-07, "loss": 0.7902, "step": 6452 }, { "epoch": 0.5953638565332718, "grad_norm": 1.9885092623867306, "learning_rate": 4.6991144793936066e-07, "loss": 0.761, "step": 6453 }, { "epoch": 0.5954561180947987, "grad_norm": 2.5133955592809363, "learning_rate": 4.697291931221882e-07, "loss": 0.8365, "step": 6454 }, { "epoch": 0.5955483796563257, "grad_norm": 1.936780889341621, "learning_rate": 4.6954695237590044e-07, "loss": 0.7249, "step": 6455 }, { "epoch": 0.5955483796563257, "eval_GEN Loss": 0.4422670900821686, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37465909123420715, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8682091236114502, "eval_runtime": 56.644, "eval_samples_per_second": 1.148, "eval_steps_per_second": 0.088, "step": 6455 }, { "epoch": 0.5956406412178527, "grad_norm": 2.2596875712811735, "learning_rate": 4.693647257170128e-07, "loss": 0.6086, "step": 6456 }, { "epoch": 0.5957329027793795, "grad_norm": 3.1552957839902533, "learning_rate": 4.6918251316203865e-07, "loss": 0.7688, "step": 6457 }, { "epoch": 0.5958251643409065, "grad_norm": 2.764774672416707, "learning_rate": 4.6900031472749045e-07, "loss": 0.7014, "step": 6458 }, { "epoch": 0.5959174259024334, "grad_norm": 1.281245006063962, "learning_rate": 4.6881813042987905e-07, "loss": 0.6266, "step": 6459 }, { "epoch": 0.5960096874639603, "grad_norm": 1.8744019560085594, "learning_rate": 4.6863596028571475e-07, "loss": 0.5373, "step": 6460 }, { "epoch": 0.5960096874639603, "eval_GEN Loss": 0.442702978849411, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37321579456329346, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8775841593742371, "eval_runtime": 56.2986, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6460 }, { "epoch": 0.5961019490254873, "grad_norm": 1.6226400717670013, "learning_rate": 4.684538043115058e-07, "loss": 0.6575, "step": 6461 }, { "epoch": 0.5961942105870142, "grad_norm": 1.976118787673476, "learning_rate": 4.682716625237595e-07, "loss": 0.6579, "step": 6462 }, { "epoch": 0.5962864721485411, "grad_norm": 2.5011602649985085, "learning_rate": 4.680895349389817e-07, "loss": 0.5649, "step": 6463 }, { "epoch": 0.596378733710068, "grad_norm": 1.6211096249298098, "learning_rate": 4.6790742157367744e-07, "loss": 0.5527, "step": 6464 }, { "epoch": 0.596470995271595, "grad_norm": 2.429687056232111, "learning_rate": 4.677253224443498e-07, "loss": 0.6304, "step": 6465 }, { "epoch": 0.596470995271595, "eval_GEN Loss": 0.4419209361076355, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3695679008960724, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8763220906257629, "eval_runtime": 56.5231, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6465 }, { "epoch": 0.596563256833122, "grad_norm": 2.0022583370501206, "learning_rate": 4.6754323756750096e-07, "loss": 0.6195, "step": 6466 }, { "epoch": 0.5966555183946488, "grad_norm": 3.2915706714978685, "learning_rate": 4.6736116695963186e-07, "loss": 0.7045, "step": 6467 }, { "epoch": 0.5967477799561758, "grad_norm": 1.8741000764226092, "learning_rate": 4.67179110637242e-07, "loss": 0.6409, "step": 6468 }, { "epoch": 0.5968400415177026, "grad_norm": 2.1588251093322173, "learning_rate": 4.669970686168292e-07, "loss": 0.6191, "step": 6469 }, { "epoch": 0.5969323030792296, "grad_norm": 2.1607988855965097, "learning_rate": 4.668150409148911e-07, "loss": 0.7928, "step": 6470 }, { "epoch": 0.5969323030792296, "eval_GEN Loss": 0.44284215569496155, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.373485803604126, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8795673251152039, "eval_runtime": 56.2507, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6470 }, { "epoch": 0.5970245646407566, "grad_norm": 1.9629726741339855, "learning_rate": 4.666330275479229e-07, "loss": 0.8013, "step": 6471 }, { "epoch": 0.5971168262022835, "grad_norm": 2.4673628047856506, "learning_rate": 4.6645102853241904e-07, "loss": 0.7449, "step": 6472 }, { "epoch": 0.5972090877638104, "grad_norm": 1.755627251074481, "learning_rate": 4.6626904388487227e-07, "loss": 0.5996, "step": 6473 }, { "epoch": 0.5973013493253373, "grad_norm": 2.4711435828071506, "learning_rate": 4.6608707362177484e-07, "loss": 0.9529, "step": 6474 }, { "epoch": 0.5973936108868643, "grad_norm": 1.6522424162494653, "learning_rate": 4.6590511775961697e-07, "loss": 0.6095, "step": 6475 }, { "epoch": 0.5973936108868643, "eval_GEN Loss": 0.4425080120563507, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3732866644859314, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8754206895828247, "eval_runtime": 56.3661, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 6475 }, { "epoch": 0.5974858724483912, "grad_norm": 3.1677358809202363, "learning_rate": 4.657231763148877e-07, "loss": 0.7602, "step": 6476 }, { "epoch": 0.5975781340099181, "grad_norm": 1.3615558030139567, "learning_rate": 4.6554124930407477e-07, "loss": 0.5189, "step": 6477 }, { "epoch": 0.5976703955714451, "grad_norm": 1.871186074358157, "learning_rate": 4.6535933674366497e-07, "loss": 0.6052, "step": 6478 }, { "epoch": 0.5977626571329719, "grad_norm": 2.082535441467036, "learning_rate": 4.6517743865014343e-07, "loss": 0.4398, "step": 6479 }, { "epoch": 0.5978549186944989, "grad_norm": 1.3771300233798123, "learning_rate": 4.649955550399936e-07, "loss": 0.5132, "step": 6480 }, { "epoch": 0.5978549186944989, "eval_GEN Loss": 0.4416561424732208, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3741852343082428, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8768329620361328, "eval_runtime": 56.4124, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6480 }, { "epoch": 0.5979471802560258, "grad_norm": 2.273912064866879, "learning_rate": 4.6481368592969867e-07, "loss": 0.5876, "step": 6481 }, { "epoch": 0.5980394418175528, "grad_norm": 2.002363030567707, "learning_rate": 4.6463183133573964e-07, "loss": 0.7087, "step": 6482 }, { "epoch": 0.5981317033790797, "grad_norm": 1.6881975773200744, "learning_rate": 4.6444999127459657e-07, "loss": 0.7956, "step": 6483 }, { "epoch": 0.5982239649406066, "grad_norm": 1.6785134560855524, "learning_rate": 4.642681657627478e-07, "loss": 0.5531, "step": 6484 }, { "epoch": 0.5983162265021336, "grad_norm": 1.968929306626621, "learning_rate": 4.64086354816671e-07, "loss": 0.8097, "step": 6485 }, { "epoch": 0.5983162265021336, "eval_GEN Loss": 0.44243672490119934, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3748646378517151, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8784555196762085, "eval_runtime": 56.5732, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 6485 }, { "epoch": 0.5984084880636604, "grad_norm": 2.1453494611493826, "learning_rate": 4.6390455845284195e-07, "loss": 0.6622, "step": 6486 }, { "epoch": 0.5985007496251874, "grad_norm": 1.984034127058499, "learning_rate": 4.637227766877353e-07, "loss": 0.7646, "step": 6487 }, { "epoch": 0.5985930111867144, "grad_norm": 2.3643895128860852, "learning_rate": 4.6354100953782467e-07, "loss": 0.58, "step": 6488 }, { "epoch": 0.5986852727482412, "grad_norm": 1.696765662962337, "learning_rate": 4.633592570195819e-07, "loss": 0.6053, "step": 6489 }, { "epoch": 0.5987775343097682, "grad_norm": 1.7397194311622015, "learning_rate": 4.631775191494776e-07, "loss": 0.5755, "step": 6490 }, { "epoch": 0.5987775343097682, "eval_GEN Loss": 0.4420222043991089, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3736725151538849, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8753605484962463, "eval_runtime": 56.2511, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6490 }, { "epoch": 0.5988697958712951, "grad_norm": 1.9887006421943416, "learning_rate": 4.62995795943981e-07, "loss": 0.6654, "step": 6491 }, { "epoch": 0.598962057432822, "grad_norm": 1.8173701020465307, "learning_rate": 4.6281408741956067e-07, "loss": 0.8145, "step": 6492 }, { "epoch": 0.599054318994349, "grad_norm": 2.335625844912686, "learning_rate": 4.62632393592683e-07, "loss": 0.819, "step": 6493 }, { "epoch": 0.5991465805558759, "grad_norm": 1.9312172738797744, "learning_rate": 4.6245071447981305e-07, "loss": 0.5581, "step": 6494 }, { "epoch": 0.5992388421174029, "grad_norm": 1.4279390860445451, "learning_rate": 4.622690500974156e-07, "loss": 0.5817, "step": 6495 }, { "epoch": 0.5992388421174029, "eval_GEN Loss": 0.4414561688899994, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3730050325393677, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8756610751152039, "eval_runtime": 56.5267, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6495 }, { "epoch": 0.5993311036789297, "grad_norm": 2.0690147306828948, "learning_rate": 4.6208740046195284e-07, "loss": 0.6807, "step": 6496 }, { "epoch": 0.5994233652404567, "grad_norm": 2.8341700927048166, "learning_rate": 4.619057655898864e-07, "loss": 0.706, "step": 6497 }, { "epoch": 0.5995156268019837, "grad_norm": 2.3530556916924397, "learning_rate": 4.6172414549767604e-07, "loss": 0.9692, "step": 6498 }, { "epoch": 0.5996078883635105, "grad_norm": 2.457410524690488, "learning_rate": 4.6154254020178055e-07, "loss": 0.8322, "step": 6499 }, { "epoch": 0.5997001499250375, "grad_norm": 1.941080886775474, "learning_rate": 4.6136094971865753e-07, "loss": 0.5503, "step": 6500 }, { "epoch": 0.5997001499250375, "eval_GEN Loss": 0.44297531247138977, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3858383595943451, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8776442408561707, "eval_runtime": 56.4036, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6500 }, { "epoch": 0.5997924114865644, "grad_norm": 1.2913268487980396, "learning_rate": 4.611793740647627e-07, "loss": 0.547, "step": 6501 }, { "epoch": 0.5998846730480913, "grad_norm": 1.6350492663273162, "learning_rate": 4.6099781325655095e-07, "loss": 0.6506, "step": 6502 }, { "epoch": 0.5999769346096183, "grad_norm": 1.748101815670312, "learning_rate": 4.608162673104755e-07, "loss": 0.6981, "step": 6503 }, { "epoch": 0.6000691961711452, "grad_norm": 1.9274540299788245, "learning_rate": 4.606347362429884e-07, "loss": 0.6819, "step": 6504 }, { "epoch": 0.6001614577326722, "grad_norm": 1.601001243359987, "learning_rate": 4.604532200705399e-07, "loss": 0.5012, "step": 6505 }, { "epoch": 0.6001614577326722, "eval_GEN Loss": 0.44396957755088806, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.4034756124019623, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8856069445610046, "eval_runtime": 58.2113, "eval_samples_per_second": 1.117, "eval_steps_per_second": 0.086, "step": 6505 }, { "epoch": 0.600253719294199, "grad_norm": 2.7093879915133003, "learning_rate": 4.602717188095799e-07, "loss": 0.8189, "step": 6506 }, { "epoch": 0.600345980855726, "grad_norm": 2.4337643332277072, "learning_rate": 4.60090232476556e-07, "loss": 0.7162, "step": 6507 }, { "epoch": 0.600438242417253, "grad_norm": 2.402187383341364, "learning_rate": 4.599087610879148e-07, "loss": 0.8028, "step": 6508 }, { "epoch": 0.6005305039787798, "grad_norm": 1.760520386312224, "learning_rate": 4.5972730466010126e-07, "loss": 0.5898, "step": 6509 }, { "epoch": 0.6006227655403068, "grad_norm": 2.344522641113234, "learning_rate": 4.595458632095598e-07, "loss": 0.723, "step": 6510 }, { "epoch": 0.6006227655403068, "eval_GEN Loss": 0.4437510669231415, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.4104132354259491, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8838942050933838, "eval_runtime": 56.1344, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 6510 }, { "epoch": 0.6007150271018337, "grad_norm": 1.481143727190678, "learning_rate": 4.5936443675273267e-07, "loss": 0.715, "step": 6511 }, { "epoch": 0.6008072886633606, "grad_norm": 1.6565688487062826, "learning_rate": 4.5918302530606077e-07, "loss": 0.6079, "step": 6512 }, { "epoch": 0.6008995502248875, "grad_norm": 1.5295336665750248, "learning_rate": 4.590016288859843e-07, "loss": 0.5176, "step": 6513 }, { "epoch": 0.6009918117864145, "grad_norm": 2.021107463672094, "learning_rate": 4.588202475089415e-07, "loss": 0.5844, "step": 6514 }, { "epoch": 0.6010840733479414, "grad_norm": 1.8492255574102388, "learning_rate": 4.5863888119136947e-07, "loss": 0.7135, "step": 6515 }, { "epoch": 0.6010840733479414, "eval_GEN Loss": 0.4439164102077484, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.41919270157814026, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8856370449066162, "eval_runtime": 56.1582, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6515 }, { "epoch": 0.6011763349094683, "grad_norm": 1.7915320340862368, "learning_rate": 4.5845752994970364e-07, "loss": 0.7086, "step": 6516 }, { "epoch": 0.6012685964709953, "grad_norm": 2.0396685292554197, "learning_rate": 4.582761938003788e-07, "loss": 0.6939, "step": 6517 }, { "epoch": 0.6013608580325221, "grad_norm": 2.0008997801927806, "learning_rate": 4.580948727598277e-07, "loss": 0.6053, "step": 6518 }, { "epoch": 0.6014531195940491, "grad_norm": 1.8580444426487772, "learning_rate": 4.5791356684448176e-07, "loss": 0.66, "step": 6519 }, { "epoch": 0.6015453811555761, "grad_norm": 1.9547018994508802, "learning_rate": 4.5773227607077157e-07, "loss": 0.7546, "step": 6520 }, { "epoch": 0.6015453811555761, "eval_GEN Loss": 0.4438962936401367, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.41245993971824646, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8835036158561707, "eval_runtime": 56.132, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 6520 }, { "epoch": 0.601637642717103, "grad_norm": 1.9622798486170103, "learning_rate": 4.575510004551258e-07, "loss": 0.7161, "step": 6521 }, { "epoch": 0.6017299042786299, "grad_norm": 2.1819427328248464, "learning_rate": 4.573697400139719e-07, "loss": 0.644, "step": 6522 }, { "epoch": 0.6018221658401568, "grad_norm": 2.2643809840945264, "learning_rate": 4.57188494763736e-07, "loss": 0.7409, "step": 6523 }, { "epoch": 0.6019144274016838, "grad_norm": 1.6920723690406057, "learning_rate": 4.570072647208429e-07, "loss": 0.6174, "step": 6524 }, { "epoch": 0.6020066889632107, "grad_norm": 2.1001823656451286, "learning_rate": 4.5682604990171587e-07, "loss": 0.5417, "step": 6525 }, { "epoch": 0.6020066889632107, "eval_GEN Loss": 0.4423701763153076, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3939453065395355, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8782151341438293, "eval_runtime": 56.2877, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6525 }, { "epoch": 0.6020989505247376, "grad_norm": 1.8436910082880869, "learning_rate": 4.5664485032277674e-07, "loss": 0.6311, "step": 6526 }, { "epoch": 0.6021912120862646, "grad_norm": 2.175159938658578, "learning_rate": 4.564636660004465e-07, "loss": 0.4689, "step": 6527 }, { "epoch": 0.6022834736477914, "grad_norm": 2.296025607711605, "learning_rate": 4.562824969511441e-07, "loss": 0.6603, "step": 6528 }, { "epoch": 0.6023757352093184, "grad_norm": 2.048968097930958, "learning_rate": 4.5610134319128737e-07, "loss": 0.8147, "step": 6529 }, { "epoch": 0.6024679967708454, "grad_norm": 2.9965042072009185, "learning_rate": 4.559202047372926e-07, "loss": 0.8977, "step": 6530 }, { "epoch": 0.6024679967708454, "eval_GEN Loss": 0.4415931701660156, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.37783971428871155, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8833533525466919, "eval_runtime": 56.263, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6530 }, { "epoch": 0.6025602583323723, "grad_norm": 2.200002686849985, "learning_rate": 4.5573908160557517e-07, "loss": 0.7091, "step": 6531 }, { "epoch": 0.6026525198938992, "grad_norm": 2.2022047831185336, "learning_rate": 4.555579738125486e-07, "loss": 0.7227, "step": 6532 }, { "epoch": 0.6027447814554261, "grad_norm": 1.5181070028522146, "learning_rate": 4.553768813746251e-07, "loss": 0.6712, "step": 6533 }, { "epoch": 0.6028370430169531, "grad_norm": 2.0623318137564044, "learning_rate": 4.551958043082157e-07, "loss": 0.7917, "step": 6534 }, { "epoch": 0.60292930457848, "grad_norm": 2.0705941645284165, "learning_rate": 4.550147426297296e-07, "loss": 0.7956, "step": 6535 }, { "epoch": 0.60292930457848, "eval_GEN Loss": 0.44126561284065247, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.37181028723716736, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8792667984962463, "eval_runtime": 56.8891, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 6535 }, { "epoch": 0.6030215661400069, "grad_norm": 1.5139878940913798, "learning_rate": 4.5483369635557524e-07, "loss": 0.4469, "step": 6536 }, { "epoch": 0.6031138277015339, "grad_norm": 1.9437606120058815, "learning_rate": 4.546526655021591e-07, "loss": 0.5368, "step": 6537 }, { "epoch": 0.6032060892630607, "grad_norm": 2.3694303125917933, "learning_rate": 4.5447165008588657e-07, "loss": 0.8032, "step": 6538 }, { "epoch": 0.6032983508245877, "grad_norm": 1.70946552381227, "learning_rate": 4.5429065012316156e-07, "loss": 0.6672, "step": 6539 }, { "epoch": 0.6033906123861147, "grad_norm": 1.841202695880723, "learning_rate": 4.5410966563038657e-07, "loss": 0.6544, "step": 6540 }, { "epoch": 0.6033906123861147, "eval_GEN Loss": 0.44033557176589966, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3672216534614563, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8744291067123413, "eval_runtime": 57.19, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6540 }, { "epoch": 0.6034828739476416, "grad_norm": 1.9400113352575645, "learning_rate": 4.539286966239624e-07, "loss": 0.593, "step": 6541 }, { "epoch": 0.6035751355091685, "grad_norm": 1.8681659256125793, "learning_rate": 4.537477431202893e-07, "loss": 0.6692, "step": 6542 }, { "epoch": 0.6036673970706954, "grad_norm": 2.704831925035844, "learning_rate": 4.5356680513576515e-07, "loss": 0.8993, "step": 6543 }, { "epoch": 0.6037596586322224, "grad_norm": 2.2477151619415574, "learning_rate": 4.533858826867868e-07, "loss": 0.7808, "step": 6544 }, { "epoch": 0.6038519201937492, "grad_norm": 2.959177805064278, "learning_rate": 4.532049757897501e-07, "loss": 0.7325, "step": 6545 }, { "epoch": 0.6038519201937492, "eval_GEN Loss": 0.4416760206222534, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.37004104256629944, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.87890625, "eval_runtime": 57.1626, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6545 }, { "epoch": 0.6039441817552762, "grad_norm": 2.5910224126301737, "learning_rate": 4.5302408446104893e-07, "loss": 0.8424, "step": 6546 }, { "epoch": 0.6040364433168032, "grad_norm": 1.7208226264832645, "learning_rate": 4.528432087170759e-07, "loss": 0.5938, "step": 6547 }, { "epoch": 0.60412870487833, "grad_norm": 1.9608733156963565, "learning_rate": 4.5266234857422224e-07, "loss": 0.594, "step": 6548 }, { "epoch": 0.604220966439857, "grad_norm": 2.2150547936146983, "learning_rate": 4.524815040488778e-07, "loss": 0.6822, "step": 6549 }, { "epoch": 0.6043132280013839, "grad_norm": 1.5798852876767027, "learning_rate": 4.523006751574311e-07, "loss": 0.6463, "step": 6550 }, { "epoch": 0.6043132280013839, "eval_GEN Loss": 0.4414481222629547, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.37594714760780334, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8659855723381042, "eval_runtime": 57.0383, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6550 }, { "epoch": 0.6044054895629108, "grad_norm": 2.0988826195812678, "learning_rate": 4.521198619162688e-07, "loss": 0.6573, "step": 6551 }, { "epoch": 0.6044977511244378, "grad_norm": 1.9364797694324598, "learning_rate": 4.519390643417769e-07, "loss": 0.7433, "step": 6552 }, { "epoch": 0.6045900126859647, "grad_norm": 3.88975652950621, "learning_rate": 4.517582824503395e-07, "loss": 0.7976, "step": 6553 }, { "epoch": 0.6046822742474917, "grad_norm": 1.6231356611902712, "learning_rate": 4.5157751625833913e-07, "loss": 0.6151, "step": 6554 }, { "epoch": 0.6047745358090185, "grad_norm": 1.8108745529105352, "learning_rate": 4.5139676578215705e-07, "loss": 0.7397, "step": 6555 }, { "epoch": 0.6047745358090185, "eval_GEN Loss": 0.4416932165622711, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3846496045589447, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8633413314819336, "eval_runtime": 57.1345, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6555 }, { "epoch": 0.6048667973705455, "grad_norm": 1.7512219382740548, "learning_rate": 4.512160310381735e-07, "loss": 0.5923, "step": 6556 }, { "epoch": 0.6049590589320725, "grad_norm": 2.3853148574907292, "learning_rate": 4.510353120427668e-07, "loss": 0.6022, "step": 6557 }, { "epoch": 0.6050513204935993, "grad_norm": 2.078317609944487, "learning_rate": 4.508546088123138e-07, "loss": 0.7516, "step": 6558 }, { "epoch": 0.6051435820551263, "grad_norm": 1.7923903992779129, "learning_rate": 4.5067392136319034e-07, "loss": 0.5541, "step": 6559 }, { "epoch": 0.6052358436166532, "grad_norm": 2.6690224339115427, "learning_rate": 4.504932497117706e-07, "loss": 0.8548, "step": 6560 }, { "epoch": 0.6052358436166532, "eval_GEN Loss": 0.4419732391834259, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38830965757369995, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8607872724533081, "eval_runtime": 57.2792, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6560 }, { "epoch": 0.6053281051781801, "grad_norm": 2.34149427952874, "learning_rate": 4.5031259387442715e-07, "loss": 0.631, "step": 6561 }, { "epoch": 0.6054203667397071, "grad_norm": 1.8551245658934126, "learning_rate": 4.5013195386753126e-07, "loss": 0.6751, "step": 6562 }, { "epoch": 0.605512628301234, "grad_norm": 2.038660108230616, "learning_rate": 4.499513297074531e-07, "loss": 0.649, "step": 6563 }, { "epoch": 0.605604889862761, "grad_norm": 3.3673721183977277, "learning_rate": 4.4977072141056106e-07, "loss": 0.6439, "step": 6564 }, { "epoch": 0.6056971514242878, "grad_norm": 1.5072575322076207, "learning_rate": 4.495901289932221e-07, "loss": 0.6034, "step": 6565 }, { "epoch": 0.6056971514242878, "eval_GEN Loss": 0.44144243001937866, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38185223937034607, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8576021790504456, "eval_runtime": 55.9982, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 6565 }, { "epoch": 0.6057894129858148, "grad_norm": 2.4624546628004453, "learning_rate": 4.494095524718014e-07, "loss": 0.9368, "step": 6566 }, { "epoch": 0.6058816745473418, "grad_norm": 2.0637519545631107, "learning_rate": 4.4922899186266367e-07, "loss": 0.7606, "step": 6567 }, { "epoch": 0.6059739361088686, "grad_norm": 1.776278915440757, "learning_rate": 4.490484471821714e-07, "loss": 0.7091, "step": 6568 }, { "epoch": 0.6060661976703956, "grad_norm": 1.3875259349017763, "learning_rate": 4.488679184466857e-07, "loss": 0.4801, "step": 6569 }, { "epoch": 0.6061584592319225, "grad_norm": 1.5795538268564753, "learning_rate": 4.4868740567256665e-07, "loss": 0.6576, "step": 6570 }, { "epoch": 0.6061584592319225, "eval_GEN Loss": 0.44262662529945374, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37747591733932495, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8562800288200378, "eval_runtime": 57.034, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6570 }, { "epoch": 0.6062507207934494, "grad_norm": 2.219674808419999, "learning_rate": 4.485069088761722e-07, "loss": 0.806, "step": 6571 }, { "epoch": 0.6063429823549764, "grad_norm": 1.9105327509187766, "learning_rate": 4.483264280738596e-07, "loss": 0.7094, "step": 6572 }, { "epoch": 0.6064352439165033, "grad_norm": 2.0429249689052407, "learning_rate": 4.4814596328198406e-07, "loss": 0.7772, "step": 6573 }, { "epoch": 0.6065275054780302, "grad_norm": 1.8697360285824849, "learning_rate": 4.4796551451689983e-07, "loss": 0.7183, "step": 6574 }, { "epoch": 0.6066197670395571, "grad_norm": 1.848582891760901, "learning_rate": 4.477850817949594e-07, "loss": 0.5964, "step": 6575 }, { "epoch": 0.6066197670395571, "eval_GEN Loss": 0.4414747655391693, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38106411695480347, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8553184866905212, "eval_runtime": 57.0637, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6575 }, { "epoch": 0.6067120286010841, "grad_norm": 2.0884035954541322, "learning_rate": 4.476046651325135e-07, "loss": 0.6683, "step": 6576 }, { "epoch": 0.606804290162611, "grad_norm": 1.8230945980029107, "learning_rate": 4.474242645459123e-07, "loss": 0.6061, "step": 6577 }, { "epoch": 0.6068965517241379, "grad_norm": 1.9155468290983484, "learning_rate": 4.4724388005150375e-07, "loss": 0.6765, "step": 6578 }, { "epoch": 0.6069888132856649, "grad_norm": 2.6370836169057204, "learning_rate": 4.470635116656346e-07, "loss": 0.7865, "step": 6579 }, { "epoch": 0.6070810748471918, "grad_norm": 1.8201531996521823, "learning_rate": 4.468831594046498e-07, "loss": 0.6177, "step": 6580 }, { "epoch": 0.6070810748471918, "eval_GEN Loss": 0.4427815079689026, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3773242235183716, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8566105961799622, "eval_runtime": 57.4052, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 6580 }, { "epoch": 0.6071733364087187, "grad_norm": 1.6424872678956162, "learning_rate": 4.467028232848938e-07, "loss": 0.7419, "step": 6581 }, { "epoch": 0.6072655979702456, "grad_norm": 2.012523171001019, "learning_rate": 4.465225033227085e-07, "loss": 0.5044, "step": 6582 }, { "epoch": 0.6073578595317726, "grad_norm": 3.22714240680025, "learning_rate": 4.4634219953443485e-07, "loss": 0.8188, "step": 6583 }, { "epoch": 0.6074501210932995, "grad_norm": 2.224999611288978, "learning_rate": 4.461619119364123e-07, "loss": 0.6306, "step": 6584 }, { "epoch": 0.6075423826548264, "grad_norm": 1.8164462892762898, "learning_rate": 4.4598164054497893e-07, "loss": 0.6723, "step": 6585 }, { "epoch": 0.6075423826548264, "eval_GEN Loss": 0.44281795620918274, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3813951909542084, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8591646552085876, "eval_runtime": 57.2694, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6585 }, { "epoch": 0.6076346442163534, "grad_norm": 2.1394607725019483, "learning_rate": 4.4580138537647097e-07, "loss": 0.6781, "step": 6586 }, { "epoch": 0.6077269057778802, "grad_norm": 2.2728210784832084, "learning_rate": 4.456211464472233e-07, "loss": 0.7967, "step": 6587 }, { "epoch": 0.6078191673394072, "grad_norm": 1.9851374230489816, "learning_rate": 4.454409237735699e-07, "loss": 0.6014, "step": 6588 }, { "epoch": 0.6079114289009342, "grad_norm": 1.653126801680408, "learning_rate": 4.452607173718426e-07, "loss": 0.638, "step": 6589 }, { "epoch": 0.608003690462461, "grad_norm": 2.256608557305069, "learning_rate": 4.4508052725837185e-07, "loss": 0.6339, "step": 6590 }, { "epoch": 0.608003690462461, "eval_GEN Loss": 0.44318410754203796, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.376788854598999, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8568209409713745, "eval_runtime": 57.4958, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 6590 }, { "epoch": 0.608095952023988, "grad_norm": 1.338998170049878, "learning_rate": 4.449003534494871e-07, "loss": 0.6244, "step": 6591 }, { "epoch": 0.6081882135855149, "grad_norm": 3.0036318489277, "learning_rate": 4.447201959615159e-07, "loss": 0.7374, "step": 6592 }, { "epoch": 0.6082804751470419, "grad_norm": 1.960574273312072, "learning_rate": 4.445400548107842e-07, "loss": 0.5774, "step": 6593 }, { "epoch": 0.6083727367085688, "grad_norm": 2.809134037278999, "learning_rate": 4.443599300136167e-07, "loss": 0.6388, "step": 6594 }, { "epoch": 0.6084649982700957, "grad_norm": 2.8148494531532027, "learning_rate": 4.4417982158633673e-07, "loss": 0.8485, "step": 6595 }, { "epoch": 0.6084649982700957, "eval_GEN Loss": 0.4432031512260437, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.38040289282798767, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8595853447914124, "eval_runtime": 57.0973, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6595 }, { "epoch": 0.6085572598316227, "grad_norm": 1.9157269010500657, "learning_rate": 4.439997295452661e-07, "loss": 0.5926, "step": 6596 }, { "epoch": 0.6086495213931495, "grad_norm": 1.0942978148423934, "learning_rate": 4.438196539067248e-07, "loss": 0.5533, "step": 6597 }, { "epoch": 0.6087417829546765, "grad_norm": 2.50465879783922, "learning_rate": 4.436395946870313e-07, "loss": 0.8038, "step": 6598 }, { "epoch": 0.6088340445162035, "grad_norm": 1.7911323129839756, "learning_rate": 4.4345955190250353e-07, "loss": 0.7633, "step": 6599 }, { "epoch": 0.6089263060777304, "grad_norm": 1.8898196419759243, "learning_rate": 4.432795255694569e-07, "loss": 0.667, "step": 6600 }, { "epoch": 0.6089263060777304, "eval_GEN Loss": 0.44424280524253845, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3880135416984558, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8607872724533081, "eval_runtime": 57.2526, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6600 }, { "epoch": 0.6090185676392573, "grad_norm": 2.17285889145079, "learning_rate": 4.430995157042055e-07, "loss": 0.6225, "step": 6601 }, { "epoch": 0.6091108292007842, "grad_norm": 2.133453194456059, "learning_rate": 4.4291952232306245e-07, "loss": 0.6873, "step": 6602 }, { "epoch": 0.6092030907623112, "grad_norm": 2.5885911234216947, "learning_rate": 4.4273954544233897e-07, "loss": 0.6808, "step": 6603 }, { "epoch": 0.6092953523238381, "grad_norm": 1.6970926968659892, "learning_rate": 4.425595850783447e-07, "loss": 0.5509, "step": 6604 }, { "epoch": 0.609387613885365, "grad_norm": 1.9007477399997459, "learning_rate": 4.42379641247388e-07, "loss": 0.5999, "step": 6605 }, { "epoch": 0.609387613885365, "eval_GEN Loss": 0.44344159960746765, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.38816967606544495, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8600961565971375, "eval_runtime": 57.2238, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6605 }, { "epoch": 0.609479875446892, "grad_norm": 1.4605714879503162, "learning_rate": 4.4219971396577563e-07, "loss": 0.6447, "step": 6606 }, { "epoch": 0.6095721370084188, "grad_norm": 1.51268566418591, "learning_rate": 4.4201980324981284e-07, "loss": 0.7057, "step": 6607 }, { "epoch": 0.6096643985699458, "grad_norm": 2.0235568709394456, "learning_rate": 4.4183990911580346e-07, "loss": 0.7487, "step": 6608 }, { "epoch": 0.6097566601314727, "grad_norm": 1.6661958455322965, "learning_rate": 4.4166003158004997e-07, "loss": 0.692, "step": 6609 }, { "epoch": 0.6098489216929996, "grad_norm": 1.9708852039089118, "learning_rate": 4.414801706588531e-07, "loss": 0.6166, "step": 6610 }, { "epoch": 0.6098489216929996, "eval_GEN Loss": 0.44294121861457825, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.38012024760246277, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8567908406257629, "eval_runtime": 57.0242, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6610 }, { "epoch": 0.6099411832545266, "grad_norm": 2.40444698819471, "learning_rate": 4.413003263685119e-07, "loss": 0.5889, "step": 6611 }, { "epoch": 0.6100334448160535, "grad_norm": 1.7439037678783427, "learning_rate": 4.4112049872532403e-07, "loss": 0.5943, "step": 6612 }, { "epoch": 0.6101257063775805, "grad_norm": 2.68040125678665, "learning_rate": 4.409406877455863e-07, "loss": 0.7495, "step": 6613 }, { "epoch": 0.6102179679391073, "grad_norm": 1.6592276829937045, "learning_rate": 4.4076089344559316e-07, "loss": 0.7033, "step": 6614 }, { "epoch": 0.6103102295006343, "grad_norm": 2.4852511356185487, "learning_rate": 4.405811158416375e-07, "loss": 0.9237, "step": 6615 }, { "epoch": 0.6103102295006343, "eval_GEN Loss": 0.44384315609931946, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3699069023132324, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8537259697914124, "eval_runtime": 57.1941, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6615 }, { "epoch": 0.6104024910621613, "grad_norm": 2.168760189173499, "learning_rate": 4.4040135495001176e-07, "loss": 0.6299, "step": 6616 }, { "epoch": 0.6104947526236881, "grad_norm": 2.087596887932457, "learning_rate": 4.402216107870058e-07, "loss": 0.8397, "step": 6617 }, { "epoch": 0.6105870141852151, "grad_norm": 1.953248946411384, "learning_rate": 4.400418833689082e-07, "loss": 0.6554, "step": 6618 }, { "epoch": 0.610679275746742, "grad_norm": 2.3656632493487266, "learning_rate": 4.398621727120063e-07, "loss": 0.7433, "step": 6619 }, { "epoch": 0.6107715373082689, "grad_norm": 1.511208247166357, "learning_rate": 4.3968247883258576e-07, "loss": 0.4735, "step": 6620 }, { "epoch": 0.6107715373082689, "eval_GEN Loss": 0.44411700963974, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36628812551498413, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8517728447914124, "eval_runtime": 57.4043, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 6620 }, { "epoch": 0.6108637988697959, "grad_norm": 1.2854041117896544, "learning_rate": 4.3950280174693063e-07, "loss": 0.4606, "step": 6621 }, { "epoch": 0.6109560604313228, "grad_norm": 1.6021064836174637, "learning_rate": 4.393231414713234e-07, "loss": 0.6075, "step": 6622 }, { "epoch": 0.6110483219928498, "grad_norm": 1.9763768550560126, "learning_rate": 4.391434980220456e-07, "loss": 0.6786, "step": 6623 }, { "epoch": 0.6111405835543766, "grad_norm": 1.7830028021558906, "learning_rate": 4.3896387141537656e-07, "loss": 0.7106, "step": 6624 }, { "epoch": 0.6112328451159036, "grad_norm": 2.0850422356808807, "learning_rate": 4.3878426166759427e-07, "loss": 0.8277, "step": 6625 }, { "epoch": 0.6112328451159036, "eval_GEN Loss": 0.4440293312072754, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36204802989959717, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8515925407409668, "eval_runtime": 57.1165, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6625 }, { "epoch": 0.6113251066774306, "grad_norm": 2.658986705229409, "learning_rate": 4.3860466879497506e-07, "loss": 0.7852, "step": 6626 }, { "epoch": 0.6114173682389574, "grad_norm": 2.6282207370960142, "learning_rate": 4.3842509281379445e-07, "loss": 0.858, "step": 6627 }, { "epoch": 0.6115096298004844, "grad_norm": 3.4052608596188274, "learning_rate": 4.382455337403256e-07, "loss": 0.4998, "step": 6628 }, { "epoch": 0.6116018913620113, "grad_norm": 1.8020467996861664, "learning_rate": 4.3806599159084044e-07, "loss": 0.6826, "step": 6629 }, { "epoch": 0.6116941529235382, "grad_norm": 2.8203603765030856, "learning_rate": 4.3788646638160915e-07, "loss": 0.6738, "step": 6630 }, { "epoch": 0.6116941529235382, "eval_GEN Loss": 0.44341230392456055, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3622773587703705, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8452824354171753, "eval_runtime": 56.1042, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 6630 }, { "epoch": 0.6117864144850652, "grad_norm": 1.5041085157763179, "learning_rate": 4.37706958128901e-07, "loss": 0.4823, "step": 6631 }, { "epoch": 0.6118786760465921, "grad_norm": 2.0879148825873717, "learning_rate": 4.37527466848983e-07, "loss": 0.7966, "step": 6632 }, { "epoch": 0.611970937608119, "grad_norm": 2.395677337396138, "learning_rate": 4.3734799255812087e-07, "loss": 0.6838, "step": 6633 }, { "epoch": 0.6120631991696459, "grad_norm": 2.338858128751212, "learning_rate": 4.3716853527257935e-07, "loss": 0.6285, "step": 6634 }, { "epoch": 0.6121554607311729, "grad_norm": 2.936031699659857, "learning_rate": 4.3698909500862073e-07, "loss": 0.8109, "step": 6635 }, { "epoch": 0.6121554607311729, "eval_GEN Loss": 0.4432564973831177, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3628139793872833, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8452523946762085, "eval_runtime": 56.2596, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6635 }, { "epoch": 0.6122477222926999, "grad_norm": 1.9229955341531624, "learning_rate": 4.3680967178250627e-07, "loss": 0.6914, "step": 6636 }, { "epoch": 0.6123399838542267, "grad_norm": 1.6890577748945823, "learning_rate": 4.3663026561049526e-07, "loss": 0.6804, "step": 6637 }, { "epoch": 0.6124322454157537, "grad_norm": 2.815730473133586, "learning_rate": 4.364508765088464e-07, "loss": 0.7663, "step": 6638 }, { "epoch": 0.6125245069772806, "grad_norm": 1.8921068040103435, "learning_rate": 4.362715044938159e-07, "loss": 0.7294, "step": 6639 }, { "epoch": 0.6126167685388075, "grad_norm": 2.763394989065926, "learning_rate": 4.360921495816586e-07, "loss": 0.7409, "step": 6640 }, { "epoch": 0.6126167685388075, "eval_GEN Loss": 0.4428410232067108, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.35922956466674805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8427283763885498, "eval_runtime": 56.2146, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6640 }, { "epoch": 0.6127090301003344, "grad_norm": 2.4945492454356533, "learning_rate": 4.3591281178862814e-07, "loss": 0.6038, "step": 6641 }, { "epoch": 0.6128012916618614, "grad_norm": 2.264367723588917, "learning_rate": 4.357334911309763e-07, "loss": 0.7602, "step": 6642 }, { "epoch": 0.6128935532233883, "grad_norm": 1.755759567655524, "learning_rate": 4.3555418762495335e-07, "loss": 0.7172, "step": 6643 }, { "epoch": 0.6129858147849152, "grad_norm": 1.8201612559373033, "learning_rate": 4.3537490128680795e-07, "loss": 0.5072, "step": 6644 }, { "epoch": 0.6130780763464422, "grad_norm": 2.0513001402730087, "learning_rate": 4.3519563213278773e-07, "loss": 0.7265, "step": 6645 }, { "epoch": 0.6130780763464422, "eval_GEN Loss": 0.44287657737731934, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3593670725822449, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8437199592590332, "eval_runtime": 56.3739, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 6645 }, { "epoch": 0.613170337907969, "grad_norm": 2.5698694341683685, "learning_rate": 4.350163801791381e-07, "loss": 0.7831, "step": 6646 }, { "epoch": 0.613262599469496, "grad_norm": 1.489901786974972, "learning_rate": 4.3483714544210277e-07, "loss": 0.6247, "step": 6647 }, { "epoch": 0.613354861031023, "grad_norm": 2.9709528977346786, "learning_rate": 4.34657927937925e-07, "loss": 0.6825, "step": 6648 }, { "epoch": 0.6134471225925499, "grad_norm": 1.8911080970372092, "learning_rate": 4.3447872768284535e-07, "loss": 0.7748, "step": 6649 }, { "epoch": 0.6135393841540768, "grad_norm": 2.1963535192333077, "learning_rate": 4.3429954469310324e-07, "loss": 0.596, "step": 6650 }, { "epoch": 0.6135393841540768, "eval_GEN Loss": 0.4419402778148651, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3601812720298767, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8408052921295166, "eval_runtime": 56.1857, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6650 }, { "epoch": 0.6136316457156037, "grad_norm": 1.7957285568715113, "learning_rate": 4.341203789849364e-07, "loss": 0.6884, "step": 6651 }, { "epoch": 0.6137239072771307, "grad_norm": 1.7703175363786465, "learning_rate": 4.3394123057458146e-07, "loss": 0.6375, "step": 6652 }, { "epoch": 0.6138161688386576, "grad_norm": 1.6626862207824358, "learning_rate": 4.337620994782729e-07, "loss": 0.6258, "step": 6653 }, { "epoch": 0.6139084304001845, "grad_norm": 2.6212401541759154, "learning_rate": 4.335829857122439e-07, "loss": 0.6417, "step": 6654 }, { "epoch": 0.6140006919617115, "grad_norm": 1.6972168072217768, "learning_rate": 4.33403889292726e-07, "loss": 0.6377, "step": 6655 }, { "epoch": 0.6140006919617115, "eval_GEN Loss": 0.4413183927536011, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3600755035877228, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8416767120361328, "eval_runtime": 56.1086, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 6655 }, { "epoch": 0.6140929535232383, "grad_norm": 1.657688873574811, "learning_rate": 4.332248102359494e-07, "loss": 0.6591, "step": 6656 }, { "epoch": 0.6141852150847653, "grad_norm": 4.094519967127464, "learning_rate": 4.3304574855814226e-07, "loss": 0.8401, "step": 6657 }, { "epoch": 0.6142774766462923, "grad_norm": 2.0435619403968044, "learning_rate": 4.3286670427553123e-07, "loss": 0.6364, "step": 6658 }, { "epoch": 0.6143697382078191, "grad_norm": 2.218499010369319, "learning_rate": 4.3268767740434217e-07, "loss": 0.7242, "step": 6659 }, { "epoch": 0.6144619997693461, "grad_norm": 2.3624757469782676, "learning_rate": 4.3250866796079856e-07, "loss": 0.6232, "step": 6660 }, { "epoch": 0.6144619997693461, "eval_GEN Loss": 0.442717581987381, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3651427626609802, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8405048251152039, "eval_runtime": 56.2839, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 6660 }, { "epoch": 0.614554261330873, "grad_norm": 1.7709009684517358, "learning_rate": 4.323296759611223e-07, "loss": 0.6009, "step": 6661 }, { "epoch": 0.6146465228924, "grad_norm": 1.4591033954581798, "learning_rate": 4.3215070142153396e-07, "loss": 0.4613, "step": 6662 }, { "epoch": 0.6147387844539269, "grad_norm": 1.6171876820395783, "learning_rate": 4.319717443582528e-07, "loss": 0.5718, "step": 6663 }, { "epoch": 0.6148310460154538, "grad_norm": 1.8372055353219328, "learning_rate": 4.31792804787496e-07, "loss": 0.5748, "step": 6664 }, { "epoch": 0.6149233075769808, "grad_norm": 1.5924167417569384, "learning_rate": 4.316138827254792e-07, "loss": 0.689, "step": 6665 }, { "epoch": 0.6149233075769808, "eval_GEN Loss": 0.4415847063064575, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.3630744516849518, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8364783525466919, "eval_runtime": 56.1456, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 6665 }, { "epoch": 0.6150155691385076, "grad_norm": 2.3443286781293504, "learning_rate": 4.3143497818841687e-07, "loss": 0.635, "step": 6666 }, { "epoch": 0.6151078307000346, "grad_norm": 1.666222568732319, "learning_rate": 4.312560911925215e-07, "loss": 0.4942, "step": 6667 }, { "epoch": 0.6152000922615616, "grad_norm": 1.9284253997511807, "learning_rate": 4.3107722175400416e-07, "loss": 0.6823, "step": 6668 }, { "epoch": 0.6152923538230884, "grad_norm": 2.41936093216755, "learning_rate": 4.308983698890739e-07, "loss": 0.8543, "step": 6669 }, { "epoch": 0.6153846153846154, "grad_norm": 3.3152943975349274, "learning_rate": 4.3071953561393916e-07, "loss": 0.7034, "step": 6670 }, { "epoch": 0.6153846153846154, "eval_GEN Loss": 0.44156384468078613, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3557501435279846, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8344050645828247, "eval_runtime": 56.156, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6670 }, { "epoch": 0.6154768769461423, "grad_norm": 3.0757632048174237, "learning_rate": 4.305407189448059e-07, "loss": 0.9183, "step": 6671 }, { "epoch": 0.6155691385076693, "grad_norm": 2.531502166995524, "learning_rate": 4.3036191989787856e-07, "loss": 0.7109, "step": 6672 }, { "epoch": 0.6156614000691961, "grad_norm": 3.1527376468488972, "learning_rate": 4.3018313848936053e-07, "loss": 0.9904, "step": 6673 }, { "epoch": 0.6157536616307231, "grad_norm": 1.8804997380925919, "learning_rate": 4.300043747354532e-07, "loss": 0.5235, "step": 6674 }, { "epoch": 0.6158459231922501, "grad_norm": 2.5151010852232094, "learning_rate": 4.298256286523564e-07, "loss": 0.7992, "step": 6675 }, { "epoch": 0.6158459231922501, "eval_GEN Loss": 0.44179463386535645, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.35912981629371643, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8286958932876587, "eval_runtime": 56.2146, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6675 }, { "epoch": 0.6159381847537769, "grad_norm": 1.6634482887085855, "learning_rate": 4.2964690025626825e-07, "loss": 0.7183, "step": 6676 }, { "epoch": 0.6160304463153039, "grad_norm": 2.2281833955465244, "learning_rate": 4.2946818956338553e-07, "loss": 0.6193, "step": 6677 }, { "epoch": 0.6161227078768308, "grad_norm": 1.646940497573126, "learning_rate": 4.292894965899033e-07, "loss": 0.7534, "step": 6678 }, { "epoch": 0.6162149694383577, "grad_norm": 2.127712851211642, "learning_rate": 4.291108213520147e-07, "loss": 0.5716, "step": 6679 }, { "epoch": 0.6163072309998847, "grad_norm": 2.2301035464020127, "learning_rate": 4.289321638659119e-07, "loss": 0.7959, "step": 6680 }, { "epoch": 0.6163072309998847, "eval_GEN Loss": 0.44211873412132263, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8819875776397516, "eval_PRM F1 AUC": 0.7755369303300157, "eval_PRM F1 Neg": 0.6274509803921569, "eval_PRM Loss": 0.355842649936676, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.9102564102564102, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.826442301273346, "eval_runtime": 56.1557, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6680 }, { "epoch": 0.6163994925614116, "grad_norm": 2.3065132605721557, "learning_rate": 4.2875352414778517e-07, "loss": 0.7409, "step": 6681 }, { "epoch": 0.6164917541229386, "grad_norm": 3.1632163250276926, "learning_rate": 4.28574902213823e-07, "loss": 0.7071, "step": 6682 }, { "epoch": 0.6165840156844654, "grad_norm": 2.3250807210084554, "learning_rate": 4.283962980802121e-07, "loss": 0.6783, "step": 6683 }, { "epoch": 0.6166762772459924, "grad_norm": 1.4784893466326363, "learning_rate": 4.282177117631383e-07, "loss": 0.6287, "step": 6684 }, { "epoch": 0.6167685388075194, "grad_norm": 1.8619921950352265, "learning_rate": 4.2803914327878525e-07, "loss": 0.686, "step": 6685 }, { "epoch": 0.6167685388075194, "eval_GEN Loss": 0.4409331977367401, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3457377552986145, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8216646909713745, "eval_runtime": 56.2447, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6685 }, { "epoch": 0.6168608003690462, "grad_norm": 6.080746855278037, "learning_rate": 4.27860592643335e-07, "loss": 0.7062, "step": 6686 }, { "epoch": 0.6169530619305732, "grad_norm": 2.5510465481767666, "learning_rate": 4.27682059872968e-07, "loss": 0.7329, "step": 6687 }, { "epoch": 0.6170453234921001, "grad_norm": 1.8352186015772478, "learning_rate": 4.275035449838635e-07, "loss": 0.6222, "step": 6688 }, { "epoch": 0.617137585053627, "grad_norm": 1.6715946476363195, "learning_rate": 4.2732504799219865e-07, "loss": 0.4934, "step": 6689 }, { "epoch": 0.617229846615154, "grad_norm": 2.137822630299853, "learning_rate": 4.2714656891414893e-07, "loss": 0.5956, "step": 6690 }, { "epoch": 0.617229846615154, "eval_GEN Loss": 0.4415217339992523, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3464350402355194, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8242487907409668, "eval_runtime": 57.0721, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6690 }, { "epoch": 0.6173221081766809, "grad_norm": 2.651565817355499, "learning_rate": 4.2696810776588876e-07, "loss": 0.6977, "step": 6691 }, { "epoch": 0.6174143697382078, "grad_norm": 2.4501914340165873, "learning_rate": 4.2678966456359034e-07, "loss": 0.8138, "step": 6692 }, { "epoch": 0.6175066312997347, "grad_norm": 3.3101721176032726, "learning_rate": 4.266112393234245e-07, "loss": 0.8425, "step": 6693 }, { "epoch": 0.6175988928612617, "grad_norm": 1.7629367523146748, "learning_rate": 4.264328320615602e-07, "loss": 0.616, "step": 6694 }, { "epoch": 0.6176911544227887, "grad_norm": 1.532780412105217, "learning_rate": 4.2625444279416535e-07, "loss": 0.5973, "step": 6695 }, { "epoch": 0.6176911544227887, "eval_GEN Loss": 0.44120967388153076, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3545803129673004, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8247896432876587, "eval_runtime": 56.1084, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 6695 }, { "epoch": 0.6177834159843155, "grad_norm": 1.823549859624137, "learning_rate": 4.260760715374058e-07, "loss": 0.6552, "step": 6696 }, { "epoch": 0.6178756775458425, "grad_norm": 1.5144638186415147, "learning_rate": 4.2589771830744543e-07, "loss": 0.5501, "step": 6697 }, { "epoch": 0.6179679391073694, "grad_norm": 1.8317731558729824, "learning_rate": 4.2571938312044757e-07, "loss": 0.6409, "step": 6698 }, { "epoch": 0.6180602006688963, "grad_norm": 1.8326622824218883, "learning_rate": 4.2554106599257294e-07, "loss": 0.7344, "step": 6699 }, { "epoch": 0.6181524622304233, "grad_norm": 2.4340557003127428, "learning_rate": 4.253627669399807e-07, "loss": 0.7242, "step": 6700 }, { "epoch": 0.6181524622304233, "eval_GEN Loss": 0.44004538655281067, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3608366549015045, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8263822197914124, "eval_runtime": 56.1819, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6700 }, { "epoch": 0.6182447237919502, "grad_norm": 1.571258946110733, "learning_rate": 4.251844859788287e-07, "loss": 0.589, "step": 6701 }, { "epoch": 0.6183369853534771, "grad_norm": 2.923734695183278, "learning_rate": 4.250062231252733e-07, "loss": 0.709, "step": 6702 }, { "epoch": 0.618429246915004, "grad_norm": 2.44325285002879, "learning_rate": 4.2482797839546867e-07, "loss": 0.9552, "step": 6703 }, { "epoch": 0.618521508476531, "grad_norm": 2.394592507028263, "learning_rate": 4.2464975180556743e-07, "loss": 0.7997, "step": 6704 }, { "epoch": 0.6186137700380578, "grad_norm": 2.067693003223893, "learning_rate": 4.2447154337172134e-07, "loss": 0.8093, "step": 6705 }, { "epoch": 0.6186137700380578, "eval_GEN Loss": 0.439814031124115, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3562334179878235, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8260817527770996, "eval_runtime": 56.2294, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6705 }, { "epoch": 0.6187060315995848, "grad_norm": 1.9833543255914499, "learning_rate": 4.242933531100796e-07, "loss": 0.7158, "step": 6706 }, { "epoch": 0.6187982931611118, "grad_norm": 1.7566125378528963, "learning_rate": 4.2411518103679014e-07, "loss": 0.647, "step": 6707 }, { "epoch": 0.6188905547226387, "grad_norm": 2.509612203852972, "learning_rate": 4.239370271679989e-07, "loss": 0.9215, "step": 6708 }, { "epoch": 0.6189828162841656, "grad_norm": 2.710333436003454, "learning_rate": 4.237588915198511e-07, "loss": 0.733, "step": 6709 }, { "epoch": 0.6190750778456925, "grad_norm": 2.9126667477540082, "learning_rate": 4.2358077410848913e-07, "loss": 0.8341, "step": 6710 }, { "epoch": 0.6190750778456925, "eval_GEN Loss": 0.4400528371334076, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3513861894607544, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.83203125, "eval_runtime": 57.4018, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 6710 }, { "epoch": 0.6191673394072195, "grad_norm": 1.738523019094873, "learning_rate": 4.2340267495005445e-07, "loss": 0.6738, "step": 6711 }, { "epoch": 0.6192596009687464, "grad_norm": 2.2649797339287163, "learning_rate": 4.232245940606867e-07, "loss": 0.8906, "step": 6712 }, { "epoch": 0.6193518625302733, "grad_norm": 1.951763278133777, "learning_rate": 4.2304653145652395e-07, "loss": 0.4582, "step": 6713 }, { "epoch": 0.6194441240918003, "grad_norm": 1.447328002131117, "learning_rate": 4.228684871537023e-07, "loss": 0.5685, "step": 6714 }, { "epoch": 0.6195363856533271, "grad_norm": 1.2188162467181263, "learning_rate": 4.2269046116835633e-07, "loss": 0.5489, "step": 6715 }, { "epoch": 0.6195363856533271, "eval_GEN Loss": 0.4398825764656067, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34742462635040283, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8307692408561707, "eval_runtime": 56.1856, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6715 }, { "epoch": 0.6196286472148541, "grad_norm": 1.7668915863000731, "learning_rate": 4.2251245351661947e-07, "loss": 0.5599, "step": 6716 }, { "epoch": 0.6197209087763811, "grad_norm": 1.7910720451454614, "learning_rate": 4.2233446421462273e-07, "loss": 0.6466, "step": 6717 }, { "epoch": 0.619813170337908, "grad_norm": 2.300499405154613, "learning_rate": 4.221564932784959e-07, "loss": 0.6757, "step": 6718 }, { "epoch": 0.6199054318994349, "grad_norm": 1.3595799064857514, "learning_rate": 4.2197854072436666e-07, "loss": 0.5518, "step": 6719 }, { "epoch": 0.6199976934609618, "grad_norm": 3.348639043902415, "learning_rate": 4.2180060656836176e-07, "loss": 0.605, "step": 6720 }, { "epoch": 0.6199976934609618, "eval_GEN Loss": 0.4387657642364502, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34064534306526184, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8353365659713745, "eval_runtime": 57.1993, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6720 }, { "epoch": 0.6200899550224888, "grad_norm": 1.741546378556244, "learning_rate": 4.216226908266059e-07, "loss": 0.4837, "step": 6721 }, { "epoch": 0.6201822165840157, "grad_norm": 1.8143860293530312, "learning_rate": 4.2144479351522173e-07, "loss": 0.6667, "step": 6722 }, { "epoch": 0.6202744781455426, "grad_norm": 1.783156170153062, "learning_rate": 4.2126691465033076e-07, "loss": 0.6171, "step": 6723 }, { "epoch": 0.6203667397070696, "grad_norm": 2.3761140947950805, "learning_rate": 4.210890542480528e-07, "loss": 0.7722, "step": 6724 }, { "epoch": 0.6204590012685964, "grad_norm": 1.5068300951224367, "learning_rate": 4.209112123245057e-07, "loss": 0.7314, "step": 6725 }, { "epoch": 0.6204590012685964, "eval_GEN Loss": 0.4396437108516693, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33593544363975525, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8410456776618958, "eval_runtime": 56.3969, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 6725 }, { "epoch": 0.6205512628301234, "grad_norm": 1.7947619429095194, "learning_rate": 4.207333888958057e-07, "loss": 0.5867, "step": 6726 }, { "epoch": 0.6206435243916504, "grad_norm": 2.182102987604302, "learning_rate": 4.2055558397806753e-07, "loss": 0.662, "step": 6727 }, { "epoch": 0.6207357859531772, "grad_norm": 2.8087114504896094, "learning_rate": 4.203777975874042e-07, "loss": 0.7296, "step": 6728 }, { "epoch": 0.6208280475147042, "grad_norm": 3.5097819526536957, "learning_rate": 4.202000297399267e-07, "loss": 0.8526, "step": 6729 }, { "epoch": 0.6209203090762311, "grad_norm": 2.6446712648710426, "learning_rate": 4.200222804517451e-07, "loss": 0.6088, "step": 6730 }, { "epoch": 0.6209203090762311, "eval_GEN Loss": 0.4400152862071991, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3346721827983856, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.838942289352417, "eval_runtime": 56.4307, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6730 }, { "epoch": 0.621012570637758, "grad_norm": 2.396928742909074, "learning_rate": 4.1984454973896707e-07, "loss": 0.6617, "step": 6731 }, { "epoch": 0.6211048321992849, "grad_norm": 1.3024285334315227, "learning_rate": 4.196668376176989e-07, "loss": 0.4805, "step": 6732 }, { "epoch": 0.6211970937608119, "grad_norm": 1.6746990921675684, "learning_rate": 4.1948914410404484e-07, "loss": 0.5595, "step": 6733 }, { "epoch": 0.6212893553223389, "grad_norm": 1.8411081076379547, "learning_rate": 4.1931146921410827e-07, "loss": 0.5525, "step": 6734 }, { "epoch": 0.6213816168838657, "grad_norm": 2.6961384952403975, "learning_rate": 4.191338129639901e-07, "loss": 0.8404, "step": 6735 }, { "epoch": 0.6213816168838657, "eval_GEN Loss": 0.4395016133785248, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3378206789493561, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8323917984962463, "eval_runtime": 56.3439, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6735 }, { "epoch": 0.6214738784453927, "grad_norm": 4.536313350856954, "learning_rate": 4.1895617536978974e-07, "loss": 0.858, "step": 6736 }, { "epoch": 0.6215661400069196, "grad_norm": 2.130705822620825, "learning_rate": 4.187785564476052e-07, "loss": 0.637, "step": 6737 }, { "epoch": 0.6216584015684465, "grad_norm": 2.2868002150322306, "learning_rate": 4.186009562135325e-07, "loss": 0.7458, "step": 6738 }, { "epoch": 0.6217506631299735, "grad_norm": 1.7431225570431579, "learning_rate": 4.18423374683666e-07, "loss": 0.6552, "step": 6739 }, { "epoch": 0.6218429246915004, "grad_norm": 1.5544747050413052, "learning_rate": 4.182458118740981e-07, "loss": 0.5834, "step": 6740 }, { "epoch": 0.6218429246915004, "eval_GEN Loss": 0.44010594487190247, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35035446286201477, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8280649185180664, "eval_runtime": 56.2354, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6740 }, { "epoch": 0.6219351862530274, "grad_norm": 2.4403217962530714, "learning_rate": 4.180682678009206e-07, "loss": 0.7807, "step": 6741 }, { "epoch": 0.6220274478145542, "grad_norm": 1.8336526249280867, "learning_rate": 4.1789074248022224e-07, "loss": 0.6461, "step": 6742 }, { "epoch": 0.6221197093760812, "grad_norm": 2.0113515057118434, "learning_rate": 4.177132359280906e-07, "loss": 0.7549, "step": 6743 }, { "epoch": 0.6222119709376082, "grad_norm": 3.799909139578203, "learning_rate": 4.175357481606121e-07, "loss": 0.8086, "step": 6744 }, { "epoch": 0.622304232499135, "grad_norm": 1.7087835254974453, "learning_rate": 4.1735827919387057e-07, "loss": 0.5288, "step": 6745 }, { "epoch": 0.622304232499135, "eval_GEN Loss": 0.44124436378479004, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM Loss": 0.3712894022464752, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8314903974533081, "eval_runtime": 55.9803, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 6745 }, { "epoch": 0.622396494060662, "grad_norm": 1.8891941511369197, "learning_rate": 4.171808290439486e-07, "loss": 0.6119, "step": 6746 }, { "epoch": 0.6224887556221889, "grad_norm": 2.80580652176809, "learning_rate": 4.1700339772692693e-07, "loss": 0.7288, "step": 6747 }, { "epoch": 0.6225810171837158, "grad_norm": 2.0431533931129042, "learning_rate": 4.1682598525888493e-07, "loss": 0.7307, "step": 6748 }, { "epoch": 0.6226732787452428, "grad_norm": 2.639344290133345, "learning_rate": 4.1664859165589974e-07, "loss": 0.9605, "step": 6749 }, { "epoch": 0.6227655403067697, "grad_norm": 1.8109408468749595, "learning_rate": 4.164712169340471e-07, "loss": 0.7372, "step": 6750 }, { "epoch": 0.6227655403067697, "eval_GEN Loss": 0.44269901514053345, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.3966447412967682, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8453726172447205, "eval_runtime": 56.026, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 6750 }, { "epoch": 0.6228578018682966, "grad_norm": 2.0121172692918474, "learning_rate": 4.162938611094008e-07, "loss": 0.7011, "step": 6751 }, { "epoch": 0.6229500634298235, "grad_norm": 1.728157996842971, "learning_rate": 4.161165241980336e-07, "loss": 0.6829, "step": 6752 }, { "epoch": 0.6230423249913505, "grad_norm": 1.7214870736834067, "learning_rate": 4.159392062160157e-07, "loss": 0.651, "step": 6753 }, { "epoch": 0.6231345865528775, "grad_norm": 2.5396816767265986, "learning_rate": 4.1576190717941576e-07, "loss": 0.5671, "step": 6754 }, { "epoch": 0.6232268481144043, "grad_norm": 2.162217081627846, "learning_rate": 4.155846271043014e-07, "loss": 0.6655, "step": 6755 }, { "epoch": 0.6232268481144043, "eval_GEN Loss": 0.44300490617752075, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.4011622965335846, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8472957015037537, "eval_runtime": 56.0134, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 6755 }, { "epoch": 0.6233191096759313, "grad_norm": 2.2817516476328206, "learning_rate": 4.154073660067378e-07, "loss": 0.5585, "step": 6756 }, { "epoch": 0.6234113712374582, "grad_norm": 2.3936706748220575, "learning_rate": 4.1523012390278854e-07, "loss": 0.8311, "step": 6757 }, { "epoch": 0.6235036327989851, "grad_norm": 3.3436937303182965, "learning_rate": 4.1505290080851554e-07, "loss": 0.6686, "step": 6758 }, { "epoch": 0.6235958943605121, "grad_norm": 2.717826058709118, "learning_rate": 4.148756967399791e-07, "loss": 0.8317, "step": 6759 }, { "epoch": 0.623688155922039, "grad_norm": 3.1931880284556122, "learning_rate": 4.146985117132379e-07, "loss": 0.6769, "step": 6760 }, { "epoch": 0.623688155922039, "eval_GEN Loss": 0.44279590249061584, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.38605302572250366, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.842067301273346, "eval_runtime": 57.0449, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6760 }, { "epoch": 0.6237804174835659, "grad_norm": 1.342782084431095, "learning_rate": 4.145213457443485e-07, "loss": 0.6601, "step": 6761 }, { "epoch": 0.6238726790450928, "grad_norm": 1.8339207699235405, "learning_rate": 4.143441988493661e-07, "loss": 0.5372, "step": 6762 }, { "epoch": 0.6239649406066198, "grad_norm": 2.2985576176711318, "learning_rate": 4.1416707104434405e-07, "loss": 0.8207, "step": 6763 }, { "epoch": 0.6240572021681466, "grad_norm": 1.8546514594341812, "learning_rate": 4.1398996234533383e-07, "loss": 0.7062, "step": 6764 }, { "epoch": 0.6241494637296736, "grad_norm": 1.9055415529233064, "learning_rate": 4.1381287276838516e-07, "loss": 0.6871, "step": 6765 }, { "epoch": 0.6241494637296736, "eval_GEN Loss": 0.4428922235965729, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3686590790748596, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8353966474533081, "eval_runtime": 56.3397, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6765 }, { "epoch": 0.6242417252912006, "grad_norm": 2.0177461004414057, "learning_rate": 4.1363580232954654e-07, "loss": 0.6591, "step": 6766 }, { "epoch": 0.6243339868527275, "grad_norm": 2.12401290205334, "learning_rate": 4.134587510448643e-07, "loss": 0.7836, "step": 6767 }, { "epoch": 0.6244262484142544, "grad_norm": 2.142805321886337, "learning_rate": 4.132817189303827e-07, "loss": 0.7655, "step": 6768 }, { "epoch": 0.6245185099757813, "grad_norm": 2.15164795302417, "learning_rate": 4.131047060021452e-07, "loss": 0.6988, "step": 6769 }, { "epoch": 0.6246107715373083, "grad_norm": 3.90573332214759, "learning_rate": 4.129277122761928e-07, "loss": 0.8251, "step": 6770 }, { "epoch": 0.6246107715373083, "eval_GEN Loss": 0.44371268153190613, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3654974400997162, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8413161039352417, "eval_runtime": 56.4548, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 6770 }, { "epoch": 0.6247030330988352, "grad_norm": 1.8254680563284242, "learning_rate": 4.1275073776856494e-07, "loss": 0.6018, "step": 6771 }, { "epoch": 0.6247952946603621, "grad_norm": 1.8883380836099093, "learning_rate": 4.125737824952992e-07, "loss": 0.5674, "step": 6772 }, { "epoch": 0.6248875562218891, "grad_norm": 2.02392794869848, "learning_rate": 4.123968464724318e-07, "loss": 0.8847, "step": 6773 }, { "epoch": 0.6249798177834159, "grad_norm": 2.8891753824945057, "learning_rate": 4.122199297159967e-07, "loss": 0.7749, "step": 6774 }, { "epoch": 0.6250720793449429, "grad_norm": 1.927121250119538, "learning_rate": 4.1204303224202655e-07, "loss": 0.5388, "step": 6775 }, { "epoch": 0.6250720793449429, "eval_GEN Loss": 0.4431971311569214, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3675469756126404, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8429387211799622, "eval_runtime": 55.99, "eval_samples_per_second": 1.161, "eval_steps_per_second": 0.089, "step": 6775 }, { "epoch": 0.6251643409064699, "grad_norm": 1.515506861458831, "learning_rate": 4.118661540665518e-07, "loss": 0.5035, "step": 6776 }, { "epoch": 0.6252566024679967, "grad_norm": 1.6921035784656744, "learning_rate": 4.116892952056019e-07, "loss": 0.4932, "step": 6777 }, { "epoch": 0.6253488640295237, "grad_norm": 1.68700677030698, "learning_rate": 4.1151245567520376e-07, "loss": 0.4915, "step": 6778 }, { "epoch": 0.6254411255910506, "grad_norm": 1.3975139330859871, "learning_rate": 4.113356354913827e-07, "loss": 0.5301, "step": 6779 }, { "epoch": 0.6255333871525776, "grad_norm": 2.3775924275490143, "learning_rate": 4.11158834670163e-07, "loss": 0.8046, "step": 6780 }, { "epoch": 0.6255333871525776, "eval_GEN Loss": 0.4425168037414551, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.36813732981681824, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8423377275466919, "eval_runtime": 56.0981, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 6780 }, { "epoch": 0.6256256487141045, "grad_norm": 2.003272032127654, "learning_rate": 4.109820532275662e-07, "loss": 0.8457, "step": 6781 }, { "epoch": 0.6257179102756314, "grad_norm": 1.4943659425018103, "learning_rate": 4.108052911796126e-07, "loss": 0.5902, "step": 6782 }, { "epoch": 0.6258101718371584, "grad_norm": 2.709542578194603, "learning_rate": 4.106285485423205e-07, "loss": 0.6979, "step": 6783 }, { "epoch": 0.6259024333986852, "grad_norm": 2.156954118856963, "learning_rate": 4.1045182533170697e-07, "loss": 0.772, "step": 6784 }, { "epoch": 0.6259946949602122, "grad_norm": 2.8788787155263007, "learning_rate": 4.1027512156378675e-07, "loss": 0.6715, "step": 6785 }, { "epoch": 0.6259946949602122, "eval_GEN Loss": 0.44285258650779724, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.36810004711151123, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8470553159713745, "eval_runtime": 56.3214, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6785 }, { "epoch": 0.6260869565217392, "grad_norm": 2.304829650806243, "learning_rate": 4.100984372545726e-07, "loss": 0.6388, "step": 6786 }, { "epoch": 0.626179218083266, "grad_norm": 1.8313860310827939, "learning_rate": 4.099217724200767e-07, "loss": 0.6613, "step": 6787 }, { "epoch": 0.626271479644793, "grad_norm": 3.16998302506931, "learning_rate": 4.097451270763084e-07, "loss": 0.833, "step": 6788 }, { "epoch": 0.6263637412063199, "grad_norm": 1.8209720478069722, "learning_rate": 4.0956850123927537e-07, "loss": 0.5903, "step": 6789 }, { "epoch": 0.6264560027678469, "grad_norm": 2.131558397773082, "learning_rate": 4.0939189492498357e-07, "loss": 0.63, "step": 6790 }, { "epoch": 0.6264560027678469, "eval_GEN Loss": 0.44296520948410034, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.37811532616615295, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.849879801273346, "eval_runtime": 57.3154, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6790 }, { "epoch": 0.6265482643293738, "grad_norm": 2.0056151576001864, "learning_rate": 4.0921530814943793e-07, "loss": 0.6712, "step": 6791 }, { "epoch": 0.6266405258909007, "grad_norm": 1.8997183366865888, "learning_rate": 4.0903874092864076e-07, "loss": 0.7194, "step": 6792 }, { "epoch": 0.6267327874524277, "grad_norm": 2.203299133026998, "learning_rate": 4.0886219327859256e-07, "loss": 0.6866, "step": 6793 }, { "epoch": 0.6268250490139545, "grad_norm": 2.487315902307103, "learning_rate": 4.086856652152929e-07, "loss": 0.8383, "step": 6794 }, { "epoch": 0.6269173105754815, "grad_norm": 2.3648361861887994, "learning_rate": 4.085091567547385e-07, "loss": 0.8422, "step": 6795 }, { "epoch": 0.6269173105754815, "eval_GEN Loss": 0.4439067542552948, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.39057716727256775, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8559495210647583, "eval_runtime": 56.0631, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 6795 }, { "epoch": 0.6270095721370084, "grad_norm": 2.4525558881341034, "learning_rate": 4.0833266791292527e-07, "loss": 0.5322, "step": 6796 }, { "epoch": 0.6271018336985353, "grad_norm": 1.8642226081954036, "learning_rate": 4.0815619870584663e-07, "loss": 0.4894, "step": 6797 }, { "epoch": 0.6271940952600623, "grad_norm": 1.5586971771310254, "learning_rate": 4.0797974914949456e-07, "loss": 0.5416, "step": 6798 }, { "epoch": 0.6272863568215892, "grad_norm": 2.152781430208435, "learning_rate": 4.0780331925985934e-07, "loss": 0.6378, "step": 6799 }, { "epoch": 0.6273786183831161, "grad_norm": 1.7637128184501707, "learning_rate": 4.076269090529289e-07, "loss": 0.5647, "step": 6800 }, { "epoch": 0.6273786183831161, "eval_GEN Loss": 0.4439007043838501, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.400821715593338, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8638521432876587, "eval_runtime": 57.2663, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6800 }, { "epoch": 0.627470879944643, "grad_norm": 1.711250569556545, "learning_rate": 4.074505185446903e-07, "loss": 0.5649, "step": 6801 }, { "epoch": 0.62756314150617, "grad_norm": 2.1072741449312113, "learning_rate": 4.072741477511283e-07, "loss": 0.6399, "step": 6802 }, { "epoch": 0.627655403067697, "grad_norm": 2.145144058290914, "learning_rate": 4.070977966882256e-07, "loss": 0.7711, "step": 6803 }, { "epoch": 0.6277476646292238, "grad_norm": 2.6583624682407163, "learning_rate": 4.069214653719633e-07, "loss": 0.7061, "step": 6804 }, { "epoch": 0.6278399261907508, "grad_norm": 1.4758472843862538, "learning_rate": 4.0674515381832134e-07, "loss": 0.5643, "step": 6805 }, { "epoch": 0.6278399261907508, "eval_GEN Loss": 0.4436876177787781, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.39445194602012634, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.860546886920929, "eval_runtime": 56.3134, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6805 }, { "epoch": 0.6279321877522777, "grad_norm": 1.8068288238821577, "learning_rate": 4.0656886204327716e-07, "loss": 0.5966, "step": 6806 }, { "epoch": 0.6280244493138046, "grad_norm": 1.552371602958913, "learning_rate": 4.0639259006280643e-07, "loss": 0.5739, "step": 6807 }, { "epoch": 0.6281167108753316, "grad_norm": 1.9587765132452062, "learning_rate": 4.0621633789288315e-07, "loss": 0.7518, "step": 6808 }, { "epoch": 0.6282089724368585, "grad_norm": 1.5590897218916073, "learning_rate": 4.060401055494799e-07, "loss": 0.5127, "step": 6809 }, { "epoch": 0.6283012339983854, "grad_norm": 1.6707498346373368, "learning_rate": 4.0586389304856685e-07, "loss": 0.594, "step": 6810 }, { "epoch": 0.6283012339983854, "eval_GEN Loss": 0.4434267282485962, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3877648413181305, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8595853447914124, "eval_runtime": 57.2173, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6810 }, { "epoch": 0.6283934955599123, "grad_norm": 3.0623270778483684, "learning_rate": 4.056877004061126e-07, "loss": 0.6845, "step": 6811 }, { "epoch": 0.6284857571214393, "grad_norm": 1.8344457027075065, "learning_rate": 4.055115276380843e-07, "loss": 0.4703, "step": 6812 }, { "epoch": 0.6285780186829663, "grad_norm": 1.9835120276633036, "learning_rate": 4.053353747604468e-07, "loss": 0.6689, "step": 6813 }, { "epoch": 0.6286702802444931, "grad_norm": 2.145340598960444, "learning_rate": 4.051592417891635e-07, "loss": 0.7854, "step": 6814 }, { "epoch": 0.6287625418060201, "grad_norm": 2.548370939181327, "learning_rate": 4.0498312874019545e-07, "loss": 0.9855, "step": 6815 }, { "epoch": 0.6287625418060201, "eval_GEN Loss": 0.4427202343940735, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37023523449897766, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8596153855323792, "eval_runtime": 57.2402, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6815 }, { "epoch": 0.628854803367547, "grad_norm": 2.8129795273808598, "learning_rate": 4.048070356295028e-07, "loss": 0.8011, "step": 6816 }, { "epoch": 0.6289470649290739, "grad_norm": 2.4611156941720314, "learning_rate": 4.046309624730432e-07, "loss": 0.7828, "step": 6817 }, { "epoch": 0.6290393264906009, "grad_norm": 1.8438841024695967, "learning_rate": 4.044549092867725e-07, "loss": 0.5896, "step": 6818 }, { "epoch": 0.6291315880521278, "grad_norm": 1.0884287266643122, "learning_rate": 4.042788760866453e-07, "loss": 0.5336, "step": 6819 }, { "epoch": 0.6292238496136547, "grad_norm": 3.3291619857620818, "learning_rate": 4.0410286288861367e-07, "loss": 0.7275, "step": 6820 }, { "epoch": 0.6292238496136547, "eval_GEN Loss": 0.4428213834762573, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3631264269351959, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8638221025466919, "eval_runtime": 57.0414, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 6820 }, { "epoch": 0.6293161111751816, "grad_norm": 2.974800646895025, "learning_rate": 4.0392686970862836e-07, "loss": 0.7066, "step": 6821 }, { "epoch": 0.6294083727367086, "grad_norm": 1.9918412595089148, "learning_rate": 4.0375089656263774e-07, "loss": 0.5839, "step": 6822 }, { "epoch": 0.6295006342982356, "grad_norm": 2.3221423821456346, "learning_rate": 4.0357494346658947e-07, "loss": 0.6029, "step": 6823 }, { "epoch": 0.6295928958597624, "grad_norm": 1.5340343564043806, "learning_rate": 4.0339901043642825e-07, "loss": 0.5617, "step": 6824 }, { "epoch": 0.6296851574212894, "grad_norm": 2.322106285942456, "learning_rate": 4.032230974880974e-07, "loss": 0.6532, "step": 6825 }, { "epoch": 0.6296851574212894, "eval_GEN Loss": 0.4424263834953308, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36258140206336975, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.860546886920929, "eval_runtime": 57.2085, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6825 }, { "epoch": 0.6297774189828163, "grad_norm": 1.784779974714975, "learning_rate": 4.030472046375387e-07, "loss": 0.6749, "step": 6826 }, { "epoch": 0.6298696805443432, "grad_norm": 3.120002497266539, "learning_rate": 4.0287133190069166e-07, "loss": 0.9775, "step": 6827 }, { "epoch": 0.6299619421058701, "grad_norm": 2.010568251568145, "learning_rate": 4.0269547929349425e-07, "loss": 0.6925, "step": 6828 }, { "epoch": 0.6300542036673971, "grad_norm": 2.4757878736434074, "learning_rate": 4.025196468318822e-07, "loss": 0.7625, "step": 6829 }, { "epoch": 0.630146465228924, "grad_norm": 2.120763605763381, "learning_rate": 4.023438345317901e-07, "loss": 0.6795, "step": 6830 }, { "epoch": 0.630146465228924, "eval_GEN Loss": 0.4424962103366852, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3619265556335449, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8638221025466919, "eval_runtime": 57.4491, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 6830 }, { "epoch": 0.6302387267904509, "grad_norm": 2.921624745583971, "learning_rate": 4.021680424091501e-07, "loss": 0.7705, "step": 6831 }, { "epoch": 0.6303309883519779, "grad_norm": 1.7947186547150464, "learning_rate": 4.019922704798927e-07, "loss": 0.5906, "step": 6832 }, { "epoch": 0.6304232499135047, "grad_norm": 1.7687573744968907, "learning_rate": 4.01816518759947e-07, "loss": 0.5719, "step": 6833 }, { "epoch": 0.6305155114750317, "grad_norm": 2.7425873116418797, "learning_rate": 4.0164078726523967e-07, "loss": 0.6623, "step": 6834 }, { "epoch": 0.6306077730365587, "grad_norm": 1.8453744632931732, "learning_rate": 4.014650760116957e-07, "loss": 0.4447, "step": 6835 }, { "epoch": 0.6306077730365587, "eval_GEN Loss": 0.4429917335510254, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3666442334651947, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8644831776618958, "eval_runtime": 57.2219, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6835 }, { "epoch": 0.6307000345980855, "grad_norm": 2.6477714101885694, "learning_rate": 4.012893850152383e-07, "loss": 0.8161, "step": 6836 }, { "epoch": 0.6307922961596125, "grad_norm": 1.9405892504332671, "learning_rate": 4.011137142917891e-07, "loss": 0.5872, "step": 6837 }, { "epoch": 0.6308845577211394, "grad_norm": 2.7977820506944697, "learning_rate": 4.009380638572675e-07, "loss": 0.7432, "step": 6838 }, { "epoch": 0.6309768192826664, "grad_norm": 2.2949325375892458, "learning_rate": 4.007624337275912e-07, "loss": 0.811, "step": 6839 }, { "epoch": 0.6310690808441933, "grad_norm": 1.8422322612142183, "learning_rate": 4.00586823918676e-07, "loss": 0.5369, "step": 6840 }, { "epoch": 0.6310690808441933, "eval_GEN Loss": 0.442391574382782, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36809033155441284, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8634315133094788, "eval_runtime": 56.5253, "eval_samples_per_second": 1.15, "eval_steps_per_second": 0.088, "step": 6840 }, { "epoch": 0.6311613424057202, "grad_norm": 2.4365761806358286, "learning_rate": 4.004112344464361e-07, "loss": 0.7874, "step": 6841 }, { "epoch": 0.6312536039672472, "grad_norm": 1.9907597212902193, "learning_rate": 4.002356653267838e-07, "loss": 0.7135, "step": 6842 }, { "epoch": 0.631345865528774, "grad_norm": 2.0509846447061006, "learning_rate": 4.0006011657562913e-07, "loss": 0.7247, "step": 6843 }, { "epoch": 0.631438127090301, "grad_norm": 1.7385070978927342, "learning_rate": 3.998845882088809e-07, "loss": 0.5826, "step": 6844 }, { "epoch": 0.631530388651828, "grad_norm": 2.2498323436065917, "learning_rate": 3.997090802424455e-07, "loss": 0.7773, "step": 6845 }, { "epoch": 0.631530388651828, "eval_GEN Loss": 0.44177380204200745, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.36768338084220886, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8628305196762085, "eval_runtime": 57.0845, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6845 }, { "epoch": 0.6316226502133548, "grad_norm": 1.6787372016762163, "learning_rate": 3.99533592692228e-07, "loss": 0.6498, "step": 6846 }, { "epoch": 0.6317149117748818, "grad_norm": 1.6979055955331477, "learning_rate": 3.993581255741309e-07, "loss": 0.673, "step": 6847 }, { "epoch": 0.6318071733364087, "grad_norm": 2.512622963538286, "learning_rate": 3.991826789040559e-07, "loss": 0.7068, "step": 6848 }, { "epoch": 0.6318994348979357, "grad_norm": 1.5417710972787617, "learning_rate": 3.99007252697902e-07, "loss": 0.6488, "step": 6849 }, { "epoch": 0.6319916964594626, "grad_norm": 2.694902670486016, "learning_rate": 3.988318469715663e-07, "loss": 0.5625, "step": 6850 }, { "epoch": 0.6319916964594626, "eval_GEN Loss": 0.4424646198749542, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3706446588039398, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8665865659713745, "eval_runtime": 57.0581, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6850 }, { "epoch": 0.6320839580209895, "grad_norm": 1.5813615097756348, "learning_rate": 3.9865646174094485e-07, "loss": 0.5481, "step": 6851 }, { "epoch": 0.6321762195825165, "grad_norm": 2.5821406589546414, "learning_rate": 3.984810970219312e-07, "loss": 0.5642, "step": 6852 }, { "epoch": 0.6322684811440433, "grad_norm": 2.3968287933267174, "learning_rate": 3.98305752830417e-07, "loss": 0.6347, "step": 6853 }, { "epoch": 0.6323607427055703, "grad_norm": 1.858317190083208, "learning_rate": 3.981304291822922e-07, "loss": 0.6545, "step": 6854 }, { "epoch": 0.6324530042670973, "grad_norm": 2.3893905720449453, "learning_rate": 3.9795512609344515e-07, "loss": 0.7536, "step": 6855 }, { "epoch": 0.6324530042670973, "eval_GEN Loss": 0.44355449080467224, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.37406110763549805, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8667668104171753, "eval_runtime": 56.4144, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 6855 }, { "epoch": 0.6325452658286241, "grad_norm": 1.973764101116914, "learning_rate": 3.9777984357976183e-07, "loss": 0.7717, "step": 6856 }, { "epoch": 0.6326375273901511, "grad_norm": 2.3959457815669776, "learning_rate": 3.976045816571266e-07, "loss": 0.6659, "step": 6857 }, { "epoch": 0.632729788951678, "grad_norm": 1.9016308378519438, "learning_rate": 3.974293403414223e-07, "loss": 0.6881, "step": 6858 }, { "epoch": 0.632822050513205, "grad_norm": 2.389044135919377, "learning_rate": 3.9725411964852945e-07, "loss": 0.7351, "step": 6859 }, { "epoch": 0.6329143120747318, "grad_norm": 3.1898348214006775, "learning_rate": 3.970789195943267e-07, "loss": 0.7369, "step": 6860 }, { "epoch": 0.6329143120747318, "eval_GEN Loss": 0.44391733407974243, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3860008716583252, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8693209290504456, "eval_runtime": 56.2079, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 6860 }, { "epoch": 0.6330065736362588, "grad_norm": 1.9288033601811556, "learning_rate": 3.969037401946908e-07, "loss": 0.7124, "step": 6861 }, { "epoch": 0.6330988351977858, "grad_norm": 1.7794927957823172, "learning_rate": 3.9672858146549725e-07, "loss": 0.7096, "step": 6862 }, { "epoch": 0.6331910967593126, "grad_norm": 2.4845437740274248, "learning_rate": 3.965534434226189e-07, "loss": 0.7441, "step": 6863 }, { "epoch": 0.6332833583208396, "grad_norm": 1.593801639384076, "learning_rate": 3.96378326081927e-07, "loss": 0.5178, "step": 6864 }, { "epoch": 0.6333756198823665, "grad_norm": 1.9817284914631124, "learning_rate": 3.9620322945929115e-07, "loss": 0.6257, "step": 6865 }, { "epoch": 0.6333756198823665, "eval_GEN Loss": 0.4431268274784088, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3875719904899597, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8712139129638672, "eval_runtime": 56.4681, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 6865 }, { "epoch": 0.6334678814438934, "grad_norm": 2.315170834327458, "learning_rate": 3.960281535705787e-07, "loss": 0.7345, "step": 6866 }, { "epoch": 0.6335601430054204, "grad_norm": 2.7037305364420128, "learning_rate": 3.958530984316554e-07, "loss": 0.7193, "step": 6867 }, { "epoch": 0.6336524045669473, "grad_norm": 2.8288317237422658, "learning_rate": 3.9567806405838495e-07, "loss": 0.7103, "step": 6868 }, { "epoch": 0.6337446661284742, "grad_norm": 2.334593413520641, "learning_rate": 3.955030504666294e-07, "loss": 0.7616, "step": 6869 }, { "epoch": 0.6338369276900011, "grad_norm": 1.6788838908497168, "learning_rate": 3.953280576722487e-07, "loss": 0.5799, "step": 6870 }, { "epoch": 0.6338369276900011, "eval_GEN Loss": 0.44294634461402893, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3783740997314453, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8668269515037537, "eval_runtime": 56.3272, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6870 }, { "epoch": 0.6339291892515281, "grad_norm": 2.0896168735056575, "learning_rate": 3.951530856911008e-07, "loss": 0.6554, "step": 6871 }, { "epoch": 0.634021450813055, "grad_norm": 1.876141901466242, "learning_rate": 3.949781345390419e-07, "loss": 0.6567, "step": 6872 }, { "epoch": 0.6341137123745819, "grad_norm": 1.9381782030898589, "learning_rate": 3.9480320423192677e-07, "loss": 0.8079, "step": 6873 }, { "epoch": 0.6342059739361089, "grad_norm": 2.4344677984565757, "learning_rate": 3.9462829478560753e-07, "loss": 0.8635, "step": 6874 }, { "epoch": 0.6342982354976358, "grad_norm": 1.9798449292771287, "learning_rate": 3.944534062159347e-07, "loss": 0.6304, "step": 6875 }, { "epoch": 0.6342982354976358, "eval_GEN Loss": 0.44391706585884094, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.37103477120399475, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8692908883094788, "eval_runtime": 56.3436, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6875 }, { "epoch": 0.6343904970591627, "grad_norm": 2.0396657905253917, "learning_rate": 3.942785385387572e-07, "loss": 0.7516, "step": 6876 }, { "epoch": 0.6344827586206897, "grad_norm": 2.2875317845245537, "learning_rate": 3.9410369176992183e-07, "loss": 0.729, "step": 6877 }, { "epoch": 0.6345750201822166, "grad_norm": 1.6390418597065588, "learning_rate": 3.939288659252732e-07, "loss": 0.6635, "step": 6878 }, { "epoch": 0.6346672817437435, "grad_norm": 2.1622725192854286, "learning_rate": 3.9375406102065453e-07, "loss": 0.5252, "step": 6879 }, { "epoch": 0.6347595433052704, "grad_norm": 3.2171037730611305, "learning_rate": 3.9357927707190683e-07, "loss": 0.9816, "step": 6880 }, { "epoch": 0.6347595433052704, "eval_GEN Loss": 0.4444407820701599, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37013834714889526, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8661057949066162, "eval_runtime": 57.2221, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6880 }, { "epoch": 0.6348518048667974, "grad_norm": 1.970978494042417, "learning_rate": 3.934045140948693e-07, "loss": 0.7965, "step": 6881 }, { "epoch": 0.6349440664283243, "grad_norm": 2.7059238728096915, "learning_rate": 3.9322977210537905e-07, "loss": 0.8189, "step": 6882 }, { "epoch": 0.6350363279898512, "grad_norm": 1.9131532443808075, "learning_rate": 3.930550511192718e-07, "loss": 0.6145, "step": 6883 }, { "epoch": 0.6351285895513782, "grad_norm": 1.9760930064405364, "learning_rate": 3.9288035115238097e-07, "loss": 0.7508, "step": 6884 }, { "epoch": 0.635220851112905, "grad_norm": 2.5626550058086797, "learning_rate": 3.9270567222053815e-07, "loss": 0.7142, "step": 6885 }, { "epoch": 0.635220851112905, "eval_GEN Loss": 0.4446733593940735, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37378090620040894, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8701622486114502, "eval_runtime": 57.119, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 6885 }, { "epoch": 0.635313112674432, "grad_norm": 2.1787942581660733, "learning_rate": 3.925310143395726e-07, "loss": 0.6498, "step": 6886 }, { "epoch": 0.635405374235959, "grad_norm": 2.644957346776576, "learning_rate": 3.9235637752531267e-07, "loss": 0.7213, "step": 6887 }, { "epoch": 0.6354976357974859, "grad_norm": 1.7854498457727848, "learning_rate": 3.9218176179358415e-07, "loss": 0.7373, "step": 6888 }, { "epoch": 0.6355898973590128, "grad_norm": 2.0383702372291266, "learning_rate": 3.9200716716021053e-07, "loss": 0.5559, "step": 6889 }, { "epoch": 0.6356821589205397, "grad_norm": 1.7449576276672987, "learning_rate": 3.9183259364101444e-07, "loss": 0.7042, "step": 6890 }, { "epoch": 0.6356821589205397, "eval_GEN Loss": 0.44557079672813416, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.37430664896965027, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8682091236114502, "eval_runtime": 57.1896, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6890 }, { "epoch": 0.6357744204820667, "grad_norm": 1.6865475540207848, "learning_rate": 3.9165804125181563e-07, "loss": 0.6246, "step": 6891 }, { "epoch": 0.6358666820435935, "grad_norm": 1.6165831203484426, "learning_rate": 3.914835100084324e-07, "loss": 0.5508, "step": 6892 }, { "epoch": 0.6359589436051205, "grad_norm": 2.802108411134903, "learning_rate": 3.913089999266809e-07, "loss": 0.7265, "step": 6893 }, { "epoch": 0.6360512051666475, "grad_norm": 1.5316820986784931, "learning_rate": 3.9113451102237574e-07, "loss": 0.5487, "step": 6894 }, { "epoch": 0.6361434667281743, "grad_norm": 1.85206164912579, "learning_rate": 3.909600433113295e-07, "loss": 0.811, "step": 6895 }, { "epoch": 0.6361434667281743, "eval_GEN Loss": 0.44694429636001587, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3719564378261566, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8663160800933838, "eval_runtime": 57.2256, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6895 }, { "epoch": 0.6362357282897013, "grad_norm": 1.2303676859651853, "learning_rate": 3.907855968093524e-07, "loss": 0.6209, "step": 6896 }, { "epoch": 0.6363279898512282, "grad_norm": 2.826021117990372, "learning_rate": 3.906111715322529e-07, "loss": 0.685, "step": 6897 }, { "epoch": 0.6364202514127552, "grad_norm": 1.4873042566146777, "learning_rate": 3.904367674958383e-07, "loss": 0.6362, "step": 6898 }, { "epoch": 0.6365125129742821, "grad_norm": 2.4473173538045425, "learning_rate": 3.90262384715913e-07, "loss": 0.67, "step": 6899 }, { "epoch": 0.636604774535809, "grad_norm": 1.7899012349824994, "learning_rate": 3.9008802320827973e-07, "loss": 0.5687, "step": 6900 }, { "epoch": 0.636604774535809, "eval_GEN Loss": 0.4466889202594757, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3666170835494995, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8607872724533081, "eval_runtime": 57.3801, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6900 }, { "epoch": 0.636697036097336, "grad_norm": 1.8598237720060165, "learning_rate": 3.8991368298873975e-07, "loss": 0.5629, "step": 6901 }, { "epoch": 0.6367892976588628, "grad_norm": 1.2783502119409806, "learning_rate": 3.8973936407309176e-07, "loss": 0.5608, "step": 6902 }, { "epoch": 0.6368815592203898, "grad_norm": 1.8431864645049734, "learning_rate": 3.8956506647713293e-07, "loss": 0.7843, "step": 6903 }, { "epoch": 0.6369738207819168, "grad_norm": 1.6883894111888333, "learning_rate": 3.893907902166582e-07, "loss": 0.5729, "step": 6904 }, { "epoch": 0.6370660823434436, "grad_norm": 1.405649096073794, "learning_rate": 3.892165353074611e-07, "loss": 0.4744, "step": 6905 }, { "epoch": 0.6370660823434436, "eval_GEN Loss": 0.4475747346878052, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3635445237159729, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8585637211799622, "eval_runtime": 57.1481, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6905 }, { "epoch": 0.6371583439049706, "grad_norm": 1.8657577858576249, "learning_rate": 3.890423017653327e-07, "loss": 0.5723, "step": 6906 }, { "epoch": 0.6372506054664975, "grad_norm": 1.3391629928488287, "learning_rate": 3.8886808960606204e-07, "loss": 0.4884, "step": 6907 }, { "epoch": 0.6373428670280245, "grad_norm": 1.6943434029962312, "learning_rate": 3.886938988454371e-07, "loss": 0.6305, "step": 6908 }, { "epoch": 0.6374351285895514, "grad_norm": 2.393189034657867, "learning_rate": 3.885197294992429e-07, "loss": 0.6863, "step": 6909 }, { "epoch": 0.6375273901510783, "grad_norm": 1.7752946135098124, "learning_rate": 3.8834558158326304e-07, "loss": 0.6039, "step": 6910 }, { "epoch": 0.6375273901510783, "eval_GEN Loss": 0.4473362863063812, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35687240958213806, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8519230484962463, "eval_runtime": 57.3163, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6910 }, { "epoch": 0.6376196517126053, "grad_norm": 1.8486251374961478, "learning_rate": 3.881714551132789e-07, "loss": 0.5112, "step": 6911 }, { "epoch": 0.6377119132741321, "grad_norm": 2.0839629241720856, "learning_rate": 3.879973501050705e-07, "loss": 0.6275, "step": 6912 }, { "epoch": 0.6378041748356591, "grad_norm": 2.479718546427877, "learning_rate": 3.8782326657441526e-07, "loss": 0.5808, "step": 6913 }, { "epoch": 0.6378964363971861, "grad_norm": 2.5152884043835404, "learning_rate": 3.8764920453708885e-07, "loss": 0.7395, "step": 6914 }, { "epoch": 0.6379886979587129, "grad_norm": 1.9458669889138476, "learning_rate": 3.8747516400886516e-07, "loss": 0.646, "step": 6915 }, { "epoch": 0.6379886979587129, "eval_GEN Loss": 0.44740691781044006, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34758833050727844, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8487379550933838, "eval_runtime": 57.2334, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6915 }, { "epoch": 0.6380809595202399, "grad_norm": 1.6889573700258513, "learning_rate": 3.8730114500551604e-07, "loss": 0.6471, "step": 6916 }, { "epoch": 0.6381732210817668, "grad_norm": 1.4495598088460082, "learning_rate": 3.8712714754281135e-07, "loss": 0.5001, "step": 6917 }, { "epoch": 0.6382654826432937, "grad_norm": 2.130338449370267, "learning_rate": 3.8695317163651865e-07, "loss": 0.6659, "step": 6918 }, { "epoch": 0.6383577442048207, "grad_norm": 2.0639686356047577, "learning_rate": 3.8677921730240447e-07, "loss": 0.7295, "step": 6919 }, { "epoch": 0.6384500057663476, "grad_norm": 2.4063042444622367, "learning_rate": 3.8660528455623254e-07, "loss": 0.6622, "step": 6920 }, { "epoch": 0.6384500057663476, "eval_GEN Loss": 0.4476137161254883, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34076741337776184, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8494290709495544, "eval_runtime": 57.3679, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6920 }, { "epoch": 0.6385422673278746, "grad_norm": 1.966063477321812, "learning_rate": 3.864313734137648e-07, "loss": 0.6159, "step": 6921 }, { "epoch": 0.6386345288894014, "grad_norm": 2.5702570511190364, "learning_rate": 3.862574838907617e-07, "loss": 0.7603, "step": 6922 }, { "epoch": 0.6387267904509284, "grad_norm": 2.1784982175546546, "learning_rate": 3.8608361600298125e-07, "loss": 0.4977, "step": 6923 }, { "epoch": 0.6388190520124553, "grad_norm": 1.634770536334807, "learning_rate": 3.859097697661796e-07, "loss": 0.6778, "step": 6924 }, { "epoch": 0.6389113135739822, "grad_norm": 2.3100651617720867, "learning_rate": 3.8573594519611075e-07, "loss": 0.6939, "step": 6925 }, { "epoch": 0.6389113135739822, "eval_GEN Loss": 0.4471907913684845, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33959782123565674, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8453726172447205, "eval_runtime": 57.1511, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 6925 }, { "epoch": 0.6390035751355092, "grad_norm": 2.7670239395700227, "learning_rate": 3.8556214230852736e-07, "loss": 0.7856, "step": 6926 }, { "epoch": 0.6390958366970361, "grad_norm": 3.8063892410177407, "learning_rate": 3.853883611191794e-07, "loss": 0.8777, "step": 6927 }, { "epoch": 0.639188098258563, "grad_norm": 1.458512099969704, "learning_rate": 3.8521460164381535e-07, "loss": 0.6437, "step": 6928 }, { "epoch": 0.6392803598200899, "grad_norm": 1.4208737585833204, "learning_rate": 3.850408638981813e-07, "loss": 0.4785, "step": 6929 }, { "epoch": 0.6393726213816169, "grad_norm": 1.452660293413529, "learning_rate": 3.8486714789802217e-07, "loss": 0.4139, "step": 6930 }, { "epoch": 0.6393726213816169, "eval_GEN Loss": 0.4465237855911255, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34699901938438416, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.840114176273346, "eval_runtime": 55.9402, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 6930 }, { "epoch": 0.6394648829431439, "grad_norm": 3.296331706436945, "learning_rate": 3.8469345365908006e-07, "loss": 0.7107, "step": 6931 }, { "epoch": 0.6395571445046707, "grad_norm": 1.6083501967457308, "learning_rate": 3.845197811970951e-07, "loss": 0.5753, "step": 6932 }, { "epoch": 0.6396494060661977, "grad_norm": 1.8404612888571514, "learning_rate": 3.8434613052780636e-07, "loss": 0.6568, "step": 6933 }, { "epoch": 0.6397416676277246, "grad_norm": 3.2882086386139155, "learning_rate": 3.841725016669501e-07, "loss": 0.8014, "step": 6934 }, { "epoch": 0.6398339291892515, "grad_norm": 2.1717466896413993, "learning_rate": 3.839988946302607e-07, "loss": 0.6109, "step": 6935 }, { "epoch": 0.6398339291892515, "eval_GEN Loss": 0.44702526926994324, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.35440823435783386, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.839062511920929, "eval_runtime": 56.3433, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 6935 }, { "epoch": 0.6399261907507785, "grad_norm": 1.781779272126664, "learning_rate": 3.838253094334708e-07, "loss": 0.7311, "step": 6936 }, { "epoch": 0.6400184523123054, "grad_norm": 2.7772269930573272, "learning_rate": 3.836517460923111e-07, "loss": 0.7401, "step": 6937 }, { "epoch": 0.6401107138738323, "grad_norm": 2.6833154511709467, "learning_rate": 3.8347820462250996e-07, "loss": 0.6987, "step": 6938 }, { "epoch": 0.6402029754353592, "grad_norm": 4.918832528089281, "learning_rate": 3.83304685039794e-07, "loss": 0.9551, "step": 6939 }, { "epoch": 0.6402952369968862, "grad_norm": 1.6086025880565138, "learning_rate": 3.8313118735988803e-07, "loss": 0.5303, "step": 6940 }, { "epoch": 0.6402952369968862, "eval_GEN Loss": 0.44749605655670166, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36444953083992004, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8432692289352417, "eval_runtime": 56.2034, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 6940 }, { "epoch": 0.6403874985584131, "grad_norm": 1.8570133590656868, "learning_rate": 3.829577115985146e-07, "loss": 0.7639, "step": 6941 }, { "epoch": 0.64047976011994, "grad_norm": 2.0916081937872955, "learning_rate": 3.827842577713943e-07, "loss": 0.6976, "step": 6942 }, { "epoch": 0.640572021681467, "grad_norm": 1.7330612661122404, "learning_rate": 3.8261082589424554e-07, "loss": 0.5833, "step": 6943 }, { "epoch": 0.6406642832429938, "grad_norm": 2.206949844533287, "learning_rate": 3.824374159827856e-07, "loss": 0.6355, "step": 6944 }, { "epoch": 0.6407565448045208, "grad_norm": 2.195589007901985, "learning_rate": 3.822640280527288e-07, "loss": 0.7539, "step": 6945 }, { "epoch": 0.6407565448045208, "eval_GEN Loss": 0.44642820954322815, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3702472448348999, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8378305435180664, "eval_runtime": 57.3067, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6945 }, { "epoch": 0.6408488063660478, "grad_norm": 2.0946660060765154, "learning_rate": 3.820906621197877e-07, "loss": 0.7294, "step": 6946 }, { "epoch": 0.6409410679275747, "grad_norm": 1.6263740734645407, "learning_rate": 3.819173181996731e-07, "loss": 0.5634, "step": 6947 }, { "epoch": 0.6410333294891016, "grad_norm": 1.7956987926006476, "learning_rate": 3.817439963080939e-07, "loss": 0.7632, "step": 6948 }, { "epoch": 0.6411255910506285, "grad_norm": 1.7738298469298306, "learning_rate": 3.815706964607567e-07, "loss": 0.7111, "step": 6949 }, { "epoch": 0.6412178526121555, "grad_norm": 2.2256096152599314, "learning_rate": 3.81397418673366e-07, "loss": 0.6559, "step": 6950 }, { "epoch": 0.6412178526121555, "eval_GEN Loss": 0.44628575444221497, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM Loss": 0.3708188831806183, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8369290828704834, "eval_runtime": 57.2322, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6950 }, { "epoch": 0.6413101141736824, "grad_norm": 2.110557086895702, "learning_rate": 3.812241629616248e-07, "loss": 0.6887, "step": 6951 }, { "epoch": 0.6414023757352093, "grad_norm": 1.6766192525025363, "learning_rate": 3.810509293412336e-07, "loss": 0.5697, "step": 6952 }, { "epoch": 0.6414946372967363, "grad_norm": 1.4235163814196747, "learning_rate": 3.8087771782789094e-07, "loss": 0.5584, "step": 6953 }, { "epoch": 0.6415868988582631, "grad_norm": 2.2688448482782264, "learning_rate": 3.80704528437294e-07, "loss": 0.7799, "step": 6954 }, { "epoch": 0.6416791604197901, "grad_norm": 2.9186278015699743, "learning_rate": 3.805313611851373e-07, "loss": 0.719, "step": 6955 }, { "epoch": 0.6416791604197901, "eval_GEN Loss": 0.44653522968292236, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8553459119496856, "eval_PRM F1 AUC": 0.7357255107386066, "eval_PRM F1 Neg": 0.5660377358490566, "eval_PRM Loss": 0.3731921315193176, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8947368421052632, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8352764248847961, "eval_runtime": 57.0529, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6955 }, { "epoch": 0.641771421981317, "grad_norm": 1.4285104941384161, "learning_rate": 3.803582160871133e-07, "loss": 0.5915, "step": 6956 }, { "epoch": 0.641863683542844, "grad_norm": 1.4910207737253443, "learning_rate": 3.8018509315891265e-07, "loss": 0.3669, "step": 6957 }, { "epoch": 0.6419559451043709, "grad_norm": 1.4369308844912188, "learning_rate": 3.8001199241622447e-07, "loss": 0.4815, "step": 6958 }, { "epoch": 0.6420482066658978, "grad_norm": 2.4351202654634334, "learning_rate": 3.798389138747352e-07, "loss": 0.6282, "step": 6959 }, { "epoch": 0.6421404682274248, "grad_norm": 2.5642636295667427, "learning_rate": 3.7966585755012933e-07, "loss": 0.6199, "step": 6960 }, { "epoch": 0.6421404682274248, "eval_GEN Loss": 0.44564467668533325, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.36055073142051697, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.831760823726654, "eval_runtime": 57.2261, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 6960 }, { "epoch": 0.6422327297889516, "grad_norm": 3.288736027033099, "learning_rate": 3.7949282345808954e-07, "loss": 0.7189, "step": 6961 }, { "epoch": 0.6423249913504786, "grad_norm": 1.9878956345196113, "learning_rate": 3.7931981161429666e-07, "loss": 0.7033, "step": 6962 }, { "epoch": 0.6424172529120056, "grad_norm": 2.277278784626361, "learning_rate": 3.791468220344291e-07, "loss": 0.5625, "step": 6963 }, { "epoch": 0.6425095144735324, "grad_norm": 1.5090966908127812, "learning_rate": 3.789738547341633e-07, "loss": 0.5292, "step": 6964 }, { "epoch": 0.6426017760350594, "grad_norm": 2.2719331703981407, "learning_rate": 3.7880090972917434e-07, "loss": 0.7725, "step": 6965 }, { "epoch": 0.6426017760350594, "eval_GEN Loss": 0.44494181871414185, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3473963737487793, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8300480842590332, "eval_runtime": 57.2772, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6965 }, { "epoch": 0.6426940375965863, "grad_norm": 2.472370856964816, "learning_rate": 3.7862798703513434e-07, "loss": 0.5628, "step": 6966 }, { "epoch": 0.6427862991581133, "grad_norm": 2.1156386945809875, "learning_rate": 3.7845508666771404e-07, "loss": 0.5916, "step": 6967 }, { "epoch": 0.6428785607196402, "grad_norm": 2.4361802553297336, "learning_rate": 3.782822086425816e-07, "loss": 0.6797, "step": 6968 }, { "epoch": 0.6429708222811671, "grad_norm": 1.6777803025467544, "learning_rate": 3.7810935297540404e-07, "loss": 0.743, "step": 6969 }, { "epoch": 0.6430630838426941, "grad_norm": 1.5656967822806755, "learning_rate": 3.779365196818454e-07, "loss": 0.5897, "step": 6970 }, { "epoch": 0.6430630838426941, "eval_GEN Loss": 0.44483956694602966, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3431446850299835, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8348256945610046, "eval_runtime": 57.3134, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6970 }, { "epoch": 0.6431553454042209, "grad_norm": 1.4207136058962329, "learning_rate": 3.7776370877756817e-07, "loss": 0.4437, "step": 6971 }, { "epoch": 0.6432476069657479, "grad_norm": 1.9811673877984388, "learning_rate": 3.7759092027823294e-07, "loss": 0.6235, "step": 6972 }, { "epoch": 0.6433398685272749, "grad_norm": 1.9115632223053676, "learning_rate": 3.77418154199498e-07, "loss": 0.6102, "step": 6973 }, { "epoch": 0.6434321300888017, "grad_norm": 2.9582719367406387, "learning_rate": 3.7724541055701945e-07, "loss": 0.7028, "step": 6974 }, { "epoch": 0.6435243916503287, "grad_norm": 1.5587643455648463, "learning_rate": 3.770726893664517e-07, "loss": 0.5526, "step": 6975 }, { "epoch": 0.6435243916503287, "eval_GEN Loss": 0.445298433303833, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34304895997047424, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8378005027770996, "eval_runtime": 57.3466, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 6975 }, { "epoch": 0.6436166532118556, "grad_norm": 1.9883889506055532, "learning_rate": 3.7689999064344726e-07, "loss": 0.6509, "step": 6976 }, { "epoch": 0.6437089147733825, "grad_norm": 2.920132645649781, "learning_rate": 3.7672731440365615e-07, "loss": 0.7466, "step": 6977 }, { "epoch": 0.6438011763349095, "grad_norm": 3.0481324332462902, "learning_rate": 3.765546606627264e-07, "loss": 0.7439, "step": 6978 }, { "epoch": 0.6438934378964364, "grad_norm": 2.6908231131501927, "learning_rate": 3.763820294363046e-07, "loss": 0.8204, "step": 6979 }, { "epoch": 0.6439856994579634, "grad_norm": 1.6651790602814673, "learning_rate": 3.7620942074003465e-07, "loss": 0.5992, "step": 6980 }, { "epoch": 0.6439856994579634, "eval_GEN Loss": 0.44406598806381226, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34257251024246216, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8314303159713745, "eval_runtime": 57.6284, "eval_samples_per_second": 1.128, "eval_steps_per_second": 0.087, "step": 6980 }, { "epoch": 0.6440779610194902, "grad_norm": 1.5925118774587792, "learning_rate": 3.7603683458955846e-07, "loss": 0.616, "step": 6981 }, { "epoch": 0.6441702225810172, "grad_norm": 2.01825155940416, "learning_rate": 3.7586427100051623e-07, "loss": 0.739, "step": 6982 }, { "epoch": 0.6442624841425442, "grad_norm": 3.179324442280715, "learning_rate": 3.756917299885458e-07, "loss": 0.7952, "step": 6983 }, { "epoch": 0.644354745704071, "grad_norm": 1.5290184208156852, "learning_rate": 3.7551921156928334e-07, "loss": 0.4857, "step": 6984 }, { "epoch": 0.644447007265598, "grad_norm": 2.34542414770504, "learning_rate": 3.7534671575836276e-07, "loss": 0.6138, "step": 6985 }, { "epoch": 0.644447007265598, "eval_GEN Loss": 0.4450426995754242, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3518375754356384, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8343148827552795, "eval_runtime": 57.3023, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 6985 }, { "epoch": 0.6445392688271249, "grad_norm": 1.7960090156907975, "learning_rate": 3.7517424257141555e-07, "loss": 0.7472, "step": 6986 }, { "epoch": 0.6446315303886518, "grad_norm": 2.1609357075345237, "learning_rate": 3.750017920240718e-07, "loss": 0.7202, "step": 6987 }, { "epoch": 0.6447237919501787, "grad_norm": 1.877524877185912, "learning_rate": 3.748293641319592e-07, "loss": 0.5794, "step": 6988 }, { "epoch": 0.6448160535117057, "grad_norm": 1.6902799899279854, "learning_rate": 3.746569589107031e-07, "loss": 0.7036, "step": 6989 }, { "epoch": 0.6449083150732327, "grad_norm": 1.9401446470233226, "learning_rate": 3.7448457637592765e-07, "loss": 0.7154, "step": 6990 }, { "epoch": 0.6449083150732327, "eval_GEN Loss": 0.44461897015571594, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3572132885456085, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8315504789352417, "eval_runtime": 57.2586, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 6990 }, { "epoch": 0.6450005766347595, "grad_norm": 2.322307967657928, "learning_rate": 3.7431221654325433e-07, "loss": 0.6255, "step": 6991 }, { "epoch": 0.6450928381962865, "grad_norm": 1.4407896313657145, "learning_rate": 3.7413987942830245e-07, "loss": 0.5226, "step": 6992 }, { "epoch": 0.6451850997578134, "grad_norm": 2.3418699170765365, "learning_rate": 3.739675650466893e-07, "loss": 0.7352, "step": 6993 }, { "epoch": 0.6452773613193403, "grad_norm": 2.271838721016078, "learning_rate": 3.7379527341403085e-07, "loss": 0.7655, "step": 6994 }, { "epoch": 0.6453696228808673, "grad_norm": 2.5448883821040034, "learning_rate": 3.736230045459401e-07, "loss": 0.7326, "step": 6995 }, { "epoch": 0.6453696228808673, "eval_GEN Loss": 0.44521889090538025, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3708037734031677, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8363281488418579, "eval_runtime": 57.0749, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 6995 }, { "epoch": 0.6454618844423942, "grad_norm": 1.8692219874880716, "learning_rate": 3.734507584580281e-07, "loss": 0.6659, "step": 6996 }, { "epoch": 0.6455541460039211, "grad_norm": 1.445863106435294, "learning_rate": 3.7327853516590464e-07, "loss": 0.5647, "step": 6997 }, { "epoch": 0.645646407565448, "grad_norm": 2.25593804563332, "learning_rate": 3.731063346851764e-07, "loss": 0.7853, "step": 6998 }, { "epoch": 0.645738669126975, "grad_norm": 2.201741220167767, "learning_rate": 3.729341570314486e-07, "loss": 0.8209, "step": 6999 }, { "epoch": 0.645830930688502, "grad_norm": 2.0185877755464423, "learning_rate": 3.7276200222032404e-07, "loss": 0.5146, "step": 7000 }, { "epoch": 0.645830930688502, "eval_GEN Loss": 0.44541022181510925, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8481012658227848, "eval_PRM F1 AUC": 0.7297014143530645, "eval_PRM F1 Neg": 0.5555555555555556, "eval_PRM Loss": 0.3909095525741577, "eval_PRM NPV": 0.4838709677419355, "eval_PRM Precision": 0.8933333333333333, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8440805077552795, "eval_runtime": 57.1234, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7000 }, { "epoch": 0.6459231922500288, "grad_norm": 2.2650591804186795, "learning_rate": 3.725898702674041e-07, "loss": 0.6873, "step": 7001 }, { "epoch": 0.6460154538115558, "grad_norm": 1.3267366748338156, "learning_rate": 3.7241776118828746e-07, "loss": 0.584, "step": 7002 }, { "epoch": 0.6461077153730826, "grad_norm": 2.049456019785359, "learning_rate": 3.7224567499857063e-07, "loss": 0.4733, "step": 7003 }, { "epoch": 0.6461999769346096, "grad_norm": 2.9417522368569315, "learning_rate": 3.7207361171384876e-07, "loss": 0.7834, "step": 7004 }, { "epoch": 0.6462922384961366, "grad_norm": 2.519623793070622, "learning_rate": 3.719015713497144e-07, "loss": 0.7781, "step": 7005 }, { "epoch": 0.6462922384961366, "eval_GEN Loss": 0.44533097743988037, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8516129032258064, "eval_PRM F1 AUC": 0.7671555788370874, "eval_PRM F1 Neg": 0.5964912280701754, "eval_PRM Loss": 0.3978186845779419, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.8450420498847961, "eval_runtime": 57.1581, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7005 }, { "epoch": 0.6463845000576635, "grad_norm": 2.602358786869019, "learning_rate": 3.717295539217579e-07, "loss": 0.482, "step": 7006 }, { "epoch": 0.6464767616191904, "grad_norm": 1.9738993307352803, "learning_rate": 3.715575594455678e-07, "loss": 0.7052, "step": 7007 }, { "epoch": 0.6465690231807173, "grad_norm": 2.221634736571983, "learning_rate": 3.7138558793673074e-07, "loss": 0.6154, "step": 7008 }, { "epoch": 0.6466612847422443, "grad_norm": 1.8824976462897298, "learning_rate": 3.7121363941083096e-07, "loss": 0.787, "step": 7009 }, { "epoch": 0.6467535463037712, "grad_norm": 3.1798952757337804, "learning_rate": 3.710417138834503e-07, "loss": 0.9176, "step": 7010 }, { "epoch": 0.6467535463037712, "eval_GEN Loss": 0.44471707940101624, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8607594936708861, "eval_PRM F1 AUC": 0.7574646411733892, "eval_PRM F1 Neg": 0.5925925925925926, "eval_PRM Loss": 0.3890116214752197, "eval_PRM NPV": 0.5161290322580645, "eval_PRM Precision": 0.9066666666666666, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8398737907409668, "eval_runtime": 57.1973, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7010 }, { "epoch": 0.6468458078652981, "grad_norm": 1.342354740164996, "learning_rate": 3.708698113701695e-07, "loss": 0.5292, "step": 7011 }, { "epoch": 0.6469380694268251, "grad_norm": 2.7214034860233163, "learning_rate": 3.706979318865665e-07, "loss": 0.794, "step": 7012 }, { "epoch": 0.6470303309883519, "grad_norm": 2.912428574539251, "learning_rate": 3.7052607544821704e-07, "loss": 0.5938, "step": 7013 }, { "epoch": 0.6471225925498789, "grad_norm": 2.6669897682072343, "learning_rate": 3.70354242070695e-07, "loss": 0.7366, "step": 7014 }, { "epoch": 0.6472148541114059, "grad_norm": 1.7099757320288023, "learning_rate": 3.7018243176957266e-07, "loss": 0.6424, "step": 7015 }, { "epoch": 0.6472148541114059, "eval_GEN Loss": 0.44359835982322693, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM Loss": 0.3719659447669983, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8264723420143127, "eval_runtime": 57.2024, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7015 }, { "epoch": 0.6473071156729328, "grad_norm": 2.674935328437128, "learning_rate": 3.7001064456041936e-07, "loss": 0.6895, "step": 7016 }, { "epoch": 0.6473993772344597, "grad_norm": 1.9546583705341354, "learning_rate": 3.698388804588028e-07, "loss": 0.6549, "step": 7017 }, { "epoch": 0.6474916387959866, "grad_norm": 2.1018496556000765, "learning_rate": 3.6966713948028854e-07, "loss": 0.6199, "step": 7018 }, { "epoch": 0.6475839003575136, "grad_norm": 2.118948037001708, "learning_rate": 3.6949542164043984e-07, "loss": 0.7263, "step": 7019 }, { "epoch": 0.6476761619190404, "grad_norm": 2.147767137144004, "learning_rate": 3.693237269548184e-07, "loss": 0.6502, "step": 7020 }, { "epoch": 0.6476761619190404, "eval_GEN Loss": 0.44322073459625244, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3550911545753479, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8238882422447205, "eval_runtime": 57.0325, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7020 }, { "epoch": 0.6477684234805674, "grad_norm": 2.1619539716779563, "learning_rate": 3.691520554389831e-07, "loss": 0.5818, "step": 7021 }, { "epoch": 0.6478606850420944, "grad_norm": 2.391781599042375, "learning_rate": 3.689804071084914e-07, "loss": 0.7291, "step": 7022 }, { "epoch": 0.6479529466036212, "grad_norm": 2.7611080657701907, "learning_rate": 3.6880878197889825e-07, "loss": 0.8244, "step": 7023 }, { "epoch": 0.6480452081651482, "grad_norm": 1.3960490422859566, "learning_rate": 3.686371800657565e-07, "loss": 0.5504, "step": 7024 }, { "epoch": 0.6481374697266751, "grad_norm": 2.2906346712038492, "learning_rate": 3.6846560138461664e-07, "loss": 0.7673, "step": 7025 }, { "epoch": 0.6481374697266751, "eval_GEN Loss": 0.4436020255088806, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34808075428009033, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8231971263885498, "eval_runtime": 57.1839, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7025 }, { "epoch": 0.648229731288202, "grad_norm": 2.1329309287430602, "learning_rate": 3.6829404595102814e-07, "loss": 0.6975, "step": 7026 }, { "epoch": 0.648321992849729, "grad_norm": 2.088749654010511, "learning_rate": 3.681225137805372e-07, "loss": 0.5719, "step": 7027 }, { "epoch": 0.6484142544112559, "grad_norm": 2.2552223481823854, "learning_rate": 3.679510048886882e-07, "loss": 0.6878, "step": 7028 }, { "epoch": 0.6485065159727829, "grad_norm": 1.9544667772281665, "learning_rate": 3.67779519291024e-07, "loss": 0.7684, "step": 7029 }, { "epoch": 0.6485987775343097, "grad_norm": 1.860125392647406, "learning_rate": 3.676080570030846e-07, "loss": 0.6825, "step": 7030 }, { "epoch": 0.6485987775343097, "eval_GEN Loss": 0.44268667697906494, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33640119433403015, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8245492577552795, "eval_runtime": 57.0394, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7030 }, { "epoch": 0.6486910390958367, "grad_norm": 2.2964113164562234, "learning_rate": 3.674366180404082e-07, "loss": 0.5945, "step": 7031 }, { "epoch": 0.6487833006573637, "grad_norm": 2.3067652900086286, "learning_rate": 3.672652024185307e-07, "loss": 0.6221, "step": 7032 }, { "epoch": 0.6488755622188905, "grad_norm": 2.0568400395066515, "learning_rate": 3.670938101529865e-07, "loss": 0.7046, "step": 7033 }, { "epoch": 0.6489678237804175, "grad_norm": 2.2037563983457353, "learning_rate": 3.6692244125930714e-07, "loss": 0.5325, "step": 7034 }, { "epoch": 0.6490600853419444, "grad_norm": 1.6124502993974417, "learning_rate": 3.66751095753022e-07, "loss": 0.7536, "step": 7035 }, { "epoch": 0.6490600853419444, "eval_GEN Loss": 0.4419425129890442, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3285718858242035, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8260817527770996, "eval_runtime": 57.0126, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7035 }, { "epoch": 0.6491523469034713, "grad_norm": 2.9773191484005013, "learning_rate": 3.6657977364965946e-07, "loss": 0.8609, "step": 7036 }, { "epoch": 0.6492446084649983, "grad_norm": 1.9134037400945887, "learning_rate": 3.664084749647445e-07, "loss": 0.4566, "step": 7037 }, { "epoch": 0.6493368700265252, "grad_norm": 1.4564230336441157, "learning_rate": 3.662371997138006e-07, "loss": 0.6079, "step": 7038 }, { "epoch": 0.6494291315880522, "grad_norm": 3.1059661694003373, "learning_rate": 3.660659479123486e-07, "loss": 0.8109, "step": 7039 }, { "epoch": 0.649521393149579, "grad_norm": 1.8807201234643176, "learning_rate": 3.658947195759084e-07, "loss": 0.6313, "step": 7040 }, { "epoch": 0.649521393149579, "eval_GEN Loss": 0.442638635635376, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.32672548294067383, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8276742696762085, "eval_runtime": 57.2361, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7040 }, { "epoch": 0.649613654711106, "grad_norm": 2.10614578810029, "learning_rate": 3.657235147199964e-07, "loss": 0.7831, "step": 7041 }, { "epoch": 0.649705916272633, "grad_norm": 2.4682614252039508, "learning_rate": 3.655523333601275e-07, "loss": 0.6377, "step": 7042 }, { "epoch": 0.6497981778341598, "grad_norm": 2.2216775720365445, "learning_rate": 3.653811755118148e-07, "loss": 0.7329, "step": 7043 }, { "epoch": 0.6498904393956868, "grad_norm": 3.185605121341088, "learning_rate": 3.6521004119056845e-07, "loss": 0.8381, "step": 7044 }, { "epoch": 0.6499827009572137, "grad_norm": 2.2368502295239807, "learning_rate": 3.6503893041189717e-07, "loss": 0.6659, "step": 7045 }, { "epoch": 0.6499827009572137, "eval_GEN Loss": 0.44209805130958557, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8679245283018868, "eval_PRM F1": 0.9166666666666666, "eval_PRM F1 AUC": 0.7899423782084861, "eval_PRM F1 Neg": 0.6818181818181818, "eval_PRM Loss": 0.3273831903934479, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.9058823529411765, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8300480842590332, "eval_runtime": 57.3432, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7045 }, { "epoch": 0.6500749625187406, "grad_norm": 2.315586706648336, "learning_rate": 3.6486784319130686e-07, "loss": 0.7584, "step": 7046 }, { "epoch": 0.6501672240802676, "grad_norm": 1.988313360773803, "learning_rate": 3.646967795443025e-07, "loss": 0.7758, "step": 7047 }, { "epoch": 0.6502594856417945, "grad_norm": 1.9022630454533316, "learning_rate": 3.645257394863855e-07, "loss": 0.5691, "step": 7048 }, { "epoch": 0.6503517472033215, "grad_norm": 1.9681555079311368, "learning_rate": 3.643547230330562e-07, "loss": 0.635, "step": 7049 }, { "epoch": 0.6504440087648483, "grad_norm": 2.3266741561418605, "learning_rate": 3.6418373019981184e-07, "loss": 0.5942, "step": 7050 }, { "epoch": 0.6504440087648483, "eval_GEN Loss": 0.442396342754364, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33466023206710815, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.830979585647583, "eval_runtime": 57.023, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7050 }, { "epoch": 0.6505362703263753, "grad_norm": 1.9017722871371308, "learning_rate": 3.6401276100214844e-07, "loss": 0.6843, "step": 7051 }, { "epoch": 0.6506285318879022, "grad_norm": 2.0103810940735, "learning_rate": 3.6384181545555965e-07, "loss": 0.6992, "step": 7052 }, { "epoch": 0.6507207934494291, "grad_norm": 1.8167112387227866, "learning_rate": 3.636708935755362e-07, "loss": 0.6785, "step": 7053 }, { "epoch": 0.6508130550109561, "grad_norm": 2.0669649140722934, "learning_rate": 3.634999953775681e-07, "loss": 0.5767, "step": 7054 }, { "epoch": 0.650905316572483, "grad_norm": 1.6511096155768907, "learning_rate": 3.633291208771418e-07, "loss": 0.7029, "step": 7055 }, { "epoch": 0.650905316572483, "eval_GEN Loss": 0.4433680772781372, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33839964866638184, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8296874761581421, "eval_runtime": 57.1416, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7055 }, { "epoch": 0.6509975781340099, "grad_norm": 1.9028210391971083, "learning_rate": 3.6315827008974277e-07, "loss": 0.6008, "step": 7056 }, { "epoch": 0.6510898396955368, "grad_norm": 1.343622530172309, "learning_rate": 3.629874430308529e-07, "loss": 0.4329, "step": 7057 }, { "epoch": 0.6511821012570638, "grad_norm": 2.5530527012946664, "learning_rate": 3.628166397159539e-07, "loss": 0.6677, "step": 7058 }, { "epoch": 0.6512743628185907, "grad_norm": 2.0273664273973324, "learning_rate": 3.626458601605234e-07, "loss": 0.6413, "step": 7059 }, { "epoch": 0.6513666243801176, "grad_norm": 1.695785795852532, "learning_rate": 3.62475104380038e-07, "loss": 0.5747, "step": 7060 }, { "epoch": 0.6513666243801176, "eval_GEN Loss": 0.4426627457141876, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3423755168914795, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8307392001152039, "eval_runtime": 57.0153, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7060 }, { "epoch": 0.6514588859416446, "grad_norm": 1.9498306577564233, "learning_rate": 3.623043723899721e-07, "loss": 0.7546, "step": 7061 }, { "epoch": 0.6515511475031714, "grad_norm": 2.391439054015335, "learning_rate": 3.621336642057972e-07, "loss": 0.6895, "step": 7062 }, { "epoch": 0.6516434090646984, "grad_norm": 1.7654217792620943, "learning_rate": 3.619629798429837e-07, "loss": 0.7033, "step": 7063 }, { "epoch": 0.6517356706262254, "grad_norm": 2.1328035068865185, "learning_rate": 3.617923193169985e-07, "loss": 0.6126, "step": 7064 }, { "epoch": 0.6518279321877523, "grad_norm": 2.5724319505304973, "learning_rate": 3.616216826433081e-07, "loss": 0.6942, "step": 7065 }, { "epoch": 0.6518279321877523, "eval_GEN Loss": 0.44382020831108093, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.346279114484787, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8291466236114502, "eval_runtime": 57.3055, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7065 }, { "epoch": 0.6519201937492792, "grad_norm": 1.945472413398937, "learning_rate": 3.6145106983737514e-07, "loss": 0.7328, "step": 7066 }, { "epoch": 0.6520124553108061, "grad_norm": 1.9234552463082082, "learning_rate": 3.6128048091466113e-07, "loss": 0.6623, "step": 7067 }, { "epoch": 0.6521047168723331, "grad_norm": 2.390023903161741, "learning_rate": 3.611099158906249e-07, "loss": 0.5801, "step": 7068 }, { "epoch": 0.65219697843386, "grad_norm": 1.5498170188105265, "learning_rate": 3.6093937478072383e-07, "loss": 0.5219, "step": 7069 }, { "epoch": 0.6522892399953869, "grad_norm": 2.7814259385870685, "learning_rate": 3.607688576004119e-07, "loss": 0.8064, "step": 7070 }, { "epoch": 0.6522892399953869, "eval_GEN Loss": 0.4425585865974426, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3487868905067444, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.827073335647583, "eval_runtime": 57.1926, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7070 }, { "epoch": 0.6523815015569139, "grad_norm": 2.269085303476714, "learning_rate": 3.6059836436514207e-07, "loss": 0.7135, "step": 7071 }, { "epoch": 0.6524737631184407, "grad_norm": 1.482794851375174, "learning_rate": 3.6042789509036486e-07, "loss": 0.501, "step": 7072 }, { "epoch": 0.6525660246799677, "grad_norm": 1.8316637907213886, "learning_rate": 3.60257449791528e-07, "loss": 0.505, "step": 7073 }, { "epoch": 0.6526582862414947, "grad_norm": 2.1933519648142434, "learning_rate": 3.6008702848407775e-07, "loss": 0.765, "step": 7074 }, { "epoch": 0.6527505478030216, "grad_norm": 2.0712114570814735, "learning_rate": 3.5991663118345793e-07, "loss": 0.7274, "step": 7075 }, { "epoch": 0.6527505478030216, "eval_GEN Loss": 0.4425603747367859, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3535407781600952, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8305588960647583, "eval_runtime": 57.1825, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7075 }, { "epoch": 0.6528428093645485, "grad_norm": 1.9941009194185504, "learning_rate": 3.597462579051106e-07, "loss": 0.5085, "step": 7076 }, { "epoch": 0.6529350709260754, "grad_norm": 1.39261259372122, "learning_rate": 3.5957590866447456e-07, "loss": 0.6178, "step": 7077 }, { "epoch": 0.6530273324876024, "grad_norm": 2.52866763701526, "learning_rate": 3.5940558347698747e-07, "loss": 0.8076, "step": 7078 }, { "epoch": 0.6531195940491292, "grad_norm": 1.491131187173305, "learning_rate": 3.592352823580844e-07, "loss": 0.5478, "step": 7079 }, { "epoch": 0.6532118556106562, "grad_norm": 2.051220277531708, "learning_rate": 3.5906500532319864e-07, "loss": 0.6371, "step": 7080 }, { "epoch": 0.6532118556106562, "eval_GEN Loss": 0.4416806995868683, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35473790764808655, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.832301676273346, "eval_runtime": 57.3524, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7080 }, { "epoch": 0.6533041171721832, "grad_norm": 1.9947122725981166, "learning_rate": 3.588947523877605e-07, "loss": 0.5609, "step": 7081 }, { "epoch": 0.65339637873371, "grad_norm": 2.186913465067447, "learning_rate": 3.5872452356719864e-07, "loss": 0.769, "step": 7082 }, { "epoch": 0.653488640295237, "grad_norm": 1.7010324926413203, "learning_rate": 3.585543188769397e-07, "loss": 0.7084, "step": 7083 }, { "epoch": 0.6535809018567639, "grad_norm": 2.54897847162982, "learning_rate": 3.58384138332408e-07, "loss": 0.7864, "step": 7084 }, { "epoch": 0.6536731634182908, "grad_norm": 1.8544518952454112, "learning_rate": 3.5821398194902505e-07, "loss": 0.5963, "step": 7085 }, { "epoch": 0.6536731634182908, "eval_GEN Loss": 0.4414001703262329, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35758525133132935, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8356069922447205, "eval_runtime": 57.0958, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7085 }, { "epoch": 0.6537654249798178, "grad_norm": 2.2100637286356846, "learning_rate": 3.5804384974221107e-07, "loss": 0.6858, "step": 7086 }, { "epoch": 0.6538576865413447, "grad_norm": 1.2883037280044964, "learning_rate": 3.578737417273837e-07, "loss": 0.6213, "step": 7087 }, { "epoch": 0.6539499481028717, "grad_norm": 1.4258589357282945, "learning_rate": 3.5770365791995815e-07, "loss": 0.5801, "step": 7088 }, { "epoch": 0.6540422096643985, "grad_norm": 2.1470244578681674, "learning_rate": 3.575335983353479e-07, "loss": 0.6906, "step": 7089 }, { "epoch": 0.6541344712259255, "grad_norm": 3.811245982346856, "learning_rate": 3.5736356298896393e-07, "loss": 0.8622, "step": 7090 }, { "epoch": 0.6541344712259255, "eval_GEN Loss": 0.44165563583374023, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36139658093452454, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.831250011920929, "eval_runtime": 57.2621, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7090 }, { "epoch": 0.6542267327874525, "grad_norm": 2.731963845302036, "learning_rate": 3.5719355189621544e-07, "loss": 0.6746, "step": 7091 }, { "epoch": 0.6543189943489793, "grad_norm": 1.9447655278546574, "learning_rate": 3.5702356507250826e-07, "loss": 0.5568, "step": 7092 }, { "epoch": 0.6544112559105063, "grad_norm": 2.09963588203779, "learning_rate": 3.5685360253324796e-07, "loss": 0.65, "step": 7093 }, { "epoch": 0.6545035174720332, "grad_norm": 1.6273385708489903, "learning_rate": 3.5668366429383593e-07, "loss": 0.422, "step": 7094 }, { "epoch": 0.6545957790335601, "grad_norm": 1.9156045157413641, "learning_rate": 3.565137503696729e-07, "loss": 0.4612, "step": 7095 }, { "epoch": 0.6545957790335601, "eval_GEN Loss": 0.4409220218658447, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.36107906699180603, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8297476172447205, "eval_runtime": 57.1058, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7095 }, { "epoch": 0.6546880405950871, "grad_norm": 2.100745661305946, "learning_rate": 3.5634386077615614e-07, "loss": 0.6859, "step": 7096 }, { "epoch": 0.654780302156614, "grad_norm": 2.036779372563396, "learning_rate": 3.5617399552868163e-07, "loss": 0.6168, "step": 7097 }, { "epoch": 0.654872563718141, "grad_norm": 2.7189066944231586, "learning_rate": 3.56004154642643e-07, "loss": 0.8286, "step": 7098 }, { "epoch": 0.6549648252796678, "grad_norm": 1.2234214806251735, "learning_rate": 3.558343381334308e-07, "loss": 0.5256, "step": 7099 }, { "epoch": 0.6550570868411948, "grad_norm": 3.422383250889879, "learning_rate": 3.55664546016435e-07, "loss": 0.753, "step": 7100 }, { "epoch": 0.6550570868411948, "eval_GEN Loss": 0.4405077397823334, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3588952422142029, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8282752633094788, "eval_runtime": 57.2016, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7100 }, { "epoch": 0.6551493484027218, "grad_norm": 2.640648027564156, "learning_rate": 3.5549477830704186e-07, "loss": 0.679, "step": 7101 }, { "epoch": 0.6552416099642486, "grad_norm": 2.5946865631063964, "learning_rate": 3.5532503502063625e-07, "loss": 0.7133, "step": 7102 }, { "epoch": 0.6553338715257756, "grad_norm": 1.6918178143444889, "learning_rate": 3.551553161725999e-07, "loss": 0.6466, "step": 7103 }, { "epoch": 0.6554261330873025, "grad_norm": 2.850369785645166, "learning_rate": 3.5498562177831415e-07, "loss": 0.5881, "step": 7104 }, { "epoch": 0.6555183946488294, "grad_norm": 1.8925431574005347, "learning_rate": 3.54815951853156e-07, "loss": 0.5175, "step": 7105 }, { "epoch": 0.6555183946488294, "eval_GEN Loss": 0.4395768940448761, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35387974977493286, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8239783644676208, "eval_runtime": 57.2488, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7105 }, { "epoch": 0.6556106562103564, "grad_norm": 1.7891133259215901, "learning_rate": 3.5464630641250193e-07, "loss": 0.7424, "step": 7106 }, { "epoch": 0.6557029177718833, "grad_norm": 2.1321597487105266, "learning_rate": 3.544766854717248e-07, "loss": 0.6351, "step": 7107 }, { "epoch": 0.6557951793334102, "grad_norm": 2.1532278272521865, "learning_rate": 3.543070890461963e-07, "loss": 0.4008, "step": 7108 }, { "epoch": 0.6558874408949371, "grad_norm": 3.0473895628359715, "learning_rate": 3.5413751715128544e-07, "loss": 0.5124, "step": 7109 }, { "epoch": 0.6559797024564641, "grad_norm": 2.1457801353921275, "learning_rate": 3.539679698023591e-07, "loss": 0.7241, "step": 7110 }, { "epoch": 0.6559797024564641, "eval_GEN Loss": 0.43975916504859924, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3444506525993347, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8225961327552795, "eval_runtime": 57.0788, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7110 }, { "epoch": 0.656071964017991, "grad_norm": 1.8005883756927707, "learning_rate": 3.537984470147822e-07, "loss": 0.6283, "step": 7111 }, { "epoch": 0.6561642255795179, "grad_norm": 1.3481559971952128, "learning_rate": 3.536289488039167e-07, "loss": 0.5086, "step": 7112 }, { "epoch": 0.6562564871410449, "grad_norm": 1.6735287504736098, "learning_rate": 3.534594751851232e-07, "loss": 0.5412, "step": 7113 }, { "epoch": 0.6563487487025718, "grad_norm": 2.4235341875319403, "learning_rate": 3.53290026173759e-07, "loss": 0.7012, "step": 7114 }, { "epoch": 0.6564410102640987, "grad_norm": 3.292910275615613, "learning_rate": 3.5312060178518084e-07, "loss": 0.7874, "step": 7115 }, { "epoch": 0.6564410102640987, "eval_GEN Loss": 0.43952465057373047, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33753469586372375, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8225660920143127, "eval_runtime": 57.2382, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7115 }, { "epoch": 0.6565332718256256, "grad_norm": 1.6725609439534956, "learning_rate": 3.5295120203474133e-07, "loss": 0.5497, "step": 7116 }, { "epoch": 0.6566255333871526, "grad_norm": 1.8703751975891745, "learning_rate": 3.5278182693779223e-07, "loss": 0.5541, "step": 7117 }, { "epoch": 0.6567177949486795, "grad_norm": 2.323753557267934, "learning_rate": 3.5261247650968234e-07, "loss": 0.6113, "step": 7118 }, { "epoch": 0.6568100565102064, "grad_norm": 1.7268445370132732, "learning_rate": 3.5244315076575886e-07, "loss": 0.6596, "step": 7119 }, { "epoch": 0.6569023180717334, "grad_norm": 3.249569212136461, "learning_rate": 3.522738497213659e-07, "loss": 0.9201, "step": 7120 }, { "epoch": 0.6569023180717334, "eval_GEN Loss": 0.43937167525291443, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33523836731910706, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8177884817123413, "eval_runtime": 57.0982, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7120 }, { "epoch": 0.6569945796332602, "grad_norm": 1.9028262922108932, "learning_rate": 3.5210457339184586e-07, "loss": 0.6254, "step": 7121 }, { "epoch": 0.6570868411947872, "grad_norm": 2.7499654755297227, "learning_rate": 3.519353217925392e-07, "loss": 0.6065, "step": 7122 }, { "epoch": 0.6571791027563142, "grad_norm": 1.9647998563266142, "learning_rate": 3.517660949387833e-07, "loss": 0.4432, "step": 7123 }, { "epoch": 0.6572713643178411, "grad_norm": 2.04327573607519, "learning_rate": 3.515968928459139e-07, "loss": 0.5383, "step": 7124 }, { "epoch": 0.657363625879368, "grad_norm": 1.5999739244977873, "learning_rate": 3.5142771552926434e-07, "loss": 0.6246, "step": 7125 }, { "epoch": 0.657363625879368, "eval_GEN Loss": 0.43918535113334656, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3359406292438507, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8197716474533081, "eval_runtime": 57.2094, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7125 }, { "epoch": 0.6574558874408949, "grad_norm": 4.06663176845447, "learning_rate": 3.5125856300416614e-07, "loss": 0.8587, "step": 7126 }, { "epoch": 0.6575481490024219, "grad_norm": 2.284504851840799, "learning_rate": 3.510894352859476e-07, "loss": 0.6474, "step": 7127 }, { "epoch": 0.6576404105639488, "grad_norm": 2.4564189905711595, "learning_rate": 3.509203323899356e-07, "loss": 0.701, "step": 7128 }, { "epoch": 0.6577326721254757, "grad_norm": 1.742603429902193, "learning_rate": 3.5075125433145435e-07, "loss": 0.6436, "step": 7129 }, { "epoch": 0.6578249336870027, "grad_norm": 2.709097293634501, "learning_rate": 3.505822011258264e-07, "loss": 0.8386, "step": 7130 }, { "epoch": 0.6578249336870027, "eval_GEN Loss": 0.4389955401420593, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3385639190673828, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.817187488079071, "eval_runtime": 56.9815, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 7130 }, { "epoch": 0.6579171952485295, "grad_norm": 2.9945832754040724, "learning_rate": 3.504131727883712e-07, "loss": 0.7595, "step": 7131 }, { "epoch": 0.6580094568100565, "grad_norm": 2.4551925478627967, "learning_rate": 3.5024416933440636e-07, "loss": 0.4913, "step": 7132 }, { "epoch": 0.6581017183715835, "grad_norm": 6.712113554296502, "learning_rate": 3.500751907792477e-07, "loss": 0.7018, "step": 7133 }, { "epoch": 0.6581939799331104, "grad_norm": 3.320622812274592, "learning_rate": 3.4990623713820766e-07, "loss": 0.8391, "step": 7134 }, { "epoch": 0.6582862414946373, "grad_norm": 2.2412244238258836, "learning_rate": 3.4973730842659743e-07, "loss": 0.6649, "step": 7135 }, { "epoch": 0.6582862414946373, "eval_GEN Loss": 0.44000011682510376, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33913418650627136, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8198016881942749, "eval_runtime": 56.1413, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 7135 }, { "epoch": 0.6583785030561642, "grad_norm": 1.5340113051503232, "learning_rate": 3.4956840465972565e-07, "loss": 0.5729, "step": 7136 }, { "epoch": 0.6584707646176912, "grad_norm": 2.177894368576042, "learning_rate": 3.4939952585289877e-07, "loss": 0.7387, "step": 7137 }, { "epoch": 0.6585630261792181, "grad_norm": 3.2586781759069243, "learning_rate": 3.492306720214204e-07, "loss": 0.8101, "step": 7138 }, { "epoch": 0.658655287740745, "grad_norm": 2.170184350208145, "learning_rate": 3.490618431805927e-07, "loss": 0.6729, "step": 7139 }, { "epoch": 0.658747549302272, "grad_norm": 4.651327480307535, "learning_rate": 3.48893039345715e-07, "loss": 0.532, "step": 7140 }, { "epoch": 0.658747549302272, "eval_GEN Loss": 0.4399470090866089, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3439910113811493, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.82421875, "eval_runtime": 56.0964, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 7140 }, { "epoch": 0.6588398108637988, "grad_norm": 2.851873523386678, "learning_rate": 3.4872426053208493e-07, "loss": 0.8703, "step": 7141 }, { "epoch": 0.6589320724253258, "grad_norm": 1.4189799639667129, "learning_rate": 3.48555506754997e-07, "loss": 0.5514, "step": 7142 }, { "epoch": 0.6590243339868527, "grad_norm": 1.8238674994488204, "learning_rate": 3.4838677802974417e-07, "loss": 0.5517, "step": 7143 }, { "epoch": 0.6591165955483796, "grad_norm": 2.0631112884439626, "learning_rate": 3.482180743716172e-07, "loss": 0.6205, "step": 7144 }, { "epoch": 0.6592088571099066, "grad_norm": 2.603184329434478, "learning_rate": 3.4804939579590373e-07, "loss": 0.6037, "step": 7145 }, { "epoch": 0.6592088571099066, "eval_GEN Loss": 0.44025281071662903, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3469075560569763, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8275841474533081, "eval_runtime": 56.188, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 7145 }, { "epoch": 0.6593011186714335, "grad_norm": 2.058918460801519, "learning_rate": 3.478807423178899e-07, "loss": 0.6499, "step": 7146 }, { "epoch": 0.6593933802329605, "grad_norm": 2.01771048832108, "learning_rate": 3.477121139528594e-07, "loss": 0.6198, "step": 7147 }, { "epoch": 0.6594856417944873, "grad_norm": 2.8478109374329565, "learning_rate": 3.4754351071609386e-07, "loss": 0.5184, "step": 7148 }, { "epoch": 0.6595779033560143, "grad_norm": 2.052705132100747, "learning_rate": 3.473749326228716e-07, "loss": 0.6323, "step": 7149 }, { "epoch": 0.6596701649175413, "grad_norm": 2.1563375019326494, "learning_rate": 3.4720637968847043e-07, "loss": 0.7789, "step": 7150 }, { "epoch": 0.6596701649175413, "eval_GEN Loss": 0.4399755895137787, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3496460020542145, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8328725695610046, "eval_runtime": 56.031, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 7150 }, { "epoch": 0.6597624264790681, "grad_norm": 2.1773086318167882, "learning_rate": 3.4703785192816415e-07, "loss": 0.7853, "step": 7151 }, { "epoch": 0.6598546880405951, "grad_norm": 2.46343123579161, "learning_rate": 3.4686934935722545e-07, "loss": 0.6732, "step": 7152 }, { "epoch": 0.659946949602122, "grad_norm": 3.970062408974716, "learning_rate": 3.4670087199092366e-07, "loss": 0.615, "step": 7153 }, { "epoch": 0.6600392111636489, "grad_norm": 3.0543891995483485, "learning_rate": 3.465324198445273e-07, "loss": 0.7491, "step": 7154 }, { "epoch": 0.6601314727251759, "grad_norm": 1.5921356678936316, "learning_rate": 3.4636399293330126e-07, "loss": 0.4979, "step": 7155 }, { "epoch": 0.6601314727251759, "eval_GEN Loss": 0.4403335750102997, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35511642694473267, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8378305435180664, "eval_runtime": 56.0906, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 7155 }, { "epoch": 0.6602237342867028, "grad_norm": 2.382792883250842, "learning_rate": 3.4619559127250867e-07, "loss": 0.8325, "step": 7156 }, { "epoch": 0.6603159958482298, "grad_norm": 2.666968171479925, "learning_rate": 3.4602721487741077e-07, "loss": 0.6875, "step": 7157 }, { "epoch": 0.6604082574097566, "grad_norm": 2.0855892629581176, "learning_rate": 3.4585886376326537e-07, "loss": 0.5807, "step": 7158 }, { "epoch": 0.6605005189712836, "grad_norm": 2.003149376711615, "learning_rate": 3.4569053794532944e-07, "loss": 0.693, "step": 7159 }, { "epoch": 0.6605927805328106, "grad_norm": 1.9638578991583047, "learning_rate": 3.4552223743885614e-07, "loss": 0.7237, "step": 7160 }, { "epoch": 0.6605927805328106, "eval_GEN Loss": 0.4408080279827118, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3646101951599121, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8400240540504456, "eval_runtime": 55.9426, "eval_samples_per_second": 1.162, "eval_steps_per_second": 0.089, "step": 7160 }, { "epoch": 0.6606850420943374, "grad_norm": 2.167453686410967, "learning_rate": 3.4535396225909804e-07, "loss": 0.6294, "step": 7161 }, { "epoch": 0.6607773036558644, "grad_norm": 2.1610401499430405, "learning_rate": 3.4518571242130386e-07, "loss": 0.6245, "step": 7162 }, { "epoch": 0.6608695652173913, "grad_norm": 3.0353778827244025, "learning_rate": 3.450174879407208e-07, "loss": 0.9115, "step": 7163 }, { "epoch": 0.6609618267789182, "grad_norm": 2.496341309948299, "learning_rate": 3.448492888325937e-07, "loss": 0.8443, "step": 7164 }, { "epoch": 0.6610540883404452, "grad_norm": 2.5344444458180275, "learning_rate": 3.446811151121653e-07, "loss": 0.6477, "step": 7165 }, { "epoch": 0.6610540883404452, "eval_GEN Loss": 0.439966082572937, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3648792505264282, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8390925526618958, "eval_runtime": 56.2571, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 7165 }, { "epoch": 0.6611463499019721, "grad_norm": 2.566174868225515, "learning_rate": 3.445129667946751e-07, "loss": 0.582, "step": 7166 }, { "epoch": 0.661238611463499, "grad_norm": 1.9282290693274957, "learning_rate": 3.4434484389536143e-07, "loss": 0.6817, "step": 7167 }, { "epoch": 0.6613308730250259, "grad_norm": 1.8911425995144888, "learning_rate": 3.4417674642946e-07, "loss": 0.7057, "step": 7168 }, { "epoch": 0.6614231345865529, "grad_norm": 1.7166817180719822, "learning_rate": 3.4400867441220364e-07, "loss": 0.6852, "step": 7169 }, { "epoch": 0.6615153961480799, "grad_norm": 1.432645437262314, "learning_rate": 3.438406278588237e-07, "loss": 0.6751, "step": 7170 }, { "epoch": 0.6615153961480799, "eval_GEN Loss": 0.44133225083351135, "eval_GEN top-5 accuracy": 0.9820254274441035, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3662448525428772, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8451622724533081, "eval_runtime": 56.1788, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 7170 }, { "epoch": 0.6616076577096067, "grad_norm": 1.993680495792798, "learning_rate": 3.4367260678454805e-07, "loss": 0.6959, "step": 7171 }, { "epoch": 0.6616999192711337, "grad_norm": 3.1246987221129334, "learning_rate": 3.435046112046042e-07, "loss": 0.6016, "step": 7172 }, { "epoch": 0.6617921808326606, "grad_norm": 2.172113305846554, "learning_rate": 3.433366411342152e-07, "loss": 0.6514, "step": 7173 }, { "epoch": 0.6618844423941875, "grad_norm": 2.445366641773958, "learning_rate": 3.4316869658860325e-07, "loss": 0.8378, "step": 7174 }, { "epoch": 0.6619767039557144, "grad_norm": 1.859024141003589, "learning_rate": 3.430007775829875e-07, "loss": 0.6818, "step": 7175 }, { "epoch": 0.6619767039557144, "eval_GEN Loss": 0.4410001039505005, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3607403635978699, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8466646671295166, "eval_runtime": 55.9089, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 7175 }, { "epoch": 0.6620689655172414, "grad_norm": 2.554311280703326, "learning_rate": 3.428328841325855e-07, "loss": 0.6385, "step": 7176 }, { "epoch": 0.6621612270787683, "grad_norm": 2.2130713089051044, "learning_rate": 3.4266501625261144e-07, "loss": 0.5947, "step": 7177 }, { "epoch": 0.6622534886402952, "grad_norm": 1.9028108872414828, "learning_rate": 3.424971739582779e-07, "loss": 0.7151, "step": 7178 }, { "epoch": 0.6623457502018222, "grad_norm": 3.294980322603667, "learning_rate": 3.4232935726479544e-07, "loss": 0.568, "step": 7179 }, { "epoch": 0.662438011763349, "grad_norm": 1.775805351939078, "learning_rate": 3.421615661873713e-07, "loss": 0.5258, "step": 7180 }, { "epoch": 0.662438011763349, "eval_GEN Loss": 0.44123920798301697, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.358398973941803, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8454026579856873, "eval_runtime": 56.099, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 7180 }, { "epoch": 0.662530273324876, "grad_norm": 1.9184846898756907, "learning_rate": 3.4199380074121124e-07, "loss": 0.6179, "step": 7181 }, { "epoch": 0.662622534886403, "grad_norm": 2.2612670879527115, "learning_rate": 3.418260609415184e-07, "loss": 0.4956, "step": 7182 }, { "epoch": 0.6627147964479299, "grad_norm": 1.6704436712561899, "learning_rate": 3.4165834680349385e-07, "loss": 0.5711, "step": 7183 }, { "epoch": 0.6628070580094568, "grad_norm": 1.9674052509174313, "learning_rate": 3.4149065834233565e-07, "loss": 0.7211, "step": 7184 }, { "epoch": 0.6628993195709837, "grad_norm": 1.632044646936736, "learning_rate": 3.4132299557324035e-07, "loss": 0.5894, "step": 7185 }, { "epoch": 0.6628993195709837, "eval_GEN Loss": 0.4401538670063019, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35795632004737854, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8447115421295166, "eval_runtime": 56.0935, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 7185 }, { "epoch": 0.6629915811325107, "grad_norm": 2.019245290225633, "learning_rate": 3.411553585114016e-07, "loss": 0.7691, "step": 7186 }, { "epoch": 0.6630838426940376, "grad_norm": 2.4132385316400766, "learning_rate": 3.4098774717201134e-07, "loss": 0.6529, "step": 7187 }, { "epoch": 0.6631761042555645, "grad_norm": 1.651176097862046, "learning_rate": 3.4082016157025816e-07, "loss": 0.5749, "step": 7188 }, { "epoch": 0.6632683658170915, "grad_norm": 2.129231152039032, "learning_rate": 3.406526017213294e-07, "loss": 0.7074, "step": 7189 }, { "epoch": 0.6633606273786183, "grad_norm": 1.9551614468900973, "learning_rate": 3.404850676404093e-07, "loss": 0.6842, "step": 7190 }, { "epoch": 0.6633606273786183, "eval_GEN Loss": 0.4407082200050354, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.35482141375541687, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8442007303237915, "eval_runtime": 56.1604, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 7190 }, { "epoch": 0.6634528889401453, "grad_norm": 1.791790235596892, "learning_rate": 3.403175593426805e-07, "loss": 0.7458, "step": 7191 }, { "epoch": 0.6635451505016723, "grad_norm": 2.3741367734551457, "learning_rate": 3.401500768433223e-07, "loss": 0.7354, "step": 7192 }, { "epoch": 0.6636374120631992, "grad_norm": 2.065355784586665, "learning_rate": 3.3998262015751253e-07, "loss": 0.5731, "step": 7193 }, { "epoch": 0.6637296736247261, "grad_norm": 1.5360285848173592, "learning_rate": 3.3981518930042655e-07, "loss": 0.6248, "step": 7194 }, { "epoch": 0.663821935186253, "grad_norm": 2.49504983219662, "learning_rate": 3.396477842872367e-07, "loss": 0.6905, "step": 7195 }, { "epoch": 0.663821935186253, "eval_GEN Loss": 0.43963727355003357, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3484777510166168, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.840114176273346, "eval_runtime": 56.3054, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 7195 }, { "epoch": 0.66391419674778, "grad_norm": 1.8198723709216065, "learning_rate": 3.3948040513311393e-07, "loss": 0.6258, "step": 7196 }, { "epoch": 0.6640064583093069, "grad_norm": 1.5009190801852939, "learning_rate": 3.393130518532262e-07, "loss": 0.4738, "step": 7197 }, { "epoch": 0.6640987198708338, "grad_norm": 1.7579970125410358, "learning_rate": 3.391457244627396e-07, "loss": 0.5693, "step": 7198 }, { "epoch": 0.6641909814323608, "grad_norm": 2.632863063390211, "learning_rate": 3.389784229768169e-07, "loss": 0.6739, "step": 7199 }, { "epoch": 0.6642832429938876, "grad_norm": 2.485701614864057, "learning_rate": 3.388111474106202e-07, "loss": 0.4971, "step": 7200 }, { "epoch": 0.6642832429938876, "eval_GEN Loss": 0.4400278925895691, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3426014184951782, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8384014368057251, "eval_runtime": 55.9024, "eval_samples_per_second": 1.163, "eval_steps_per_second": 0.089, "step": 7200 }, { "epoch": 0.6643755045554146, "grad_norm": 1.5457231912094136, "learning_rate": 3.3864389777930766e-07, "loss": 0.556, "step": 7201 }, { "epoch": 0.6644677661169416, "grad_norm": 1.7022704489611826, "learning_rate": 3.3847667409803597e-07, "loss": 0.5342, "step": 7202 }, { "epoch": 0.6645600276784684, "grad_norm": 2.4930490067314772, "learning_rate": 3.383094763819589e-07, "loss": 0.7472, "step": 7203 }, { "epoch": 0.6646522892399954, "grad_norm": 1.6417678955031285, "learning_rate": 3.381423046462283e-07, "loss": 0.6762, "step": 7204 }, { "epoch": 0.6647445508015223, "grad_norm": 2.994510468797089, "learning_rate": 3.3797515890599377e-07, "loss": 0.8475, "step": 7205 }, { "epoch": 0.6647445508015223, "eval_GEN Loss": 0.4406188428401947, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.340400367975235, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8418569564819336, "eval_runtime": 56.3094, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 7205 }, { "epoch": 0.6648368123630493, "grad_norm": 2.2543938700769317, "learning_rate": 3.3780803917640166e-07, "loss": 0.7601, "step": 7206 }, { "epoch": 0.6649290739245761, "grad_norm": 3.2707792613492512, "learning_rate": 3.376409454725976e-07, "loss": 0.7129, "step": 7207 }, { "epoch": 0.6650213354861031, "grad_norm": 1.8619154432354972, "learning_rate": 3.3747387780972305e-07, "loss": 0.7787, "step": 7208 }, { "epoch": 0.6651135970476301, "grad_norm": 1.7338150309071243, "learning_rate": 3.373068362029186e-07, "loss": 0.7068, "step": 7209 }, { "epoch": 0.6652058586091569, "grad_norm": 1.7741494842451784, "learning_rate": 3.37139820667321e-07, "loss": 0.7956, "step": 7210 }, { "epoch": 0.6652058586091569, "eval_GEN Loss": 0.4402611255645752, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.341167688369751, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8375901579856873, "eval_runtime": 57.0048, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7210 }, { "epoch": 0.6652981201706839, "grad_norm": 2.1046582983328266, "learning_rate": 3.3697283121806644e-07, "loss": 0.6297, "step": 7211 }, { "epoch": 0.6653903817322108, "grad_norm": 1.745795296597955, "learning_rate": 3.368058678702869e-07, "loss": 0.6863, "step": 7212 }, { "epoch": 0.6654826432937377, "grad_norm": 2.17046124300048, "learning_rate": 3.3663893063911337e-07, "loss": 0.6514, "step": 7213 }, { "epoch": 0.6655749048552647, "grad_norm": 1.691837063732146, "learning_rate": 3.364720195396741e-07, "loss": 0.6205, "step": 7214 }, { "epoch": 0.6656671664167916, "grad_norm": 1.5960444833219352, "learning_rate": 3.3630513458709426e-07, "loss": 0.6098, "step": 7215 }, { "epoch": 0.6656671664167916, "eval_GEN Loss": 0.4404049515724182, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.34245195984840393, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8365985751152039, "eval_runtime": 57.0098, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7215 }, { "epoch": 0.6657594279783186, "grad_norm": 2.7911700735618714, "learning_rate": 3.3613827579649783e-07, "loss": 0.6878, "step": 7216 }, { "epoch": 0.6658516895398454, "grad_norm": 1.4322975845255064, "learning_rate": 3.3597144318300497e-07, "loss": 0.5283, "step": 7217 }, { "epoch": 0.6659439511013724, "grad_norm": 1.7341655651795729, "learning_rate": 3.358046367617354e-07, "loss": 0.7412, "step": 7218 }, { "epoch": 0.6660362126628994, "grad_norm": 2.119260546935961, "learning_rate": 3.3563785654780454e-07, "loss": 0.6838, "step": 7219 }, { "epoch": 0.6661284742244262, "grad_norm": 1.7065522265155018, "learning_rate": 3.3547110255632663e-07, "loss": 0.6656, "step": 7220 }, { "epoch": 0.6661284742244262, "eval_GEN Loss": 0.4404602646827698, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.34237703680992126, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8308894038200378, "eval_runtime": 56.1572, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 7220 }, { "epoch": 0.6662207357859532, "grad_norm": 1.7929355686334842, "learning_rate": 3.353043748024132e-07, "loss": 0.7469, "step": 7221 }, { "epoch": 0.6663129973474801, "grad_norm": 1.8984499008806701, "learning_rate": 3.3513767330117347e-07, "loss": 0.7889, "step": 7222 }, { "epoch": 0.666405258909007, "grad_norm": 2.4324519959761064, "learning_rate": 3.349709980677138e-07, "loss": 0.7208, "step": 7223 }, { "epoch": 0.666497520470534, "grad_norm": 2.716031319701419, "learning_rate": 3.348043491171388e-07, "loss": 0.7457, "step": 7224 }, { "epoch": 0.6665897820320609, "grad_norm": 1.4884769904678798, "learning_rate": 3.346377264645505e-07, "loss": 0.6689, "step": 7225 }, { "epoch": 0.6665897820320609, "eval_GEN Loss": 0.4404135048389435, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.34092220664024353, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8283053040504456, "eval_runtime": 56.5584, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 7225 }, { "epoch": 0.6666820435935878, "grad_norm": 2.083429080384654, "learning_rate": 3.344711301250486e-07, "loss": 0.7689, "step": 7226 }, { "epoch": 0.6667743051551147, "grad_norm": 1.5739446916605002, "learning_rate": 3.3430456011373e-07, "loss": 0.5456, "step": 7227 }, { "epoch": 0.6668665667166417, "grad_norm": 2.454675481970567, "learning_rate": 3.341380164456898e-07, "loss": 0.853, "step": 7228 }, { "epoch": 0.6669588282781687, "grad_norm": 1.7979149283560283, "learning_rate": 3.339714991360205e-07, "loss": 0.5283, "step": 7229 }, { "epoch": 0.6670510898396955, "grad_norm": 1.9843375882726988, "learning_rate": 3.338050081998119e-07, "loss": 0.5892, "step": 7230 }, { "epoch": 0.6670510898396955, "eval_GEN Loss": 0.4393016993999481, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33484211564064026, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8243990540504456, "eval_runtime": 56.5475, "eval_samples_per_second": 1.149, "eval_steps_per_second": 0.088, "step": 7230 }, { "epoch": 0.6671433514012225, "grad_norm": 3.4188395755290157, "learning_rate": 3.336385436521517e-07, "loss": 0.9204, "step": 7231 }, { "epoch": 0.6672356129627494, "grad_norm": 1.320655319814427, "learning_rate": 3.3347210550812537e-07, "loss": 0.5734, "step": 7232 }, { "epoch": 0.6673278745242763, "grad_norm": 1.3071325863682002, "learning_rate": 3.3330569378281594e-07, "loss": 0.5291, "step": 7233 }, { "epoch": 0.6674201360858033, "grad_norm": 2.3380409267771998, "learning_rate": 3.331393084913034e-07, "loss": 0.7155, "step": 7234 }, { "epoch": 0.6675123976473302, "grad_norm": 2.4200263081209035, "learning_rate": 3.329729496486661e-07, "loss": 0.7082, "step": 7235 }, { "epoch": 0.6675123976473302, "eval_GEN Loss": 0.43893539905548096, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33223652839660645, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8214543461799622, "eval_runtime": 56.1723, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 7235 }, { "epoch": 0.6676046592088571, "grad_norm": 1.5852830876391335, "learning_rate": 3.328066172699798e-07, "loss": 0.6918, "step": 7236 }, { "epoch": 0.667696920770384, "grad_norm": 2.414317081005227, "learning_rate": 3.3264031137031805e-07, "loss": 0.762, "step": 7237 }, { "epoch": 0.667789182331911, "grad_norm": 1.783960347900038, "learning_rate": 3.324740319647511e-07, "loss": 0.6722, "step": 7238 }, { "epoch": 0.6678814438934378, "grad_norm": 1.9922874795074634, "learning_rate": 3.323077790683479e-07, "loss": 0.7413, "step": 7239 }, { "epoch": 0.6679737054549648, "grad_norm": 1.8907067306149294, "learning_rate": 3.3214155269617466e-07, "loss": 0.6527, "step": 7240 }, { "epoch": 0.6679737054549648, "eval_GEN Loss": 0.4375043213367462, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3316052258014679, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8231971263885498, "eval_runtime": 56.0357, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 7240 }, { "epoch": 0.6680659670164918, "grad_norm": 2.4468597726272274, "learning_rate": 3.319753528632947e-07, "loss": 0.7997, "step": 7241 }, { "epoch": 0.6681582285780187, "grad_norm": 2.124394631007664, "learning_rate": 3.3180917958476946e-07, "loss": 0.5731, "step": 7242 }, { "epoch": 0.6682504901395456, "grad_norm": 2.365140248679982, "learning_rate": 3.3164303287565785e-07, "loss": 0.54, "step": 7243 }, { "epoch": 0.6683427517010725, "grad_norm": 1.5337748708399321, "learning_rate": 3.314769127510166e-07, "loss": 0.5415, "step": 7244 }, { "epoch": 0.6684350132625995, "grad_norm": 2.338350520946948, "learning_rate": 3.31310819225899e-07, "loss": 0.5879, "step": 7245 }, { "epoch": 0.6684350132625995, "eval_GEN Loss": 0.43688949942588806, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32841745018959045, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8158053159713745, "eval_runtime": 56.3685, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 7245 }, { "epoch": 0.6685272748241264, "grad_norm": 1.8182429244445524, "learning_rate": 3.3114475231535785e-07, "loss": 0.6743, "step": 7246 }, { "epoch": 0.6686195363856533, "grad_norm": 1.694996972637084, "learning_rate": 3.309787120344414e-07, "loss": 0.6844, "step": 7247 }, { "epoch": 0.6687117979471803, "grad_norm": 3.2966742271103526, "learning_rate": 3.3081269839819715e-07, "loss": 0.686, "step": 7248 }, { "epoch": 0.6688040595087071, "grad_norm": 1.8468302325881407, "learning_rate": 3.30646711421669e-07, "loss": 0.5875, "step": 7249 }, { "epoch": 0.6688963210702341, "grad_norm": 2.8725737289069873, "learning_rate": 3.3048075111989916e-07, "loss": 0.8703, "step": 7250 }, { "epoch": 0.6688963210702341, "eval_GEN Loss": 0.4373444616794586, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32913103699684143, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.811718761920929, "eval_runtime": 56.1095, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 7250 }, { "epoch": 0.6689885826317611, "grad_norm": 1.5507872506840004, "learning_rate": 3.303148175079275e-07, "loss": 0.4965, "step": 7251 }, { "epoch": 0.669080844193288, "grad_norm": 1.9167238386192285, "learning_rate": 3.3014891060079046e-07, "loss": 0.5758, "step": 7252 }, { "epoch": 0.6691731057548149, "grad_norm": 1.867487629314167, "learning_rate": 3.2998303041352363e-07, "loss": 0.7669, "step": 7253 }, { "epoch": 0.6692653673163418, "grad_norm": 2.0322767614254307, "learning_rate": 3.2981717696115883e-07, "loss": 0.7128, "step": 7254 }, { "epoch": 0.6693576288778688, "grad_norm": 1.790002636190558, "learning_rate": 3.296513502587262e-07, "loss": 0.5387, "step": 7255 }, { "epoch": 0.6693576288778688, "eval_GEN Loss": 0.43801310658454895, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33274394273757935, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8096754550933838, "eval_runtime": 56.3343, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 7255 }, { "epoch": 0.6694498904393957, "grad_norm": 1.5682020815427458, "learning_rate": 3.294855503212527e-07, "loss": 0.4681, "step": 7256 }, { "epoch": 0.6695421520009226, "grad_norm": 2.3067326744696426, "learning_rate": 3.293197771637642e-07, "loss": 0.6502, "step": 7257 }, { "epoch": 0.6696344135624496, "grad_norm": 2.4844754828733646, "learning_rate": 3.291540308012827e-07, "loss": 0.758, "step": 7258 }, { "epoch": 0.6697266751239764, "grad_norm": 1.8107878369844348, "learning_rate": 3.289883112488289e-07, "loss": 0.7906, "step": 7259 }, { "epoch": 0.6698189366855034, "grad_norm": 1.7789241286416813, "learning_rate": 3.288226185214199e-07, "loss": 0.6767, "step": 7260 }, { "epoch": 0.6698189366855034, "eval_GEN Loss": 0.43759557604789734, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3323151469230652, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.807421863079071, "eval_runtime": 56.0861, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 7260 }, { "epoch": 0.6699111982470304, "grad_norm": 1.2309333481382618, "learning_rate": 3.286569526340715e-07, "loss": 0.5434, "step": 7261 }, { "epoch": 0.6700034598085572, "grad_norm": 2.6989915985615878, "learning_rate": 3.284913136017964e-07, "loss": 0.9112, "step": 7262 }, { "epoch": 0.6700957213700842, "grad_norm": 2.050080363164182, "learning_rate": 3.283257014396052e-07, "loss": 0.5108, "step": 7263 }, { "epoch": 0.6701879829316111, "grad_norm": 1.7210653830886362, "learning_rate": 3.281601161625061e-07, "loss": 0.6992, "step": 7264 }, { "epoch": 0.670280244493138, "grad_norm": 1.5930366095470851, "learning_rate": 3.279945577855044e-07, "loss": 0.6393, "step": 7265 }, { "epoch": 0.670280244493138, "eval_GEN Loss": 0.4376567602157593, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32926681637763977, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8058894276618958, "eval_runtime": 56.0582, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 7265 }, { "epoch": 0.670372506054665, "grad_norm": 2.6086512260103643, "learning_rate": 3.2782902632360354e-07, "loss": 0.9782, "step": 7266 }, { "epoch": 0.6704647676161919, "grad_norm": 3.6813710971792064, "learning_rate": 3.276635217918036e-07, "loss": 0.8647, "step": 7267 }, { "epoch": 0.6705570291777189, "grad_norm": 2.286253819072524, "learning_rate": 3.274980442051039e-07, "loss": 0.777, "step": 7268 }, { "epoch": 0.6706492907392457, "grad_norm": 1.7824519892474255, "learning_rate": 3.2733259357849935e-07, "loss": 0.6804, "step": 7269 }, { "epoch": 0.6707415523007727, "grad_norm": 1.7202629009278156, "learning_rate": 3.2716716992698363e-07, "loss": 0.5336, "step": 7270 }, { "epoch": 0.6707415523007727, "eval_GEN Loss": 0.43874773383140564, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32908597588539124, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8070312738418579, "eval_runtime": 56.1211, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 7270 }, { "epoch": 0.6708338138622996, "grad_norm": 2.0955293107965787, "learning_rate": 3.270017732655479e-07, "loss": 0.6379, "step": 7271 }, { "epoch": 0.6709260754238265, "grad_norm": 1.7079405979327706, "learning_rate": 3.2683640360918076e-07, "loss": 0.5491, "step": 7272 }, { "epoch": 0.6710183369853535, "grad_norm": 3.8240423782368618, "learning_rate": 3.266710609728678e-07, "loss": 0.8512, "step": 7273 }, { "epoch": 0.6711105985468804, "grad_norm": 1.911580939139347, "learning_rate": 3.2650574537159277e-07, "loss": 0.5626, "step": 7274 }, { "epoch": 0.6712028601084074, "grad_norm": 2.6818894895752026, "learning_rate": 3.2634045682033734e-07, "loss": 0.6163, "step": 7275 }, { "epoch": 0.6712028601084074, "eval_GEN Loss": 0.4383014142513275, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3278586268424988, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8086237907409668, "eval_runtime": 56.0235, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 7275 }, { "epoch": 0.6712951216699342, "grad_norm": 2.6412134044073525, "learning_rate": 3.2617519533407944e-07, "loss": 0.7878, "step": 7276 }, { "epoch": 0.6713873832314612, "grad_norm": 1.7636732251355336, "learning_rate": 3.260099609277957e-07, "loss": 0.6271, "step": 7277 }, { "epoch": 0.6714796447929882, "grad_norm": 1.8954835244441244, "learning_rate": 3.2584475361645993e-07, "loss": 0.7725, "step": 7278 }, { "epoch": 0.671571906354515, "grad_norm": 1.5019546343471366, "learning_rate": 3.256795734150438e-07, "loss": 0.6307, "step": 7279 }, { "epoch": 0.671664167916042, "grad_norm": 2.023296548022791, "learning_rate": 3.2551442033851555e-07, "loss": 0.6097, "step": 7280 }, { "epoch": 0.671664167916042, "eval_GEN Loss": 0.43904829025268555, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32960405945777893, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8079326748847961, "eval_runtime": 57.027, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7280 }, { "epoch": 0.6717564294775689, "grad_norm": 1.5724312766506627, "learning_rate": 3.253492944018419e-07, "loss": 0.4772, "step": 7281 }, { "epoch": 0.6718486910390958, "grad_norm": 2.9167816130573763, "learning_rate": 3.251841956199869e-07, "loss": 0.8149, "step": 7282 }, { "epoch": 0.6719409526006228, "grad_norm": 2.107047678026027, "learning_rate": 3.250191240079122e-07, "loss": 0.7348, "step": 7283 }, { "epoch": 0.6720332141621497, "grad_norm": 2.2017442126502207, "learning_rate": 3.248540795805765e-07, "loss": 0.8181, "step": 7284 }, { "epoch": 0.6721254757236766, "grad_norm": 2.884592434660212, "learning_rate": 3.2468906235293646e-07, "loss": 0.6155, "step": 7285 }, { "epoch": 0.6721254757236766, "eval_GEN Loss": 0.43994081020355225, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3350571095943451, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8098557591438293, "eval_runtime": 57.1839, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7285 }, { "epoch": 0.6722177372852035, "grad_norm": 1.918863928202312, "learning_rate": 3.245240723399466e-07, "loss": 0.993, "step": 7286 }, { "epoch": 0.6723099988467305, "grad_norm": 1.9367073570955653, "learning_rate": 3.243591095565579e-07, "loss": 0.6167, "step": 7287 }, { "epoch": 0.6724022604082575, "grad_norm": 1.5259548192366836, "learning_rate": 3.241941740177201e-07, "loss": 0.6297, "step": 7288 }, { "epoch": 0.6724945219697843, "grad_norm": 2.293058426125001, "learning_rate": 3.240292657383796e-07, "loss": 0.6424, "step": 7289 }, { "epoch": 0.6725867835313113, "grad_norm": 1.9420617533180098, "learning_rate": 3.2386438473348104e-07, "loss": 0.5631, "step": 7290 }, { "epoch": 0.6725867835313113, "eval_GEN Loss": 0.4390757977962494, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3403724133968353, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8081730604171753, "eval_runtime": 57.2886, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7290 }, { "epoch": 0.6726790450928382, "grad_norm": 1.2387429190423234, "learning_rate": 3.236995310179657e-07, "loss": 0.5336, "step": 7291 }, { "epoch": 0.6727713066543651, "grad_norm": 2.0595083586543126, "learning_rate": 3.23534704606773e-07, "loss": 0.6323, "step": 7292 }, { "epoch": 0.6728635682158921, "grad_norm": 1.82432458033373, "learning_rate": 3.2336990551483996e-07, "loss": 0.6371, "step": 7293 }, { "epoch": 0.672955829777419, "grad_norm": 1.6868665398822769, "learning_rate": 3.2320513375710115e-07, "loss": 0.6095, "step": 7294 }, { "epoch": 0.6730480913389459, "grad_norm": 2.1301880838072487, "learning_rate": 3.2304038934848793e-07, "loss": 0.6548, "step": 7295 }, { "epoch": 0.6730480913389459, "eval_GEN Loss": 0.4392530918121338, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34245195984840393, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8096754550933838, "eval_runtime": 57.0763, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7295 }, { "epoch": 0.6731403529004728, "grad_norm": 2.2265736873759234, "learning_rate": 3.2287567230392983e-07, "loss": 0.8669, "step": 7296 }, { "epoch": 0.6732326144619998, "grad_norm": 2.0855115282496524, "learning_rate": 3.2271098263835386e-07, "loss": 0.6194, "step": 7297 }, { "epoch": 0.6733248760235268, "grad_norm": 2.389177100757607, "learning_rate": 3.2254632036668467e-07, "loss": 0.8502, "step": 7298 }, { "epoch": 0.6734171375850536, "grad_norm": 1.5805253464355222, "learning_rate": 3.2238168550384387e-07, "loss": 0.736, "step": 7299 }, { "epoch": 0.6735093991465806, "grad_norm": 1.6162292199507258, "learning_rate": 3.22217078064751e-07, "loss": 0.5509, "step": 7300 }, { "epoch": 0.6735093991465806, "eval_GEN Loss": 0.4398425221443176, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.33733147382736206, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8040564656257629, "eval_runtime": 57.1654, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7300 }, { "epoch": 0.6736016607081075, "grad_norm": 2.2068709466866014, "learning_rate": 3.220524980643233e-07, "loss": 0.6376, "step": 7301 }, { "epoch": 0.6736939222696344, "grad_norm": 2.779941156875159, "learning_rate": 3.2188794551747465e-07, "loss": 0.6667, "step": 7302 }, { "epoch": 0.6737861838311613, "grad_norm": 2.1922503457997564, "learning_rate": 3.2172342043911794e-07, "loss": 0.6137, "step": 7303 }, { "epoch": 0.6738784453926883, "grad_norm": 3.0156811700107142, "learning_rate": 3.21558922844162e-07, "loss": 0.739, "step": 7304 }, { "epoch": 0.6739707069542152, "grad_norm": 1.852968851796741, "learning_rate": 3.2139445274751436e-07, "loss": 0.5322, "step": 7305 }, { "epoch": 0.6739707069542152, "eval_GEN Loss": 0.4397372901439667, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34001004695892334, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8059495091438293, "eval_runtime": 57.0737, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7305 }, { "epoch": 0.6740629685157421, "grad_norm": 1.596553602681776, "learning_rate": 3.2123001016407876e-07, "loss": 0.6259, "step": 7306 }, { "epoch": 0.6741552300772691, "grad_norm": 2.43674510995911, "learning_rate": 3.2106559510875825e-07, "loss": 0.9191, "step": 7307 }, { "epoch": 0.6742474916387959, "grad_norm": 1.963720340420855, "learning_rate": 3.209012075964517e-07, "loss": 0.7359, "step": 7308 }, { "epoch": 0.6743397532003229, "grad_norm": 3.5147903859166467, "learning_rate": 3.2073684764205637e-07, "loss": 1.1219, "step": 7309 }, { "epoch": 0.6744320147618499, "grad_norm": 1.9101128951108979, "learning_rate": 3.205725152604671e-07, "loss": 0.5942, "step": 7310 }, { "epoch": 0.6744320147618499, "eval_GEN Loss": 0.44064754247665405, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.343334436416626, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.803004801273346, "eval_runtime": 57.2583, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7310 }, { "epoch": 0.6745242763233767, "grad_norm": 2.0092177527570976, "learning_rate": 3.204082104665754e-07, "loss": 0.5066, "step": 7311 }, { "epoch": 0.6746165378849037, "grad_norm": 1.9135148109579698, "learning_rate": 3.202439332752714e-07, "loss": 0.6944, "step": 7312 }, { "epoch": 0.6747087994464306, "grad_norm": 1.5735856622144522, "learning_rate": 3.2007968370144133e-07, "loss": 0.4923, "step": 7313 }, { "epoch": 0.6748010610079576, "grad_norm": 1.854720333456571, "learning_rate": 3.1991546175997074e-07, "loss": 0.6912, "step": 7314 }, { "epoch": 0.6748933225694845, "grad_norm": 2.2781060676721245, "learning_rate": 3.1975126746574104e-07, "loss": 0.7738, "step": 7315 }, { "epoch": 0.6748933225694845, "eval_GEN Loss": 0.4393399953842163, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3463177978992462, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8073017001152039, "eval_runtime": 57.0724, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7315 }, { "epoch": 0.6749855841310114, "grad_norm": 3.003740930033111, "learning_rate": 3.1958710083363207e-07, "loss": 0.8218, "step": 7316 }, { "epoch": 0.6750778456925384, "grad_norm": 2.2562900791674116, "learning_rate": 3.1942296187852037e-07, "loss": 0.6287, "step": 7317 }, { "epoch": 0.6751701072540652, "grad_norm": 1.873939878440099, "learning_rate": 3.192588506152813e-07, "loss": 0.5917, "step": 7318 }, { "epoch": 0.6752623688155922, "grad_norm": 1.591713564021823, "learning_rate": 3.190947670587862e-07, "loss": 0.5432, "step": 7319 }, { "epoch": 0.6753546303771192, "grad_norm": 1.8653229964727631, "learning_rate": 3.1893071122390484e-07, "loss": 0.5767, "step": 7320 }, { "epoch": 0.6753546303771192, "eval_GEN Loss": 0.44006672501564026, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34733569622039795, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8112680315971375, "eval_runtime": 57.0811, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7320 }, { "epoch": 0.675446891938646, "grad_norm": 1.958459872188881, "learning_rate": 3.1876668312550437e-07, "loss": 0.8288, "step": 7321 }, { "epoch": 0.675539153500173, "grad_norm": 2.455460644483487, "learning_rate": 3.1860268277844884e-07, "loss": 0.9708, "step": 7322 }, { "epoch": 0.6756314150616999, "grad_norm": 1.8776800059051368, "learning_rate": 3.184387101976008e-07, "loss": 0.516, "step": 7323 }, { "epoch": 0.6757236766232269, "grad_norm": 2.140634644532372, "learning_rate": 3.182747653978188e-07, "loss": 0.7599, "step": 7324 }, { "epoch": 0.6758159381847538, "grad_norm": 2.2385442000111535, "learning_rate": 3.181108483939609e-07, "loss": 0.6333, "step": 7325 }, { "epoch": 0.6758159381847538, "eval_GEN Loss": 0.43992865085601807, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3465224802494049, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8067908883094788, "eval_runtime": 56.9765, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 7325 }, { "epoch": 0.6759081997462807, "grad_norm": 1.674556097740936, "learning_rate": 3.1794695920088074e-07, "loss": 0.6656, "step": 7326 }, { "epoch": 0.6760004613078077, "grad_norm": 2.2170161935024155, "learning_rate": 3.177830978334304e-07, "loss": 0.649, "step": 7327 }, { "epoch": 0.6760927228693345, "grad_norm": 1.8376267228191272, "learning_rate": 3.1761926430645936e-07, "loss": 0.6678, "step": 7328 }, { "epoch": 0.6761849844308615, "grad_norm": 1.7379095404886835, "learning_rate": 3.1745545863481453e-07, "loss": 0.6745, "step": 7329 }, { "epoch": 0.6762772459923885, "grad_norm": 2.0760814010038366, "learning_rate": 3.1729168083334e-07, "loss": 0.618, "step": 7330 }, { "epoch": 0.6762772459923885, "eval_GEN Loss": 0.4395467936992645, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3499825596809387, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8092548251152039, "eval_runtime": 57.165, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7330 }, { "epoch": 0.6763695075539153, "grad_norm": 1.8731569408446678, "learning_rate": 3.171279309168776e-07, "loss": 0.6375, "step": 7331 }, { "epoch": 0.6764617691154423, "grad_norm": 2.073936465049623, "learning_rate": 3.16964208900267e-07, "loss": 0.6512, "step": 7332 }, { "epoch": 0.6765540306769692, "grad_norm": 1.9530668399570024, "learning_rate": 3.1680051479834437e-07, "loss": 0.6002, "step": 7333 }, { "epoch": 0.6766462922384961, "grad_norm": 1.6354932855668174, "learning_rate": 3.166368486259443e-07, "loss": 0.4912, "step": 7334 }, { "epoch": 0.676738553800023, "grad_norm": 2.072650378523588, "learning_rate": 3.1647321039789825e-07, "loss": 0.8469, "step": 7335 }, { "epoch": 0.676738553800023, "eval_GEN Loss": 0.4399409294128418, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3447607159614563, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8113881945610046, "eval_runtime": 57.2856, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7335 }, { "epoch": 0.67683081536155, "grad_norm": 2.355406005550927, "learning_rate": 3.163096001290358e-07, "loss": 0.5947, "step": 7336 }, { "epoch": 0.676923076923077, "grad_norm": 4.261844603903816, "learning_rate": 3.16146017834183e-07, "loss": 0.6516, "step": 7337 }, { "epoch": 0.6770153384846038, "grad_norm": 1.9659904290814867, "learning_rate": 3.1598246352816426e-07, "loss": 0.6039, "step": 7338 }, { "epoch": 0.6771076000461308, "grad_norm": 1.5546248547958315, "learning_rate": 3.158189372258011e-07, "loss": 0.7108, "step": 7339 }, { "epoch": 0.6771998616076577, "grad_norm": 1.863024967184415, "learning_rate": 3.156554389419127e-07, "loss": 0.701, "step": 7340 }, { "epoch": 0.6771998616076577, "eval_GEN Loss": 0.439403235912323, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34049171209335327, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8156550526618958, "eval_runtime": 57.2521, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7340 }, { "epoch": 0.6772921231691846, "grad_norm": 2.844053371393424, "learning_rate": 3.154919686913148e-07, "loss": 0.7239, "step": 7341 }, { "epoch": 0.6773843847307116, "grad_norm": 2.018370388234651, "learning_rate": 3.153285264888224e-07, "loss": 0.6763, "step": 7342 }, { "epoch": 0.6774766462922385, "grad_norm": 2.756429819194342, "learning_rate": 3.1516511234924623e-07, "loss": 0.7003, "step": 7343 }, { "epoch": 0.6775689078537654, "grad_norm": 3.028459087466602, "learning_rate": 3.1500172628739533e-07, "loss": 0.806, "step": 7344 }, { "epoch": 0.6776611694152923, "grad_norm": 2.358595118734039, "learning_rate": 3.148383683180758e-07, "loss": 0.7185, "step": 7345 }, { "epoch": 0.6776611694152923, "eval_GEN Loss": 0.43916720151901245, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3351098299026489, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8154447078704834, "eval_runtime": 57.1768, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7345 }, { "epoch": 0.6777534309768193, "grad_norm": 2.674198569477766, "learning_rate": 3.1467503845609146e-07, "loss": 0.6726, "step": 7346 }, { "epoch": 0.6778456925383463, "grad_norm": 1.944163111446442, "learning_rate": 3.1451173671624394e-07, "loss": 0.5862, "step": 7347 }, { "epoch": 0.6779379540998731, "grad_norm": 1.5711846685986952, "learning_rate": 3.1434846311333125e-07, "loss": 0.601, "step": 7348 }, { "epoch": 0.6780302156614001, "grad_norm": 1.6480229130506052, "learning_rate": 3.141852176621498e-07, "loss": 0.5727, "step": 7349 }, { "epoch": 0.678122477222927, "grad_norm": 2.035611276734158, "learning_rate": 3.140220003774931e-07, "loss": 0.7082, "step": 7350 }, { "epoch": 0.678122477222927, "eval_GEN Loss": 0.43958336114883423, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3380092978477478, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8146634697914124, "eval_runtime": 57.2565, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7350 }, { "epoch": 0.6782147387844539, "grad_norm": 1.629032388545908, "learning_rate": 3.138588112741526e-07, "loss": 0.6544, "step": 7351 }, { "epoch": 0.6783070003459809, "grad_norm": 1.905206616004218, "learning_rate": 3.136956503669158e-07, "loss": 0.5943, "step": 7352 }, { "epoch": 0.6783992619075078, "grad_norm": 1.8246368351114417, "learning_rate": 3.135325176705696e-07, "loss": 0.6654, "step": 7353 }, { "epoch": 0.6784915234690347, "grad_norm": 1.6687422419606046, "learning_rate": 3.1336941319989675e-07, "loss": 0.6111, "step": 7354 }, { "epoch": 0.6785837850305616, "grad_norm": 2.0525047625416573, "learning_rate": 3.1320633696967843e-07, "loss": 0.6342, "step": 7355 }, { "epoch": 0.6785837850305616, "eval_GEN Loss": 0.43953609466552734, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3417215049266815, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8143930435180664, "eval_runtime": 57.1885, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7355 }, { "epoch": 0.6786760465920886, "grad_norm": 2.174203202965884, "learning_rate": 3.130432889946923e-07, "loss": 0.7146, "step": 7356 }, { "epoch": 0.6787683081536156, "grad_norm": 1.5722567774911818, "learning_rate": 3.128802692897144e-07, "loss": 0.5134, "step": 7357 }, { "epoch": 0.6788605697151424, "grad_norm": 2.160755879179206, "learning_rate": 3.1271727786951805e-07, "loss": 0.5881, "step": 7358 }, { "epoch": 0.6789528312766694, "grad_norm": 1.618356161481068, "learning_rate": 3.12554314748873e-07, "loss": 0.6239, "step": 7359 }, { "epoch": 0.6790450928381963, "grad_norm": 2.515090473922486, "learning_rate": 3.1239137994254823e-07, "loss": 0.8414, "step": 7360 }, { "epoch": 0.6790450928381963, "eval_GEN Loss": 0.4404229521751404, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34472742676734924, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8146935105323792, "eval_runtime": 57.3914, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7360 }, { "epoch": 0.6791373543997232, "grad_norm": 1.7223163224077886, "learning_rate": 3.122284734653084e-07, "loss": 0.5855, "step": 7361 }, { "epoch": 0.6792296159612502, "grad_norm": 1.8395854960796998, "learning_rate": 3.1206559533191687e-07, "loss": 0.6248, "step": 7362 }, { "epoch": 0.6793218775227771, "grad_norm": 2.965209790102881, "learning_rate": 3.119027455571332e-07, "loss": 0.8669, "step": 7363 }, { "epoch": 0.679414139084304, "grad_norm": 2.283283381387464, "learning_rate": 3.1173992415571605e-07, "loss": 0.7669, "step": 7364 }, { "epoch": 0.6795064006458309, "grad_norm": 2.936388483287696, "learning_rate": 3.1157713114241976e-07, "loss": 0.7407, "step": 7365 }, { "epoch": 0.6795064006458309, "eval_GEN Loss": 0.4400458335876465, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34918051958084106, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8172475695610046, "eval_runtime": 57.3073, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7365 }, { "epoch": 0.6795986622073579, "grad_norm": 1.9169551770888122, "learning_rate": 3.114143665319972e-07, "loss": 0.6145, "step": 7366 }, { "epoch": 0.6796909237688847, "grad_norm": 3.0055232511406214, "learning_rate": 3.112516303391986e-07, "loss": 0.5886, "step": 7367 }, { "epoch": 0.6797831853304117, "grad_norm": 2.025182606825834, "learning_rate": 3.110889225787708e-07, "loss": 0.7522, "step": 7368 }, { "epoch": 0.6798754468919387, "grad_norm": 2.6268294384908573, "learning_rate": 3.10926243265459e-07, "loss": 0.7943, "step": 7369 }, { "epoch": 0.6799677084534655, "grad_norm": 1.891174840138953, "learning_rate": 3.1076359241400537e-07, "loss": 0.6565, "step": 7370 }, { "epoch": 0.6799677084534655, "eval_GEN Loss": 0.4393017292022705, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3488318622112274, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8158353567123413, "eval_runtime": 57.0815, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7370 }, { "epoch": 0.6800599700149925, "grad_norm": 2.215345937288463, "learning_rate": 3.106009700391498e-07, "loss": 0.6245, "step": 7371 }, { "epoch": 0.6801522315765194, "grad_norm": 1.8027227599639872, "learning_rate": 3.1043837615562907e-07, "loss": 0.486, "step": 7372 }, { "epoch": 0.6802444931380464, "grad_norm": 1.3869684092697072, "learning_rate": 3.1027581077817774e-07, "loss": 0.5897, "step": 7373 }, { "epoch": 0.6803367546995733, "grad_norm": 1.6568442659100806, "learning_rate": 3.1011327392152783e-07, "loss": 0.6603, "step": 7374 }, { "epoch": 0.6804290162611002, "grad_norm": 4.375827138117088, "learning_rate": 3.0995076560040894e-07, "loss": 0.6952, "step": 7375 }, { "epoch": 0.6804290162611002, "eval_GEN Loss": 0.43934983015060425, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3432154655456543, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8145432472229004, "eval_runtime": 56.4219, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 7375 }, { "epoch": 0.6805212778226272, "grad_norm": 3.8570146036810313, "learning_rate": 3.097882858295474e-07, "loss": 0.6529, "step": 7376 }, { "epoch": 0.680613539384154, "grad_norm": 2.3121465807677155, "learning_rate": 3.0962583462366737e-07, "loss": 0.7622, "step": 7377 }, { "epoch": 0.680705800945681, "grad_norm": 2.281510224029534, "learning_rate": 3.094634119974908e-07, "loss": 0.6754, "step": 7378 }, { "epoch": 0.680798062507208, "grad_norm": 2.3818401419010833, "learning_rate": 3.093010179657366e-07, "loss": 0.8696, "step": 7379 }, { "epoch": 0.6808903240687348, "grad_norm": 1.8088314579217888, "learning_rate": 3.0913865254312087e-07, "loss": 0.5473, "step": 7380 }, { "epoch": 0.6808903240687348, "eval_GEN Loss": 0.43961986899375916, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34280186891555786, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8224759697914124, "eval_runtime": 57.2968, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7380 }, { "epoch": 0.6809825856302618, "grad_norm": 1.611461677280018, "learning_rate": 3.089763157443576e-07, "loss": 0.5605, "step": 7381 }, { "epoch": 0.6810748471917887, "grad_norm": 1.9826728590652491, "learning_rate": 3.088140075841583e-07, "loss": 0.5686, "step": 7382 }, { "epoch": 0.6811671087533157, "grad_norm": 2.8043164772628266, "learning_rate": 3.08651728077231e-07, "loss": 0.8515, "step": 7383 }, { "epoch": 0.6812593703148426, "grad_norm": 1.9099225451860997, "learning_rate": 3.0848947723828216e-07, "loss": 0.6916, "step": 7384 }, { "epoch": 0.6813516318763695, "grad_norm": 2.028585298954462, "learning_rate": 3.0832725508201503e-07, "loss": 0.8394, "step": 7385 }, { "epoch": 0.6813516318763695, "eval_GEN Loss": 0.43927276134490967, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33902469277381897, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8228365182876587, "eval_runtime": 57.1472, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7385 }, { "epoch": 0.6814438934378965, "grad_norm": 2.4746878005978292, "learning_rate": 3.0816506162313076e-07, "loss": 0.4862, "step": 7386 }, { "epoch": 0.6815361549994233, "grad_norm": 2.117585886297289, "learning_rate": 3.0800289687632703e-07, "loss": 0.7424, "step": 7387 }, { "epoch": 0.6816284165609503, "grad_norm": 1.7942955407850418, "learning_rate": 3.078407608562998e-07, "loss": 0.7237, "step": 7388 }, { "epoch": 0.6817206781224773, "grad_norm": 2.15528157588315, "learning_rate": 3.07678653577742e-07, "loss": 0.6836, "step": 7389 }, { "epoch": 0.6818129396840041, "grad_norm": 1.608669136542332, "learning_rate": 3.075165750553443e-07, "loss": 0.7224, "step": 7390 }, { "epoch": 0.6818129396840041, "eval_GEN Loss": 0.4389278292655945, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33286580443382263, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8236778974533081, "eval_runtime": 56.3149, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 7390 }, { "epoch": 0.6819052012455311, "grad_norm": 2.291438852132691, "learning_rate": 3.0735452530379404e-07, "loss": 0.735, "step": 7391 }, { "epoch": 0.681997462807058, "grad_norm": 1.9405690219552625, "learning_rate": 3.0719250433777675e-07, "loss": 0.7085, "step": 7392 }, { "epoch": 0.682089724368585, "grad_norm": 1.7052838867862499, "learning_rate": 3.0703051217197513e-07, "loss": 0.6725, "step": 7393 }, { "epoch": 0.6821819859301118, "grad_norm": 1.5363025771839778, "learning_rate": 3.068685488210688e-07, "loss": 0.4959, "step": 7394 }, { "epoch": 0.6822742474916388, "grad_norm": 3.9038719974297225, "learning_rate": 3.0670661429973534e-07, "loss": 0.7322, "step": 7395 }, { "epoch": 0.6822742474916388, "eval_GEN Loss": 0.4386090338230133, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32903170585632324, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8276442289352417, "eval_runtime": 56.8735, "eval_samples_per_second": 1.143, "eval_steps_per_second": 0.088, "step": 7395 }, { "epoch": 0.6823665090531658, "grad_norm": 1.8569476471399342, "learning_rate": 3.0654470862264944e-07, "loss": 0.636, "step": 7396 }, { "epoch": 0.6824587706146926, "grad_norm": 2.2445913087843037, "learning_rate": 3.0638283180448354e-07, "loss": 0.6861, "step": 7397 }, { "epoch": 0.6825510321762196, "grad_norm": 1.8717253524095403, "learning_rate": 3.0622098385990654e-07, "loss": 0.7168, "step": 7398 }, { "epoch": 0.6826432937377465, "grad_norm": 2.0895787338579073, "learning_rate": 3.0605916480358615e-07, "loss": 0.462, "step": 7399 }, { "epoch": 0.6827355552992734, "grad_norm": 2.1427561046325527, "learning_rate": 3.05897374650186e-07, "loss": 0.7889, "step": 7400 }, { "epoch": 0.6827355552992734, "eval_GEN Loss": 0.4387158453464508, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9047619047619048, "eval_PRM F1 AUC": 0.7621791513881613, "eval_PRM F1 Neg": 0.6363636363636364, "eval_PRM Loss": 0.3269506096839905, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.8941176470588236, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8333232998847961, "eval_runtime": 57.0662, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7400 }, { "epoch": 0.6828278168608004, "grad_norm": 4.135631906808779, "learning_rate": 3.057356134143683e-07, "loss": 0.8343, "step": 7401 }, { "epoch": 0.6829200784223273, "grad_norm": 1.6906969395948925, "learning_rate": 3.055738811107916e-07, "loss": 0.6455, "step": 7402 }, { "epoch": 0.6830123399838542, "grad_norm": 2.4233381784082835, "learning_rate": 3.0541217775411263e-07, "loss": 0.5997, "step": 7403 }, { "epoch": 0.6831046015453811, "grad_norm": 2.263054604506093, "learning_rate": 3.052505033589853e-07, "loss": 0.6816, "step": 7404 }, { "epoch": 0.6831968631069081, "grad_norm": 4.189084970034578, "learning_rate": 3.050888579400605e-07, "loss": 0.7467, "step": 7405 }, { "epoch": 0.6831968631069081, "eval_GEN Loss": 0.438618004322052, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9047619047619048, "eval_PRM F1 AUC": 0.7621791513881613, "eval_PRM F1 Neg": 0.6363636363636364, "eval_PRM Loss": 0.3279200792312622, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.8941176470588236, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.8352463841438293, "eval_runtime": 57.2307, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7405 }, { "epoch": 0.683289124668435, "grad_norm": 2.0150786414793957, "learning_rate": 3.0492724151198686e-07, "loss": 0.7063, "step": 7406 }, { "epoch": 0.6833813862299619, "grad_norm": 2.4864234922488246, "learning_rate": 3.047656540894105e-07, "loss": 0.8277, "step": 7407 }, { "epoch": 0.6834736477914889, "grad_norm": 2.475628256134793, "learning_rate": 3.0460409568697474e-07, "loss": 0.7066, "step": 7408 }, { "epoch": 0.6835659093530158, "grad_norm": 3.249411833074664, "learning_rate": 3.0444256631931976e-07, "loss": 0.8813, "step": 7409 }, { "epoch": 0.6836581709145427, "grad_norm": 1.9011196999661604, "learning_rate": 3.042810660010844e-07, "loss": 0.6933, "step": 7410 }, { "epoch": 0.6836581709145427, "eval_GEN Loss": 0.4391014575958252, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32819247245788574, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8240384459495544, "eval_runtime": 57.2516, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7410 }, { "epoch": 0.6837504324760697, "grad_norm": 3.3631507757329713, "learning_rate": 3.041195947469035e-07, "loss": 0.7632, "step": 7411 }, { "epoch": 0.6838426940375966, "grad_norm": 1.9843764465226146, "learning_rate": 3.039581525714101e-07, "loss": 0.8708, "step": 7412 }, { "epoch": 0.6839349555991235, "grad_norm": 2.044576620516082, "learning_rate": 3.037967394892339e-07, "loss": 0.5561, "step": 7413 }, { "epoch": 0.6840272171606504, "grad_norm": 2.1242002597566123, "learning_rate": 3.036353555150031e-07, "loss": 0.5641, "step": 7414 }, { "epoch": 0.6841194787221774, "grad_norm": 1.8484102612179152, "learning_rate": 3.0347400066334206e-07, "loss": 0.7258, "step": 7415 }, { "epoch": 0.6841194787221774, "eval_GEN Loss": 0.4390805959701538, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3379010260105133, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8171274065971375, "eval_runtime": 57.29, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7415 }, { "epoch": 0.6842117402837044, "grad_norm": 1.8661039952069638, "learning_rate": 3.0331267494887314e-07, "loss": 0.7139, "step": 7416 }, { "epoch": 0.6843040018452312, "grad_norm": 1.5788417028666344, "learning_rate": 3.0315137838621625e-07, "loss": 0.5795, "step": 7417 }, { "epoch": 0.6843962634067582, "grad_norm": 1.6772879802858316, "learning_rate": 3.029901109899878e-07, "loss": 0.47, "step": 7418 }, { "epoch": 0.684488524968285, "grad_norm": 1.8496228418271132, "learning_rate": 3.0282887277480253e-07, "loss": 0.5766, "step": 7419 }, { "epoch": 0.684580786529812, "grad_norm": 1.8799381692199497, "learning_rate": 3.026676637552715e-07, "loss": 0.7046, "step": 7420 }, { "epoch": 0.684580786529812, "eval_GEN Loss": 0.44013333320617676, "eval_GEN top-5 accuracy": 0.9824638316527838, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3456646800041199, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8142127394676208, "eval_runtime": 57.4145, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 7420 }, { "epoch": 0.684673048091339, "grad_norm": 2.5087383929163876, "learning_rate": 3.025064839460046e-07, "loss": 0.536, "step": 7421 }, { "epoch": 0.6847653096528659, "grad_norm": 1.6588779478959517, "learning_rate": 3.0234533336160743e-07, "loss": 0.475, "step": 7422 }, { "epoch": 0.6848575712143928, "grad_norm": 1.9407373759707396, "learning_rate": 3.0218421201668406e-07, "loss": 0.6079, "step": 7423 }, { "epoch": 0.6849498327759197, "grad_norm": 1.9375638945435232, "learning_rate": 3.0202311992583553e-07, "loss": 0.7915, "step": 7424 }, { "epoch": 0.6850420943374467, "grad_norm": 2.075894219783399, "learning_rate": 3.0186205710366045e-07, "loss": 0.7063, "step": 7425 }, { "epoch": 0.6850420943374467, "eval_GEN Loss": 0.4404766261577606, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3516843318939209, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8140624761581421, "eval_runtime": 57.0341, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7425 }, { "epoch": 0.6851343558989735, "grad_norm": 1.8969738184782594, "learning_rate": 3.017010235647542e-07, "loss": 0.4772, "step": 7426 }, { "epoch": 0.6852266174605005, "grad_norm": 1.382497211531331, "learning_rate": 3.0154001932371e-07, "loss": 0.5771, "step": 7427 }, { "epoch": 0.6853188790220275, "grad_norm": 2.042856443561697, "learning_rate": 3.013790443951187e-07, "loss": 0.8191, "step": 7428 }, { "epoch": 0.6854111405835543, "grad_norm": 2.1550334975831302, "learning_rate": 3.012180987935675e-07, "loss": 0.6966, "step": 7429 }, { "epoch": 0.6855034021450813, "grad_norm": 1.7280630233032204, "learning_rate": 3.0105718253364184e-07, "loss": 0.6623, "step": 7430 }, { "epoch": 0.6855034021450813, "eval_GEN Loss": 0.44067272543907166, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3555468022823334, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8149939775466919, "eval_runtime": 56.9917, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 7430 }, { "epoch": 0.6855956637066082, "grad_norm": 2.261478293106886, "learning_rate": 3.0089629562992417e-07, "loss": 0.7236, "step": 7431 }, { "epoch": 0.6856879252681352, "grad_norm": 2.086559805537447, "learning_rate": 3.0073543809699464e-07, "loss": 0.661, "step": 7432 }, { "epoch": 0.6857801868296621, "grad_norm": 1.3977536130129515, "learning_rate": 3.005746099494298e-07, "loss": 0.4299, "step": 7433 }, { "epoch": 0.685872448391189, "grad_norm": 2.011027840720222, "learning_rate": 3.004138112018045e-07, "loss": 0.8292, "step": 7434 }, { "epoch": 0.685964709952716, "grad_norm": 1.663498217948821, "learning_rate": 3.0025304186869055e-07, "loss": 0.6258, "step": 7435 }, { "epoch": 0.685964709952716, "eval_GEN Loss": 0.440920889377594, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3507845401763916, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8152944445610046, "eval_runtime": 57.2635, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7435 }, { "epoch": 0.6860569715142428, "grad_norm": 2.5048646344078564, "learning_rate": 3.0009230196465725e-07, "loss": 0.7135, "step": 7436 }, { "epoch": 0.6861492330757698, "grad_norm": 1.8866506523979203, "learning_rate": 2.999315915042708e-07, "loss": 0.6516, "step": 7437 }, { "epoch": 0.6862414946372968, "grad_norm": 1.9144362307444776, "learning_rate": 2.9977091050209515e-07, "loss": 0.5757, "step": 7438 }, { "epoch": 0.6863337561988236, "grad_norm": 1.983273656711781, "learning_rate": 2.996102589726918e-07, "loss": 0.5536, "step": 7439 }, { "epoch": 0.6864260177603506, "grad_norm": 1.587339529641708, "learning_rate": 2.9944963693061874e-07, "loss": 0.6893, "step": 7440 }, { "epoch": 0.6864260177603506, "eval_GEN Loss": 0.4402867555618286, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3467608392238617, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8116586804389954, "eval_runtime": 57.0933, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7440 }, { "epoch": 0.6865182793218775, "grad_norm": 2.0897472240425987, "learning_rate": 2.992890443904319e-07, "loss": 0.6989, "step": 7441 }, { "epoch": 0.6866105408834045, "grad_norm": 1.6445195614682129, "learning_rate": 2.9912848136668464e-07, "loss": 0.6799, "step": 7442 }, { "epoch": 0.6867028024449314, "grad_norm": 1.6263943283797864, "learning_rate": 2.9896794787392746e-07, "loss": 0.6301, "step": 7443 }, { "epoch": 0.6867950640064583, "grad_norm": 2.2053484297331885, "learning_rate": 2.988074439267079e-07, "loss": 0.8273, "step": 7444 }, { "epoch": 0.6868873255679853, "grad_norm": 3.676145824858514, "learning_rate": 2.986469695395711e-07, "loss": 1.0863, "step": 7445 }, { "epoch": 0.6868873255679853, "eval_GEN Loss": 0.43981650471687317, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.33815568685531616, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8112980723381042, "eval_runtime": 57.3239, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7445 }, { "epoch": 0.6869795871295121, "grad_norm": 2.2381197470538257, "learning_rate": 2.9848652472705964e-07, "loss": 0.7022, "step": 7446 }, { "epoch": 0.6870718486910391, "grad_norm": 1.706235045028308, "learning_rate": 2.9832610950371357e-07, "loss": 0.6071, "step": 7447 }, { "epoch": 0.6871641102525661, "grad_norm": 1.9749741840172408, "learning_rate": 2.9816572388406933e-07, "loss": 0.7073, "step": 7448 }, { "epoch": 0.6872563718140929, "grad_norm": 1.6634731523504978, "learning_rate": 2.980053678826617e-07, "loss": 0.5437, "step": 7449 }, { "epoch": 0.6873486333756199, "grad_norm": 2.4695549454888877, "learning_rate": 2.978450415140222e-07, "loss": 0.7498, "step": 7450 }, { "epoch": 0.6873486333756199, "eval_GEN Loss": 0.4392330050468445, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3310582637786865, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8121694922447205, "eval_runtime": 57.18, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7450 }, { "epoch": 0.6874408949371468, "grad_norm": 2.865838244621695, "learning_rate": 2.9768474479268033e-07, "loss": 0.7266, "step": 7451 }, { "epoch": 0.6875331564986737, "grad_norm": 2.714059419289642, "learning_rate": 2.975244777331618e-07, "loss": 0.8567, "step": 7452 }, { "epoch": 0.6876254180602007, "grad_norm": 2.627169507795024, "learning_rate": 2.973642403499906e-07, "loss": 0.828, "step": 7453 }, { "epoch": 0.6877176796217276, "grad_norm": 2.0707591206638605, "learning_rate": 2.9720403265768784e-07, "loss": 0.5244, "step": 7454 }, { "epoch": 0.6878099411832546, "grad_norm": 2.7358798118031245, "learning_rate": 2.9704385467077113e-07, "loss": 0.6428, "step": 7455 }, { "epoch": 0.6878099411832546, "eval_GEN Loss": 0.43971163034439087, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32870322465896606, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8088040947914124, "eval_runtime": 57.0325, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7455 }, { "epoch": 0.6879022027447814, "grad_norm": 1.3018241181961066, "learning_rate": 2.9688370640375704e-07, "loss": 0.4546, "step": 7456 }, { "epoch": 0.6879944643063084, "grad_norm": 2.1639416041995103, "learning_rate": 2.967235878711577e-07, "loss": 0.6205, "step": 7457 }, { "epoch": 0.6880867258678353, "grad_norm": 2.0049333849396223, "learning_rate": 2.9656349908748367e-07, "loss": 0.6422, "step": 7458 }, { "epoch": 0.6881789874293622, "grad_norm": 1.2430100676856544, "learning_rate": 2.96403440067242e-07, "loss": 0.5156, "step": 7459 }, { "epoch": 0.6882712489908892, "grad_norm": 1.7488665395385503, "learning_rate": 2.962434108249382e-07, "loss": 0.5873, "step": 7460 }, { "epoch": 0.6882712489908892, "eval_GEN Loss": 0.4398549795150757, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3270803987979889, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8104567527770996, "eval_runtime": 57.0278, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7460 }, { "epoch": 0.6883635105524161, "grad_norm": 3.2147053810898925, "learning_rate": 2.9608341137507373e-07, "loss": 0.8856, "step": 7461 }, { "epoch": 0.688455772113943, "grad_norm": 2.603514346334395, "learning_rate": 2.959234417321483e-07, "loss": 0.5457, "step": 7462 }, { "epoch": 0.6885480336754699, "grad_norm": 2.0708687772966754, "learning_rate": 2.9576350191065877e-07, "loss": 0.7267, "step": 7463 }, { "epoch": 0.6886402952369969, "grad_norm": 1.947227763286897, "learning_rate": 2.9560359192509866e-07, "loss": 0.6254, "step": 7464 }, { "epoch": 0.6887325567985239, "grad_norm": 1.8809315518879337, "learning_rate": 2.9544371178995973e-07, "loss": 0.7662, "step": 7465 }, { "epoch": 0.6887325567985239, "eval_GEN Loss": 0.4394494295120239, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32821106910705566, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8064302802085876, "eval_runtime": 57.2452, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7465 }, { "epoch": 0.6888248183600507, "grad_norm": 2.1186571424818106, "learning_rate": 2.9528386151972995e-07, "loss": 0.7654, "step": 7466 }, { "epoch": 0.6889170799215777, "grad_norm": 2.6746994200029377, "learning_rate": 2.951240411288961e-07, "loss": 0.5277, "step": 7467 }, { "epoch": 0.6890093414831046, "grad_norm": 2.424669696119, "learning_rate": 2.9496425063194063e-07, "loss": 0.7954, "step": 7468 }, { "epoch": 0.6891016030446315, "grad_norm": 1.8781039549205618, "learning_rate": 2.9480449004334453e-07, "loss": 0.7595, "step": 7469 }, { "epoch": 0.6891938646061585, "grad_norm": 2.3835750835870027, "learning_rate": 2.9464475937758474e-07, "loss": 0.7924, "step": 7470 }, { "epoch": 0.6891938646061585, "eval_GEN Loss": 0.4397251605987549, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3318486213684082, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8059194684028625, "eval_runtime": 57.1679, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7470 }, { "epoch": 0.6892861261676854, "grad_norm": 2.012286580014358, "learning_rate": 2.944850586491373e-07, "loss": 0.602, "step": 7471 }, { "epoch": 0.6893783877292123, "grad_norm": 1.560065035350559, "learning_rate": 2.943253878724739e-07, "loss": 0.525, "step": 7472 }, { "epoch": 0.6894706492907392, "grad_norm": 1.7853306509685332, "learning_rate": 2.941657470620643e-07, "loss": 0.6045, "step": 7473 }, { "epoch": 0.6895629108522662, "grad_norm": 1.763333611502238, "learning_rate": 2.9400613623237574e-07, "loss": 0.7346, "step": 7474 }, { "epoch": 0.6896551724137931, "grad_norm": 1.9822505114488693, "learning_rate": 2.938465553978718e-07, "loss": 0.629, "step": 7475 }, { "epoch": 0.6896551724137931, "eval_GEN Loss": 0.4390304386615753, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3411422669887543, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8048377633094788, "eval_runtime": 57.3905, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7475 }, { "epoch": 0.68974743397532, "grad_norm": 2.5217416802683195, "learning_rate": 2.936870045730145e-07, "loss": 0.6452, "step": 7476 }, { "epoch": 0.689839695536847, "grad_norm": 3.0845404950934894, "learning_rate": 2.935274837722619e-07, "loss": 0.56, "step": 7477 }, { "epoch": 0.6899319570983738, "grad_norm": 1.9825284638560812, "learning_rate": 2.933679930100709e-07, "loss": 0.764, "step": 7478 }, { "epoch": 0.6900242186599008, "grad_norm": 2.141974548801707, "learning_rate": 2.9320853230089415e-07, "loss": 0.5943, "step": 7479 }, { "epoch": 0.6901164802214278, "grad_norm": 1.5143085554050624, "learning_rate": 2.930491016591825e-07, "loss": 0.6813, "step": 7480 }, { "epoch": 0.6901164802214278, "eval_GEN Loss": 0.4401601254940033, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.34517011046409607, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8061598539352417, "eval_runtime": 57.2052, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7480 }, { "epoch": 0.6902087417829547, "grad_norm": 1.2590864373903046, "learning_rate": 2.928897010993837e-07, "loss": 0.4633, "step": 7481 }, { "epoch": 0.6903010033444816, "grad_norm": 2.6133337026113144, "learning_rate": 2.927303306359432e-07, "loss": 0.7002, "step": 7482 }, { "epoch": 0.6903932649060085, "grad_norm": 1.9786609901284273, "learning_rate": 2.9257099028330284e-07, "loss": 0.6476, "step": 7483 }, { "epoch": 0.6904855264675355, "grad_norm": 1.7762419858222276, "learning_rate": 2.924116800559027e-07, "loss": 0.5108, "step": 7484 }, { "epoch": 0.6905777880290624, "grad_norm": 3.563373615574328, "learning_rate": 2.922523999681796e-07, "loss": 0.6345, "step": 7485 }, { "epoch": 0.6905777880290624, "eval_GEN Loss": 0.4398023784160614, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 Neg": 0.6, "eval_PRM Loss": 0.3448041081428528, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8070011734962463, "eval_runtime": 57.1436, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7485 }, { "epoch": 0.6906700495905893, "grad_norm": 3.7431584196992858, "learning_rate": 2.920931500345679e-07, "loss": 0.7269, "step": 7486 }, { "epoch": 0.6907623111521163, "grad_norm": 2.093250248753236, "learning_rate": 2.919339302694988e-07, "loss": 0.6387, "step": 7487 }, { "epoch": 0.6908545727136431, "grad_norm": 2.834463820544003, "learning_rate": 2.9177474068740113e-07, "loss": 0.8767, "step": 7488 }, { "epoch": 0.6909468342751701, "grad_norm": 2.0880975779406055, "learning_rate": 2.916155813027013e-07, "loss": 0.7306, "step": 7489 }, { "epoch": 0.691039095836697, "grad_norm": 2.05313319325119, "learning_rate": 2.9145645212982187e-07, "loss": 0.6842, "step": 7490 }, { "epoch": 0.691039095836697, "eval_GEN Loss": 0.4405510723590851, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.34308189153671265, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8056490421295166, "eval_runtime": 57.288, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7490 }, { "epoch": 0.691131357398224, "grad_norm": 2.01335825760001, "learning_rate": 2.9129735318318385e-07, "loss": 0.5891, "step": 7491 }, { "epoch": 0.6912236189597509, "grad_norm": 1.5879719465116569, "learning_rate": 2.911382844772049e-07, "loss": 0.5602, "step": 7492 }, { "epoch": 0.6913158805212778, "grad_norm": 2.019962932927662, "learning_rate": 2.9097924602630037e-07, "loss": 0.6608, "step": 7493 }, { "epoch": 0.6914081420828048, "grad_norm": 2.393444467150143, "learning_rate": 2.908202378448818e-07, "loss": 0.6543, "step": 7494 }, { "epoch": 0.6915004036443316, "grad_norm": 2.3942528146431457, "learning_rate": 2.9066125994735987e-07, "loss": 0.564, "step": 7495 }, { "epoch": 0.6915004036443316, "eval_GEN Loss": 0.440162718296051, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3388652205467224, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8087740540504456, "eval_runtime": 57.257, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7495 }, { "epoch": 0.6915926652058586, "grad_norm": 3.374217629354594, "learning_rate": 2.9050231234814053e-07, "loss": 0.845, "step": 7496 }, { "epoch": 0.6916849267673856, "grad_norm": 1.8808935519656043, "learning_rate": 2.9034339506162834e-07, "loss": 0.6583, "step": 7497 }, { "epoch": 0.6917771883289124, "grad_norm": 2.1440017024082274, "learning_rate": 2.901845081022243e-07, "loss": 0.6157, "step": 7498 }, { "epoch": 0.6918694498904394, "grad_norm": 2.15434128163714, "learning_rate": 2.9002565148432704e-07, "loss": 0.6915, "step": 7499 }, { "epoch": 0.6919617114519663, "grad_norm": 1.6696731814521717, "learning_rate": 2.898668252223328e-07, "loss": 0.5752, "step": 7500 }, { "epoch": 0.6919617114519663, "eval_GEN Loss": 0.43915772438049316, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3373815715312958, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8073918223381042, "eval_runtime": 57.1429, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7500 }, { "epoch": 0.6920539730134933, "grad_norm": 1.6245884881499242, "learning_rate": 2.897080293306341e-07, "loss": 0.4783, "step": 7501 }, { "epoch": 0.6921462345750202, "grad_norm": 2.269791291880906, "learning_rate": 2.8954926382362156e-07, "loss": 0.6182, "step": 7502 }, { "epoch": 0.6922384961365471, "grad_norm": 3.1511587775076206, "learning_rate": 2.893905287156828e-07, "loss": 0.5885, "step": 7503 }, { "epoch": 0.6923307576980741, "grad_norm": 1.9645861343129774, "learning_rate": 2.8923182402120277e-07, "loss": 0.6398, "step": 7504 }, { "epoch": 0.6924230192596009, "grad_norm": 1.9727199598205378, "learning_rate": 2.8907314975456286e-07, "loss": 0.6809, "step": 7505 }, { "epoch": 0.6924230192596009, "eval_GEN Loss": 0.4399043321609497, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3374497890472412, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8123798370361328, "eval_runtime": 57.3207, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7505 }, { "epoch": 0.6925152808211279, "grad_norm": 2.6798203215717584, "learning_rate": 2.8891450593014334e-07, "loss": 0.6288, "step": 7506 }, { "epoch": 0.6926075423826549, "grad_norm": 2.1524107833195267, "learning_rate": 2.8875589256232005e-07, "loss": 0.6601, "step": 7507 }, { "epoch": 0.6926998039441817, "grad_norm": 2.117995440570148, "learning_rate": 2.885973096654673e-07, "loss": 0.7752, "step": 7508 }, { "epoch": 0.6927920655057087, "grad_norm": 1.7555838779860946, "learning_rate": 2.884387572539556e-07, "loss": 0.5889, "step": 7509 }, { "epoch": 0.6928843270672356, "grad_norm": 2.1630525419281375, "learning_rate": 2.882802353421535e-07, "loss": 0.6541, "step": 7510 }, { "epoch": 0.6928843270672356, "eval_GEN Loss": 0.44007331132888794, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3417389988899231, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8130708932876587, "eval_runtime": 56.7462, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 7510 }, { "epoch": 0.6929765886287625, "grad_norm": 1.683892199108229, "learning_rate": 2.881217439444267e-07, "loss": 0.6574, "step": 7511 }, { "epoch": 0.6930688501902895, "grad_norm": 2.568314285014365, "learning_rate": 2.8796328307513727e-07, "loss": 0.8007, "step": 7512 }, { "epoch": 0.6931611117518164, "grad_norm": 2.4423850648308902, "learning_rate": 2.878048527486461e-07, "loss": 0.6994, "step": 7513 }, { "epoch": 0.6932533733133434, "grad_norm": 2.663619849768364, "learning_rate": 2.8764645297930964e-07, "loss": 0.5898, "step": 7514 }, { "epoch": 0.6933456348748702, "grad_norm": 1.750469032278258, "learning_rate": 2.874880837814829e-07, "loss": 0.6805, "step": 7515 }, { "epoch": 0.6933456348748702, "eval_GEN Loss": 0.439759761095047, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3428731858730316, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8096754550933838, "eval_runtime": 57.0813, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7515 }, { "epoch": 0.6934378964363972, "grad_norm": 2.2235736954521386, "learning_rate": 2.873297451695168e-07, "loss": 0.7647, "step": 7516 }, { "epoch": 0.6935301579979242, "grad_norm": 3.2919016793801745, "learning_rate": 2.8717143715776107e-07, "loss": 0.5607, "step": 7517 }, { "epoch": 0.693622419559451, "grad_norm": 1.665573955728799, "learning_rate": 2.870131597605613e-07, "loss": 0.4429, "step": 7518 }, { "epoch": 0.693714681120978, "grad_norm": 2.1660252974413052, "learning_rate": 2.8685491299226096e-07, "loss": 0.726, "step": 7519 }, { "epoch": 0.6938069426825049, "grad_norm": 1.4886577554215572, "learning_rate": 2.8669669686720093e-07, "loss": 0.7032, "step": 7520 }, { "epoch": 0.6938069426825049, "eval_GEN Loss": 0.4392464756965637, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3417656719684601, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8058293461799622, "eval_runtime": 56.303, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 7520 }, { "epoch": 0.6938992042440318, "grad_norm": 3.2967141345037745, "learning_rate": 2.865385113997185e-07, "loss": 0.8354, "step": 7521 }, { "epoch": 0.6939914658055587, "grad_norm": 1.8332924562743358, "learning_rate": 2.8638035660414887e-07, "loss": 0.5885, "step": 7522 }, { "epoch": 0.6940837273670857, "grad_norm": 2.5087808160300336, "learning_rate": 2.8622223249482434e-07, "loss": 0.7764, "step": 7523 }, { "epoch": 0.6941759889286127, "grad_norm": 2.3986879091839826, "learning_rate": 2.860641390860745e-07, "loss": 0.7453, "step": 7524 }, { "epoch": 0.6942682504901395, "grad_norm": 1.8451992483550603, "learning_rate": 2.8590607639222576e-07, "loss": 0.7127, "step": 7525 }, { "epoch": 0.6942682504901395, "eval_GEN Loss": 0.4395827651023865, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33759990334510803, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.805468738079071, "eval_runtime": 56.2382, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 7525 }, { "epoch": 0.6943605120516665, "grad_norm": 2.3363196596622595, "learning_rate": 2.8574804442760227e-07, "loss": 0.6654, "step": 7526 }, { "epoch": 0.6944527736131934, "grad_norm": 1.6371367332632645, "learning_rate": 2.855900432065246e-07, "loss": 0.6111, "step": 7527 }, { "epoch": 0.6945450351747203, "grad_norm": 2.4302014233551, "learning_rate": 2.8543207274331184e-07, "loss": 0.6878, "step": 7528 }, { "epoch": 0.6946372967362473, "grad_norm": 1.7575072992158154, "learning_rate": 2.8527413305227895e-07, "loss": 0.6393, "step": 7529 }, { "epoch": 0.6947295582977742, "grad_norm": 2.910765612773316, "learning_rate": 2.8511622414773876e-07, "loss": 0.6748, "step": 7530 }, { "epoch": 0.6947295582977742, "eval_GEN Loss": 0.43982282280921936, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33666208386421204, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8046875, "eval_runtime": 56.3146, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 7530 }, { "epoch": 0.6948218198593011, "grad_norm": 2.5400465915505452, "learning_rate": 2.8495834604400147e-07, "loss": 0.6118, "step": 7531 }, { "epoch": 0.694914081420828, "grad_norm": 1.5603651277101673, "learning_rate": 2.848004987553742e-07, "loss": 0.5231, "step": 7532 }, { "epoch": 0.695006342982355, "grad_norm": 1.7342208452353236, "learning_rate": 2.846426822961611e-07, "loss": 0.5314, "step": 7533 }, { "epoch": 0.695098604543882, "grad_norm": 1.5809347809148102, "learning_rate": 2.8448489668066375e-07, "loss": 0.6354, "step": 7534 }, { "epoch": 0.6951908661054088, "grad_norm": 2.5094743981854437, "learning_rate": 2.843271419231813e-07, "loss": 0.6299, "step": 7535 }, { "epoch": 0.6951908661054088, "eval_GEN Loss": 0.4391185939311981, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33054372668266296, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8004807829856873, "eval_runtime": 57.3099, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7535 }, { "epoch": 0.6952831276669358, "grad_norm": 2.7477738576700848, "learning_rate": 2.841694180380093e-07, "loss": 0.851, "step": 7536 }, { "epoch": 0.6953753892284626, "grad_norm": 2.3073939120897378, "learning_rate": 2.840117250394411e-07, "loss": 0.6043, "step": 7537 }, { "epoch": 0.6954676507899896, "grad_norm": 2.064727967392344, "learning_rate": 2.838540629417671e-07, "loss": 0.648, "step": 7538 }, { "epoch": 0.6955599123515166, "grad_norm": 2.026956585519375, "learning_rate": 2.836964317592751e-07, "loss": 0.5733, "step": 7539 }, { "epoch": 0.6956521739130435, "grad_norm": 1.8219948536853483, "learning_rate": 2.835388315062494e-07, "loss": 0.6712, "step": 7540 }, { "epoch": 0.6956521739130435, "eval_GEN Loss": 0.4391144812107086, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32557055354118347, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7981970906257629, "eval_runtime": 57.3094, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7540 }, { "epoch": 0.6957444354745704, "grad_norm": 2.7167957588790617, "learning_rate": 2.8338126219697234e-07, "loss": 0.7761, "step": 7541 }, { "epoch": 0.6958366970360973, "grad_norm": 3.5704367229779255, "learning_rate": 2.83223723845723e-07, "loss": 0.8931, "step": 7542 }, { "epoch": 0.6959289585976243, "grad_norm": 1.5419405534273594, "learning_rate": 2.8306621646677793e-07, "loss": 0.5808, "step": 7543 }, { "epoch": 0.6960212201591512, "grad_norm": 3.0927949263060808, "learning_rate": 2.829087400744104e-07, "loss": 0.791, "step": 7544 }, { "epoch": 0.6961134817206781, "grad_norm": 2.3103434583688056, "learning_rate": 2.827512946828912e-07, "loss": 0.7519, "step": 7545 }, { "epoch": 0.6961134817206781, "eval_GEN Loss": 0.4376736581325531, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.327210009098053, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7939903736114502, "eval_runtime": 57.4894, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 7545 }, { "epoch": 0.6962057432822051, "grad_norm": 1.7400780496018629, "learning_rate": 2.825938803064887e-07, "loss": 0.5592, "step": 7546 }, { "epoch": 0.6962980048437319, "grad_norm": 2.212813387083588, "learning_rate": 2.8243649695946744e-07, "loss": 0.7971, "step": 7547 }, { "epoch": 0.6963902664052589, "grad_norm": 1.5903994703848474, "learning_rate": 2.8227914465609004e-07, "loss": 0.6491, "step": 7548 }, { "epoch": 0.6964825279667859, "grad_norm": 4.678151213691483, "learning_rate": 2.82121823410616e-07, "loss": 0.6383, "step": 7549 }, { "epoch": 0.6965747895283128, "grad_norm": 2.021743357429596, "learning_rate": 2.819645332373023e-07, "loss": 0.7297, "step": 7550 }, { "epoch": 0.6965747895283128, "eval_GEN Loss": 0.4387027621269226, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3356570601463318, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.796875, "eval_runtime": 57.0636, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7550 }, { "epoch": 0.6966670510898397, "grad_norm": 2.2035165036174185, "learning_rate": 2.81807274150402e-07, "loss": 0.6485, "step": 7551 }, { "epoch": 0.6967593126513666, "grad_norm": 1.881352443986148, "learning_rate": 2.8165004616416726e-07, "loss": 0.656, "step": 7552 }, { "epoch": 0.6968515742128936, "grad_norm": 3.350289312564557, "learning_rate": 2.814928492928455e-07, "loss": 0.869, "step": 7553 }, { "epoch": 0.6969438357744204, "grad_norm": 2.0974807565012688, "learning_rate": 2.8133568355068266e-07, "loss": 0.588, "step": 7554 }, { "epoch": 0.6970360973359474, "grad_norm": 1.8979441207256462, "learning_rate": 2.811785489519209e-07, "loss": 0.697, "step": 7555 }, { "epoch": 0.6970360973359474, "eval_GEN Loss": 0.4389715790748596, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33826935291290283, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7978065013885498, "eval_runtime": 57.0157, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7555 }, { "epoch": 0.6971283588974744, "grad_norm": 2.1253924417002095, "learning_rate": 2.810214455108001e-07, "loss": 0.5855, "step": 7556 }, { "epoch": 0.6972206204590012, "grad_norm": 2.3464325305413594, "learning_rate": 2.808643732415575e-07, "loss": 0.8686, "step": 7557 }, { "epoch": 0.6973128820205282, "grad_norm": 1.7732654036899183, "learning_rate": 2.8070733215842723e-07, "loss": 0.5541, "step": 7558 }, { "epoch": 0.6974051435820551, "grad_norm": 2.1535046280742765, "learning_rate": 2.8055032227564025e-07, "loss": 0.917, "step": 7559 }, { "epoch": 0.697497405143582, "grad_norm": 2.281942969246904, "learning_rate": 2.803933436074252e-07, "loss": 0.8135, "step": 7560 }, { "epoch": 0.697497405143582, "eval_GEN Loss": 0.43900319933891296, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3349604308605194, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8009615540504456, "eval_runtime": 57.3047, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7560 }, { "epoch": 0.697589666705109, "grad_norm": 3.103502035080762, "learning_rate": 2.80236396168008e-07, "loss": 0.7307, "step": 7561 }, { "epoch": 0.6976819282666359, "grad_norm": 2.2612707683105, "learning_rate": 2.8007947997161076e-07, "loss": 0.7328, "step": 7562 }, { "epoch": 0.6977741898281629, "grad_norm": 1.7683457408365593, "learning_rate": 2.7992259503245446e-07, "loss": 0.7037, "step": 7563 }, { "epoch": 0.6978664513896897, "grad_norm": 2.592650305058427, "learning_rate": 2.797657413647555e-07, "loss": 0.8442, "step": 7564 }, { "epoch": 0.6979587129512167, "grad_norm": 3.9616775664721255, "learning_rate": 2.796089189827288e-07, "loss": 0.7498, "step": 7565 }, { "epoch": 0.6979587129512167, "eval_GEN Loss": 0.43819233775138855, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33212894201278687, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.799098551273346, "eval_runtime": 57.2415, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7565 }, { "epoch": 0.6980509745127437, "grad_norm": 2.3241568906531933, "learning_rate": 2.79452127900585e-07, "loss": 0.721, "step": 7566 }, { "epoch": 0.6981432360742705, "grad_norm": 2.7261748788169315, "learning_rate": 2.7929536813253366e-07, "loss": 0.4759, "step": 7567 }, { "epoch": 0.6982354976357975, "grad_norm": 1.6183222041174643, "learning_rate": 2.7913863969278e-07, "loss": 0.8232, "step": 7568 }, { "epoch": 0.6983277591973244, "grad_norm": 1.915544340975291, "learning_rate": 2.7898194259552724e-07, "loss": 0.7024, "step": 7569 }, { "epoch": 0.6984200207588513, "grad_norm": 2.2694936416954588, "learning_rate": 2.7882527685497566e-07, "loss": 0.678, "step": 7570 }, { "epoch": 0.6984200207588513, "eval_GEN Loss": 0.4389684200286865, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3301727771759033, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8001502156257629, "eval_runtime": 57.3064, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7570 }, { "epoch": 0.6985122823203783, "grad_norm": 1.6250339106643379, "learning_rate": 2.7866864248532223e-07, "loss": 0.6159, "step": 7571 }, { "epoch": 0.6986045438819052, "grad_norm": 1.9609389419123828, "learning_rate": 2.785120395007617e-07, "loss": 0.5341, "step": 7572 }, { "epoch": 0.6986968054434322, "grad_norm": 1.70686529685266, "learning_rate": 2.783554679154851e-07, "loss": 0.6643, "step": 7573 }, { "epoch": 0.698789067004959, "grad_norm": 1.5470337996859067, "learning_rate": 2.781989277436821e-07, "loss": 0.6096, "step": 7574 }, { "epoch": 0.698881328566486, "grad_norm": 2.3677446773922446, "learning_rate": 2.7804241899953795e-07, "loss": 0.6635, "step": 7575 }, { "epoch": 0.698881328566486, "eval_GEN Loss": 0.438372403383255, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3274807035923004, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.799879789352417, "eval_runtime": 57.2846, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7575 }, { "epoch": 0.698973590128013, "grad_norm": 2.307816836126703, "learning_rate": 2.7788594169723586e-07, "loss": 0.5825, "step": 7576 }, { "epoch": 0.6990658516895398, "grad_norm": 1.9345357062764776, "learning_rate": 2.777294958509561e-07, "loss": 0.7381, "step": 7577 }, { "epoch": 0.6991581132510668, "grad_norm": 1.5241800598967488, "learning_rate": 2.7757308147487623e-07, "loss": 0.703, "step": 7578 }, { "epoch": 0.6992503748125937, "grad_norm": 1.5911593811211773, "learning_rate": 2.774166985831704e-07, "loss": 0.465, "step": 7579 }, { "epoch": 0.6993426363741206, "grad_norm": 1.9878473815037463, "learning_rate": 2.772603471900104e-07, "loss": 0.5695, "step": 7580 }, { "epoch": 0.6993426363741206, "eval_GEN Loss": 0.43851327896118164, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32270532846450806, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8001803159713745, "eval_runtime": 57.2721, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7580 }, { "epoch": 0.6994348979356476, "grad_norm": 2.5556382617820903, "learning_rate": 2.771040273095654e-07, "loss": 0.7856, "step": 7581 }, { "epoch": 0.6995271594971745, "grad_norm": 2.536060359025665, "learning_rate": 2.769477389560007e-07, "loss": 0.9353, "step": 7582 }, { "epoch": 0.6996194210587015, "grad_norm": 1.7812945911802125, "learning_rate": 2.7679148214347987e-07, "loss": 0.6257, "step": 7583 }, { "epoch": 0.6997116826202283, "grad_norm": 2.4142251446142717, "learning_rate": 2.766352568861629e-07, "loss": 0.5825, "step": 7584 }, { "epoch": 0.6998039441817553, "grad_norm": 1.8492176622899588, "learning_rate": 2.764790631982076e-07, "loss": 0.6478, "step": 7585 }, { "epoch": 0.6998039441817553, "eval_GEN Loss": 0.4386636018753052, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32350003719329834, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8044771552085876, "eval_runtime": 57.0882, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7585 }, { "epoch": 0.6998962057432822, "grad_norm": 1.1945552430675297, "learning_rate": 2.7632290109376794e-07, "loss": 0.4752, "step": 7586 }, { "epoch": 0.6999884673048091, "grad_norm": 1.6479939516371747, "learning_rate": 2.7616677058699574e-07, "loss": 0.639, "step": 7587 }, { "epoch": 0.7000807288663361, "grad_norm": 3.4807973669697945, "learning_rate": 2.7601067169203994e-07, "loss": 1.069, "step": 7588 }, { "epoch": 0.700172990427863, "grad_norm": 1.5849938138715953, "learning_rate": 2.758546044230465e-07, "loss": 0.4067, "step": 7589 }, { "epoch": 0.7002652519893899, "grad_norm": 1.807531866350162, "learning_rate": 2.7569856879415825e-07, "loss": 0.6809, "step": 7590 }, { "epoch": 0.7002652519893899, "eval_GEN Loss": 0.4381018579006195, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3218788504600525, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8021634817123413, "eval_runtime": 57.4316, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 7590 }, { "epoch": 0.7003575135509168, "grad_norm": 2.1599646725745743, "learning_rate": 2.755425648195155e-07, "loss": 0.5768, "step": 7591 }, { "epoch": 0.7004497751124438, "grad_norm": 1.95349126642436, "learning_rate": 2.7538659251325575e-07, "loss": 0.6156, "step": 7592 }, { "epoch": 0.7005420366739707, "grad_norm": 2.6040036795310204, "learning_rate": 2.7523065188951307e-07, "loss": 0.8779, "step": 7593 }, { "epoch": 0.7006342982354976, "grad_norm": 1.9784404777726183, "learning_rate": 2.7507474296241925e-07, "loss": 0.7191, "step": 7594 }, { "epoch": 0.7007265597970246, "grad_norm": 1.6573487270605507, "learning_rate": 2.749188657461031e-07, "loss": 0.8185, "step": 7595 }, { "epoch": 0.7007265597970246, "eval_GEN Loss": 0.43835094571113586, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32362157106399536, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8028244972229004, "eval_runtime": 57.0005, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7595 }, { "epoch": 0.7008188213585514, "grad_norm": 1.431663670532779, "learning_rate": 2.7476302025469053e-07, "loss": 0.6303, "step": 7596 }, { "epoch": 0.7009110829200784, "grad_norm": 4.072024219165664, "learning_rate": 2.7460720650230417e-07, "loss": 0.8401, "step": 7597 }, { "epoch": 0.7010033444816054, "grad_norm": 1.8819109310345739, "learning_rate": 2.744514245030642e-07, "loss": 0.8384, "step": 7598 }, { "epoch": 0.7010956060431323, "grad_norm": 3.287266951776461, "learning_rate": 2.7429567427108796e-07, "loss": 0.786, "step": 7599 }, { "epoch": 0.7011878676046592, "grad_norm": 2.4853890608069062, "learning_rate": 2.741399558204899e-07, "loss": 0.6396, "step": 7600 }, { "epoch": 0.7011878676046592, "eval_GEN Loss": 0.43820497393608093, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32750800251960754, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7963041067123413, "eval_runtime": 57.1651, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7600 }, { "epoch": 0.7012801291661861, "grad_norm": 1.9097772452643222, "learning_rate": 2.7398426916538096e-07, "loss": 0.6248, "step": 7601 }, { "epoch": 0.7013723907277131, "grad_norm": 1.872796281608114, "learning_rate": 2.7382861431987046e-07, "loss": 0.6685, "step": 7602 }, { "epoch": 0.70146465228924, "grad_norm": 2.392567843650792, "learning_rate": 2.7367299129806347e-07, "loss": 0.6434, "step": 7603 }, { "epoch": 0.7015569138507669, "grad_norm": 1.629398161368014, "learning_rate": 2.7351740011406317e-07, "loss": 0.6144, "step": 7604 }, { "epoch": 0.7016491754122939, "grad_norm": 1.7778891732484896, "learning_rate": 2.733618407819692e-07, "loss": 0.6356, "step": 7605 }, { "epoch": 0.7016491754122939, "eval_GEN Loss": 0.4385720491409302, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33266720175743103, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7938401699066162, "eval_runtime": 57.2345, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7605 }, { "epoch": 0.7017414369738207, "grad_norm": 2.4592888395731043, "learning_rate": 2.7320631331587856e-07, "loss": 0.725, "step": 7606 }, { "epoch": 0.7018336985353477, "grad_norm": 2.6327454442100375, "learning_rate": 2.730508177298859e-07, "loss": 0.7072, "step": 7607 }, { "epoch": 0.7019259600968747, "grad_norm": 1.4306806312353348, "learning_rate": 2.7289535403808154e-07, "loss": 0.5921, "step": 7608 }, { "epoch": 0.7020182216584016, "grad_norm": 1.7154771439450527, "learning_rate": 2.727399222545549e-07, "loss": 0.6788, "step": 7609 }, { "epoch": 0.7021104832199285, "grad_norm": 1.9884976434528727, "learning_rate": 2.725845223933908e-07, "loss": 0.7499, "step": 7610 }, { "epoch": 0.7021104832199285, "eval_GEN Loss": 0.4384738504886627, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3373554050922394, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7972956895828247, "eval_runtime": 57.3193, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7610 }, { "epoch": 0.7022027447814554, "grad_norm": 1.5095916429586789, "learning_rate": 2.7242915446867224e-07, "loss": 0.5848, "step": 7611 }, { "epoch": 0.7022950063429824, "grad_norm": 2.9527139700617693, "learning_rate": 2.7227381849447816e-07, "loss": 0.8709, "step": 7612 }, { "epoch": 0.7023872679045093, "grad_norm": 2.5684032306567564, "learning_rate": 2.721185144848863e-07, "loss": 0.7449, "step": 7613 }, { "epoch": 0.7024795294660362, "grad_norm": 2.609582389516733, "learning_rate": 2.719632424539698e-07, "loss": 0.8001, "step": 7614 }, { "epoch": 0.7025717910275632, "grad_norm": 1.9537147193180695, "learning_rate": 2.718080024158003e-07, "loss": 0.6482, "step": 7615 }, { "epoch": 0.7025717910275632, "eval_GEN Loss": 0.4381050765514374, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34338268637657166, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.796604573726654, "eval_runtime": 57.3795, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7615 }, { "epoch": 0.70266405258909, "grad_norm": 2.3285979128000767, "learning_rate": 2.716527943844453e-07, "loss": 0.6852, "step": 7616 }, { "epoch": 0.702756314150617, "grad_norm": 2.129961572231308, "learning_rate": 2.7149761837397024e-07, "loss": 0.6073, "step": 7617 }, { "epoch": 0.7028485757121439, "grad_norm": 1.9645372306962223, "learning_rate": 2.713424743984376e-07, "loss": 0.5078, "step": 7618 }, { "epoch": 0.7029408372736708, "grad_norm": 2.5046292564812838, "learning_rate": 2.7118736247190624e-07, "loss": 0.6878, "step": 7619 }, { "epoch": 0.7030330988351978, "grad_norm": 1.7337385331115687, "learning_rate": 2.7103228260843333e-07, "loss": 0.7527, "step": 7620 }, { "epoch": 0.7030330988351978, "eval_GEN Loss": 0.4380924105644226, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3494049608707428, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7964242696762085, "eval_runtime": 57.1158, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7620 }, { "epoch": 0.7031253603967247, "grad_norm": 2.3501820457309823, "learning_rate": 2.70877234822072e-07, "loss": 0.6101, "step": 7621 }, { "epoch": 0.7032176219582517, "grad_norm": 2.3037379050897497, "learning_rate": 2.7072221912687323e-07, "loss": 0.7454, "step": 7622 }, { "epoch": 0.7033098835197785, "grad_norm": 2.392313133182807, "learning_rate": 2.705672355368842e-07, "loss": 0.554, "step": 7623 }, { "epoch": 0.7034021450813055, "grad_norm": 1.7505749008516729, "learning_rate": 2.7041228406615054e-07, "loss": 0.6268, "step": 7624 }, { "epoch": 0.7034944066428325, "grad_norm": 1.8664811847962115, "learning_rate": 2.7025736472871373e-07, "loss": 0.5683, "step": 7625 }, { "epoch": 0.7034944066428325, "eval_GEN Loss": 0.4381406009197235, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.35133031010627747, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7952223420143127, "eval_runtime": 57.121, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7625 }, { "epoch": 0.7035866682043593, "grad_norm": 2.301278493092115, "learning_rate": 2.7010247753861274e-07, "loss": 0.7671, "step": 7626 }, { "epoch": 0.7036789297658863, "grad_norm": 1.7349255862297581, "learning_rate": 2.699476225098842e-07, "loss": 0.6102, "step": 7627 }, { "epoch": 0.7037711913274132, "grad_norm": 1.8297146790970835, "learning_rate": 2.697927996565607e-07, "loss": 0.677, "step": 7628 }, { "epoch": 0.7038634528889401, "grad_norm": 2.3700676910938885, "learning_rate": 2.696380089926728e-07, "loss": 0.6403, "step": 7629 }, { "epoch": 0.7039557144504671, "grad_norm": 2.058965038851938, "learning_rate": 2.694832505322479e-07, "loss": 0.6637, "step": 7630 }, { "epoch": 0.7039557144504671, "eval_GEN Loss": 0.4379960000514984, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3428812325000763, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7909255027770996, "eval_runtime": 57.0235, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7630 }, { "epoch": 0.704047976011994, "grad_norm": 2.03485380241862, "learning_rate": 2.693285242893106e-07, "loss": 0.645, "step": 7631 }, { "epoch": 0.704140237573521, "grad_norm": 1.7534059347330075, "learning_rate": 2.6917383027788207e-07, "loss": 0.5817, "step": 7632 }, { "epoch": 0.7042324991350478, "grad_norm": 1.5897813180221276, "learning_rate": 2.6901916851198113e-07, "loss": 0.5546, "step": 7633 }, { "epoch": 0.7043247606965748, "grad_norm": 1.638582355383271, "learning_rate": 2.688645390056234e-07, "loss": 0.6408, "step": 7634 }, { "epoch": 0.7044170222581018, "grad_norm": 1.4741452221840952, "learning_rate": 2.68709941772822e-07, "loss": 0.4971, "step": 7635 }, { "epoch": 0.7044170222581018, "eval_GEN Loss": 0.43760815262794495, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3405035138130188, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7891225814819336, "eval_runtime": 57.2344, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7635 }, { "epoch": 0.7045092838196286, "grad_norm": 2.6370957273502214, "learning_rate": 2.6855537682758626e-07, "loss": 0.69, "step": 7636 }, { "epoch": 0.7046015453811556, "grad_norm": 1.5281461543003703, "learning_rate": 2.684008441839233e-07, "loss": 0.6638, "step": 7637 }, { "epoch": 0.7046938069426825, "grad_norm": 2.0454341215460237, "learning_rate": 2.682463438558371e-07, "loss": 0.7767, "step": 7638 }, { "epoch": 0.7047860685042094, "grad_norm": 2.099503345562081, "learning_rate": 2.680918758573291e-07, "loss": 0.6436, "step": 7639 }, { "epoch": 0.7048783300657364, "grad_norm": 1.8070594087288365, "learning_rate": 2.6793744020239676e-07, "loss": 0.6048, "step": 7640 }, { "epoch": 0.7048783300657364, "eval_GEN Loss": 0.4382171034812927, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3356093168258667, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7928786277770996, "eval_runtime": 57.3409, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7640 }, { "epoch": 0.7049705916272633, "grad_norm": 3.052693989128505, "learning_rate": 2.6778303690503563e-07, "loss": 0.9629, "step": 7641 }, { "epoch": 0.7050628531887903, "grad_norm": 2.1094978721207385, "learning_rate": 2.6762866597923827e-07, "loss": 0.5824, "step": 7642 }, { "epoch": 0.7051551147503171, "grad_norm": 1.7820599826722467, "learning_rate": 2.6747432743899343e-07, "loss": 0.6557, "step": 7643 }, { "epoch": 0.7052473763118441, "grad_norm": 2.808461492385915, "learning_rate": 2.6732002129828775e-07, "loss": 0.8418, "step": 7644 }, { "epoch": 0.7053396378733711, "grad_norm": 2.6886808683735386, "learning_rate": 2.671657475711047e-07, "loss": 0.8088, "step": 7645 }, { "epoch": 0.7053396378733711, "eval_GEN Loss": 0.43863752484321594, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3300844728946686, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7906249761581421, "eval_runtime": 57.4585, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 7645 }, { "epoch": 0.7054318994348979, "grad_norm": 2.671200210501914, "learning_rate": 2.670115062714252e-07, "loss": 0.6359, "step": 7646 }, { "epoch": 0.7055241609964249, "grad_norm": 1.7919169994237847, "learning_rate": 2.668572974132262e-07, "loss": 0.6251, "step": 7647 }, { "epoch": 0.7056164225579518, "grad_norm": 2.2654662669760834, "learning_rate": 2.6670312101048263e-07, "loss": 0.6408, "step": 7648 }, { "epoch": 0.7057086841194787, "grad_norm": 2.054874163408238, "learning_rate": 2.665489770771662e-07, "loss": 0.5467, "step": 7649 }, { "epoch": 0.7058009456810056, "grad_norm": 1.5930954027840778, "learning_rate": 2.663948656272459e-07, "loss": 0.588, "step": 7650 }, { "epoch": 0.7058009456810056, "eval_GEN Loss": 0.43846824765205383, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3306979537010193, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7886418104171753, "eval_runtime": 57.0274, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7650 }, { "epoch": 0.7058932072425326, "grad_norm": 2.28692526583499, "learning_rate": 2.662407866746871e-07, "loss": 0.7609, "step": 7651 }, { "epoch": 0.7059854688040595, "grad_norm": 1.8392944507234301, "learning_rate": 2.660867402334529e-07, "loss": 0.5851, "step": 7652 }, { "epoch": 0.7060777303655864, "grad_norm": 1.0755958218023864, "learning_rate": 2.659327263175035e-07, "loss": 0.4584, "step": 7653 }, { "epoch": 0.7061699919271134, "grad_norm": 1.3875632091274972, "learning_rate": 2.657787449407954e-07, "loss": 0.6108, "step": 7654 }, { "epoch": 0.7062622534886402, "grad_norm": 2.4481408504733118, "learning_rate": 2.6562479611728283e-07, "loss": 0.7706, "step": 7655 }, { "epoch": 0.7062622534886402, "eval_GEN Loss": 0.4383276700973511, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32851049304008484, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7892728447914124, "eval_runtime": 57.2592, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7655 }, { "epoch": 0.7063545150501672, "grad_norm": 1.8632456519233045, "learning_rate": 2.6547087986091684e-07, "loss": 0.5081, "step": 7656 }, { "epoch": 0.7064467766116942, "grad_norm": 2.0836362316296557, "learning_rate": 2.6531699618564596e-07, "loss": 0.739, "step": 7657 }, { "epoch": 0.7065390381732211, "grad_norm": 2.453835486240904, "learning_rate": 2.651631451054145e-07, "loss": 0.685, "step": 7658 }, { "epoch": 0.706631299734748, "grad_norm": 1.2770730440921414, "learning_rate": 2.6500932663416574e-07, "loss": 0.5475, "step": 7659 }, { "epoch": 0.7067235612962749, "grad_norm": 3.2038004858620335, "learning_rate": 2.648555407858382e-07, "loss": 0.7999, "step": 7660 }, { "epoch": 0.7067235612962749, "eval_GEN Loss": 0.43880680203437805, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3247685730457306, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7881009578704834, "eval_runtime": 57.0842, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7660 }, { "epoch": 0.7068158228578019, "grad_norm": 2.3056586302996296, "learning_rate": 2.647017875743686e-07, "loss": 0.9609, "step": 7661 }, { "epoch": 0.7069080844193288, "grad_norm": 1.568166473512872, "learning_rate": 2.6454806701368996e-07, "loss": 0.6396, "step": 7662 }, { "epoch": 0.7070003459808557, "grad_norm": 1.9375625564601933, "learning_rate": 2.643943791177328e-07, "loss": 0.6977, "step": 7663 }, { "epoch": 0.7070926075423827, "grad_norm": 2.3618104412057126, "learning_rate": 2.6424072390042484e-07, "loss": 0.7217, "step": 7664 }, { "epoch": 0.7071848691039095, "grad_norm": 1.623785673185428, "learning_rate": 2.6408710137568987e-07, "loss": 0.5561, "step": 7665 }, { "epoch": 0.7071848691039095, "eval_GEN Loss": 0.43854737281799316, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3225677013397217, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7831130027770996, "eval_runtime": 57.1808, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7665 }, { "epoch": 0.7072771306654365, "grad_norm": 2.3225996377439646, "learning_rate": 2.639335115574504e-07, "loss": 0.6407, "step": 7666 }, { "epoch": 0.7073693922269635, "grad_norm": 2.233946781971763, "learning_rate": 2.637799544596241e-07, "loss": 0.7229, "step": 7667 }, { "epoch": 0.7074616537884904, "grad_norm": 4.184322085315114, "learning_rate": 2.6362643009612713e-07, "loss": 0.6988, "step": 7668 }, { "epoch": 0.7075539153500173, "grad_norm": 1.4734835240368584, "learning_rate": 2.6347293848087154e-07, "loss": 0.6251, "step": 7669 }, { "epoch": 0.7076461769115442, "grad_norm": 1.556672804355415, "learning_rate": 2.6331947962776764e-07, "loss": 0.626, "step": 7670 }, { "epoch": 0.7076461769115442, "eval_GEN Loss": 0.4378474950790405, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3209223747253418, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7851262092590332, "eval_runtime": 57.0277, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7670 }, { "epoch": 0.7077384384730712, "grad_norm": 2.5567035191841536, "learning_rate": 2.6316605355072163e-07, "loss": 0.6368, "step": 7671 }, { "epoch": 0.7078307000345981, "grad_norm": 2.345774127686596, "learning_rate": 2.630126602636373e-07, "loss": 0.5642, "step": 7672 }, { "epoch": 0.707922961596125, "grad_norm": 1.5861353748932685, "learning_rate": 2.628592997804156e-07, "loss": 0.531, "step": 7673 }, { "epoch": 0.708015223157652, "grad_norm": 1.973410774027925, "learning_rate": 2.627059721149543e-07, "loss": 0.6467, "step": 7674 }, { "epoch": 0.7081074847191788, "grad_norm": 2.229006383133802, "learning_rate": 2.6255267728114787e-07, "loss": 0.6963, "step": 7675 }, { "epoch": 0.7081074847191788, "eval_GEN Loss": 0.43795859813690186, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32571059465408325, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7873197197914124, "eval_runtime": 57.4091, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 7675 }, { "epoch": 0.7081997462807058, "grad_norm": 2.2870942568266606, "learning_rate": 2.6239941529288834e-07, "loss": 0.659, "step": 7676 }, { "epoch": 0.7082920078422328, "grad_norm": 1.8264698204851915, "learning_rate": 2.6224618616406477e-07, "loss": 0.5788, "step": 7677 }, { "epoch": 0.7083842694037596, "grad_norm": 2.334747800582495, "learning_rate": 2.620929899085625e-07, "loss": 0.7062, "step": 7678 }, { "epoch": 0.7084765309652866, "grad_norm": 1.5651101360070245, "learning_rate": 2.61939826540265e-07, "loss": 0.4864, "step": 7679 }, { "epoch": 0.7085687925268135, "grad_norm": 2.087139697445044, "learning_rate": 2.617866960730514e-07, "loss": 0.7151, "step": 7680 }, { "epoch": 0.7085687925268135, "eval_GEN Loss": 0.43815454840660095, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32705795764923096, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7898737788200378, "eval_runtime": 56.9908, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 7680 }, { "epoch": 0.7086610540883405, "grad_norm": 2.5196367445692434, "learning_rate": 2.616335985207996e-07, "loss": 0.5302, "step": 7681 }, { "epoch": 0.7087533156498673, "grad_norm": 2.1198117690233076, "learning_rate": 2.6148053389738277e-07, "loss": 0.8295, "step": 7682 }, { "epoch": 0.7088455772113943, "grad_norm": 1.560360908170319, "learning_rate": 2.6132750221667216e-07, "loss": 0.6801, "step": 7683 }, { "epoch": 0.7089378387729213, "grad_norm": 2.191405087362877, "learning_rate": 2.611745034925358e-07, "loss": 0.7605, "step": 7684 }, { "epoch": 0.7090301003344481, "grad_norm": 1.9862913241623572, "learning_rate": 2.6102153773883874e-07, "loss": 0.6651, "step": 7685 }, { "epoch": 0.7090301003344481, "eval_GEN Loss": 0.4378926753997803, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.328876256942749, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7893028855323792, "eval_runtime": 57.4602, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 7685 }, { "epoch": 0.7091223618959751, "grad_norm": 2.1161004941642805, "learning_rate": 2.608686049694426e-07, "loss": 0.6753, "step": 7686 }, { "epoch": 0.709214623457502, "grad_norm": 1.407803856266062, "learning_rate": 2.607157051982067e-07, "loss": 0.4634, "step": 7687 }, { "epoch": 0.7093068850190289, "grad_norm": 2.3318214326286086, "learning_rate": 2.6056283843898724e-07, "loss": 0.7938, "step": 7688 }, { "epoch": 0.7093991465805559, "grad_norm": 1.8190259111534135, "learning_rate": 2.604100047056367e-07, "loss": 0.6519, "step": 7689 }, { "epoch": 0.7094914081420828, "grad_norm": 2.2911158778468015, "learning_rate": 2.602572040120054e-07, "loss": 0.5871, "step": 7690 }, { "epoch": 0.7094914081420828, "eval_GEN Loss": 0.43883150815963745, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3294527232646942, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7931190133094788, "eval_runtime": 57.2172, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7690 }, { "epoch": 0.7095836697036098, "grad_norm": 1.7935010515490084, "learning_rate": 2.6010443637194043e-07, "loss": 0.7216, "step": 7691 }, { "epoch": 0.7096759312651366, "grad_norm": 1.5514338806301957, "learning_rate": 2.59951701799286e-07, "loss": 0.6296, "step": 7692 }, { "epoch": 0.7097681928266636, "grad_norm": 2.73954143824952, "learning_rate": 2.597990003078827e-07, "loss": 0.6763, "step": 7693 }, { "epoch": 0.7098604543881906, "grad_norm": 2.758670976682627, "learning_rate": 2.5964633191156887e-07, "loss": 0.6935, "step": 7694 }, { "epoch": 0.7099527159497174, "grad_norm": 1.5132233161076871, "learning_rate": 2.594936966241795e-07, "loss": 0.588, "step": 7695 }, { "epoch": 0.7099527159497174, "eval_GEN Loss": 0.4384821653366089, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.332141250371933, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.796604573726654, "eval_runtime": 57.0889, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7695 }, { "epoch": 0.7100449775112444, "grad_norm": 1.9379255371834925, "learning_rate": 2.593410944595468e-07, "loss": 0.5994, "step": 7696 }, { "epoch": 0.7101372390727713, "grad_norm": 1.9824026120672475, "learning_rate": 2.591885254314996e-07, "loss": 0.7649, "step": 7697 }, { "epoch": 0.7102295006342982, "grad_norm": 2.0800244671605266, "learning_rate": 2.590359895538639e-07, "loss": 0.7161, "step": 7698 }, { "epoch": 0.7103217621958252, "grad_norm": 1.6174779162108819, "learning_rate": 2.5888348684046314e-07, "loss": 0.4881, "step": 7699 }, { "epoch": 0.7104140237573521, "grad_norm": 1.8856667399242664, "learning_rate": 2.5873101730511686e-07, "loss": 0.6223, "step": 7700 }, { "epoch": 0.7104140237573521, "eval_GEN Loss": 0.43783777952194214, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33433765172958374, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7971754670143127, "eval_runtime": 57.4531, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 7700 }, { "epoch": 0.710506285318879, "grad_norm": 1.870491136335149, "learning_rate": 2.585785809616423e-07, "loss": 0.6581, "step": 7701 }, { "epoch": 0.7105985468804059, "grad_norm": 1.9702321506657552, "learning_rate": 2.5842617782385343e-07, "loss": 0.6468, "step": 7702 }, { "epoch": 0.7106908084419329, "grad_norm": 2.235456748675317, "learning_rate": 2.582738079055616e-07, "loss": 0.4702, "step": 7703 }, { "epoch": 0.7107830700034599, "grad_norm": 2.048303773429522, "learning_rate": 2.581214712205741e-07, "loss": 0.6442, "step": 7704 }, { "epoch": 0.7108753315649867, "grad_norm": 1.8243672290819863, "learning_rate": 2.5796916778269674e-07, "loss": 0.6886, "step": 7705 }, { "epoch": 0.7108753315649867, "eval_GEN Loss": 0.43775948882102966, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3381432592868805, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7991586327552795, "eval_runtime": 56.9484, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 7705 }, { "epoch": 0.7109675931265137, "grad_norm": 2.0096379065353207, "learning_rate": 2.57816897605731e-07, "loss": 0.7082, "step": 7706 }, { "epoch": 0.7110598546880406, "grad_norm": 1.3725377611681975, "learning_rate": 2.5766466070347607e-07, "loss": 0.4893, "step": 7707 }, { "epoch": 0.7111521162495675, "grad_norm": 2.089105171630828, "learning_rate": 2.5751245708972763e-07, "loss": 0.6253, "step": 7708 }, { "epoch": 0.7112443778110945, "grad_norm": 1.9096073730776806, "learning_rate": 2.5736028677827876e-07, "loss": 0.6723, "step": 7709 }, { "epoch": 0.7113366393726214, "grad_norm": 1.9920396324233414, "learning_rate": 2.572081497829193e-07, "loss": 0.7195, "step": 7710 }, { "epoch": 0.7113366393726214, "eval_GEN Loss": 0.43782028555870056, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33729809522628784, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7992788553237915, "eval_runtime": 57.2661, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7710 }, { "epoch": 0.7114289009341483, "grad_norm": 1.1451729253943397, "learning_rate": 2.570560461174365e-07, "loss": 0.5198, "step": 7711 }, { "epoch": 0.7115211624956752, "grad_norm": 1.7287979526407544, "learning_rate": 2.569039757956137e-07, "loss": 0.539, "step": 7712 }, { "epoch": 0.7116134240572022, "grad_norm": 2.1473940261195925, "learning_rate": 2.56751938831232e-07, "loss": 0.6401, "step": 7713 }, { "epoch": 0.711705685618729, "grad_norm": 2.234538523178221, "learning_rate": 2.565999352380695e-07, "loss": 0.5619, "step": 7714 }, { "epoch": 0.711797947180256, "grad_norm": 2.14059793369232, "learning_rate": 2.564479650299003e-07, "loss": 0.6565, "step": 7715 }, { "epoch": 0.711797947180256, "eval_GEN Loss": 0.4383207857608795, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.335584819316864, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.802463948726654, "eval_runtime": 57.0613, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7715 }, { "epoch": 0.711890208741783, "grad_norm": 2.3805927539035374, "learning_rate": 2.56296028220497e-07, "loss": 0.6179, "step": 7716 }, { "epoch": 0.7119824703033099, "grad_norm": 2.0479791891348436, "learning_rate": 2.561441248236278e-07, "loss": 0.7813, "step": 7717 }, { "epoch": 0.7120747318648368, "grad_norm": 1.9342675351927023, "learning_rate": 2.559922548530588e-07, "loss": 0.8508, "step": 7718 }, { "epoch": 0.7121669934263637, "grad_norm": 1.63720004262603, "learning_rate": 2.558404183225521e-07, "loss": 0.7074, "step": 7719 }, { "epoch": 0.7122592549878907, "grad_norm": 1.6881556992083488, "learning_rate": 2.5568861524586813e-07, "loss": 0.6656, "step": 7720 }, { "epoch": 0.7122592549878907, "eval_GEN Loss": 0.43820875883102417, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33597877621650696, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.802734375, "eval_runtime": 57.1647, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7720 }, { "epoch": 0.7123515165494176, "grad_norm": 1.4144577680098624, "learning_rate": 2.5553684563676296e-07, "loss": 0.5569, "step": 7721 }, { "epoch": 0.7124437781109445, "grad_norm": 1.8071781096082762, "learning_rate": 2.5538510950899036e-07, "loss": 0.6101, "step": 7722 }, { "epoch": 0.7125360396724715, "grad_norm": 1.7671767106681495, "learning_rate": 2.552334068763011e-07, "loss": 0.7052, "step": 7723 }, { "epoch": 0.7126283012339983, "grad_norm": 2.1831972318939683, "learning_rate": 2.5508173775244243e-07, "loss": 0.5429, "step": 7724 }, { "epoch": 0.7127205627955253, "grad_norm": 2.0534232930040948, "learning_rate": 2.549301021511591e-07, "loss": 0.6793, "step": 7725 }, { "epoch": 0.7127205627955253, "eval_GEN Loss": 0.4381026029586792, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3339330554008484, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7981970906257629, "eval_runtime": 56.911, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 7725 }, { "epoch": 0.7128128243570523, "grad_norm": 2.1152494515777014, "learning_rate": 2.547785000861919e-07, "loss": 0.627, "step": 7726 }, { "epoch": 0.7129050859185792, "grad_norm": 1.9916030612204962, "learning_rate": 2.5462693157128035e-07, "loss": 0.572, "step": 7727 }, { "epoch": 0.7129973474801061, "grad_norm": 2.153505178577791, "learning_rate": 2.5447539662015895e-07, "loss": 0.6056, "step": 7728 }, { "epoch": 0.713089609041633, "grad_norm": 1.2941198916607495, "learning_rate": 2.543238952465603e-07, "loss": 0.487, "step": 7729 }, { "epoch": 0.71318187060316, "grad_norm": 1.9362086024325529, "learning_rate": 2.5417242746421373e-07, "loss": 0.7585, "step": 7730 }, { "epoch": 0.71318187060316, "eval_GEN Loss": 0.4379020929336548, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33194124698638916, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8027644157409668, "eval_runtime": 57.1541, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7730 }, { "epoch": 0.7132741321646869, "grad_norm": 1.9954539689064301, "learning_rate": 2.5402099328684564e-07, "loss": 0.6397, "step": 7731 }, { "epoch": 0.7133663937262138, "grad_norm": 2.4410423566024986, "learning_rate": 2.5386959272817896e-07, "loss": 0.5191, "step": 7732 }, { "epoch": 0.7134586552877408, "grad_norm": 1.634806011530162, "learning_rate": 2.5371822580193383e-07, "loss": 0.5536, "step": 7733 }, { "epoch": 0.7135509168492676, "grad_norm": 1.5654880403449287, "learning_rate": 2.535668925218278e-07, "loss": 0.5604, "step": 7734 }, { "epoch": 0.7136431784107946, "grad_norm": 2.0451906850196813, "learning_rate": 2.5341559290157435e-07, "loss": 0.5649, "step": 7735 }, { "epoch": 0.7136431784107946, "eval_GEN Loss": 0.43708646297454834, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3263174593448639, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8024038672447205, "eval_runtime": 57.3441, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7735 }, { "epoch": 0.7137354399723216, "grad_norm": 2.116314987711105, "learning_rate": 2.5326432695488497e-07, "loss": 0.5808, "step": 7736 }, { "epoch": 0.7138277015338484, "grad_norm": 1.6626013231344658, "learning_rate": 2.53113094695467e-07, "loss": 0.5938, "step": 7737 }, { "epoch": 0.7139199630953754, "grad_norm": 1.6979724244386158, "learning_rate": 2.5296189613702617e-07, "loss": 0.5332, "step": 7738 }, { "epoch": 0.7140122246569023, "grad_norm": 2.382093274377307, "learning_rate": 2.5281073129326367e-07, "loss": 0.7697, "step": 7739 }, { "epoch": 0.7141044862184293, "grad_norm": 2.1018475393859886, "learning_rate": 2.526596001778785e-07, "loss": 0.6022, "step": 7740 }, { "epoch": 0.7141044862184293, "eval_GEN Loss": 0.4370022416114807, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32270291447639465, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8082932829856873, "eval_runtime": 57.3437, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7740 }, { "epoch": 0.7141967477799561, "grad_norm": 2.3970430559001543, "learning_rate": 2.525085028045665e-07, "loss": 0.5206, "step": 7741 }, { "epoch": 0.7142890093414831, "grad_norm": 2.4845952831392837, "learning_rate": 2.523574391870205e-07, "loss": 0.7819, "step": 7742 }, { "epoch": 0.7143812709030101, "grad_norm": 2.191821097868958, "learning_rate": 2.5220640933892965e-07, "loss": 0.5401, "step": 7743 }, { "epoch": 0.7144735324645369, "grad_norm": 2.996222587244158, "learning_rate": 2.520554132739809e-07, "loss": 0.6027, "step": 7744 }, { "epoch": 0.7145657940260639, "grad_norm": 1.797156515929991, "learning_rate": 2.5190445100585747e-07, "loss": 0.6365, "step": 7745 }, { "epoch": 0.7145657940260639, "eval_GEN Loss": 0.4368453621864319, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3202647864818573, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8084434866905212, "eval_runtime": 57.0355, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7745 }, { "epoch": 0.7146580555875908, "grad_norm": 1.690268554112659, "learning_rate": 2.5175352254824025e-07, "loss": 0.6348, "step": 7746 }, { "epoch": 0.7147503171491177, "grad_norm": 2.6202613384006366, "learning_rate": 2.5160262791480607e-07, "loss": 0.6757, "step": 7747 }, { "epoch": 0.7148425787106447, "grad_norm": 2.15474156839459, "learning_rate": 2.5145176711922947e-07, "loss": 0.8199, "step": 7748 }, { "epoch": 0.7149348402721716, "grad_norm": 1.7713000465710564, "learning_rate": 2.51300940175182e-07, "loss": 0.7448, "step": 7749 }, { "epoch": 0.7150271018336986, "grad_norm": 2.021771261105806, "learning_rate": 2.511501470963312e-07, "loss": 0.796, "step": 7750 }, { "epoch": 0.7150271018336986, "eval_GEN Loss": 0.43739640712738037, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32175642251968384, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8076021671295166, "eval_runtime": 57.3483, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7750 }, { "epoch": 0.7151193633952254, "grad_norm": 2.1305897036172827, "learning_rate": 2.5099938789634256e-07, "loss": 0.5478, "step": 7751 }, { "epoch": 0.7152116249567524, "grad_norm": 1.3314811062776046, "learning_rate": 2.5084866258887813e-07, "loss": 0.5662, "step": 7752 }, { "epoch": 0.7153038865182794, "grad_norm": 2.4586795456734145, "learning_rate": 2.50697971187597e-07, "loss": 0.6182, "step": 7753 }, { "epoch": 0.7153961480798062, "grad_norm": 2.357497875311818, "learning_rate": 2.505473137061544e-07, "loss": 0.7136, "step": 7754 }, { "epoch": 0.7154884096413332, "grad_norm": 1.7294087289956972, "learning_rate": 2.503966901582042e-07, "loss": 0.5154, "step": 7755 }, { "epoch": 0.7154884096413332, "eval_GEN Loss": 0.43746209144592285, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3271979093551636, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8063101172447205, "eval_runtime": 57.1968, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7755 }, { "epoch": 0.7155806712028601, "grad_norm": 1.8117224083770864, "learning_rate": 2.502461005573952e-07, "loss": 0.6023, "step": 7756 }, { "epoch": 0.715672932764387, "grad_norm": 2.7811745959109975, "learning_rate": 2.500955449173748e-07, "loss": 0.8785, "step": 7757 }, { "epoch": 0.715765194325914, "grad_norm": 2.6319681255062144, "learning_rate": 2.499450232517859e-07, "loss": 0.7061, "step": 7758 }, { "epoch": 0.7158574558874409, "grad_norm": 2.574244108511848, "learning_rate": 2.4979453557426933e-07, "loss": 0.6282, "step": 7759 }, { "epoch": 0.7159497174489678, "grad_norm": 3.4478183074282103, "learning_rate": 2.496440818984628e-07, "loss": 0.5444, "step": 7760 }, { "epoch": 0.7159497174489678, "eval_GEN Loss": 0.437517374753952, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3261704742908478, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8021033406257629, "eval_runtime": 57.1661, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7760 }, { "epoch": 0.7160419790104947, "grad_norm": 1.4996502132158438, "learning_rate": 2.4949366223799994e-07, "loss": 0.7463, "step": 7761 }, { "epoch": 0.7161342405720217, "grad_norm": 2.2139861777782737, "learning_rate": 2.493432766065129e-07, "loss": 0.6976, "step": 7762 }, { "epoch": 0.7162265021335487, "grad_norm": 1.9265652078120739, "learning_rate": 2.491929250176292e-07, "loss": 0.5629, "step": 7763 }, { "epoch": 0.7163187636950755, "grad_norm": 1.7978156335900923, "learning_rate": 2.4904260748497437e-07, "loss": 0.5643, "step": 7764 }, { "epoch": 0.7164110252566025, "grad_norm": 2.314205793211768, "learning_rate": 2.4889232402216983e-07, "loss": 0.6012, "step": 7765 }, { "epoch": 0.7164110252566025, "eval_GEN Loss": 0.4376749098300934, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3288351893424988, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8020432591438293, "eval_runtime": 57.2013, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7765 }, { "epoch": 0.7165032868181294, "grad_norm": 1.690397386110926, "learning_rate": 2.487420746428353e-07, "loss": 0.8092, "step": 7766 }, { "epoch": 0.7165955483796563, "grad_norm": 3.4185271906957633, "learning_rate": 2.48591859360586e-07, "loss": 0.8335, "step": 7767 }, { "epoch": 0.7166878099411833, "grad_norm": 2.1659031671199673, "learning_rate": 2.48441678189035e-07, "loss": 0.6204, "step": 7768 }, { "epoch": 0.7167800715027102, "grad_norm": 2.055829925764934, "learning_rate": 2.4829153114179173e-07, "loss": 0.9019, "step": 7769 }, { "epoch": 0.7168723330642371, "grad_norm": 1.3993010803202712, "learning_rate": 2.4814141823246285e-07, "loss": 0.6628, "step": 7770 }, { "epoch": 0.7168723330642371, "eval_GEN Loss": 0.4376712739467621, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32946258783340454, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8010817170143127, "eval_runtime": 57.1296, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7770 }, { "epoch": 0.716964594625764, "grad_norm": 1.577083638572686, "learning_rate": 2.47991339474652e-07, "loss": 0.5288, "step": 7771 }, { "epoch": 0.717056856187291, "grad_norm": 1.5499482831521556, "learning_rate": 2.47841294881959e-07, "loss": 0.6405, "step": 7772 }, { "epoch": 0.7171491177488178, "grad_norm": 1.7969134624785708, "learning_rate": 2.476912844679819e-07, "loss": 0.667, "step": 7773 }, { "epoch": 0.7172413793103448, "grad_norm": 3.7472719080359775, "learning_rate": 2.4754130824631436e-07, "loss": 0.8641, "step": 7774 }, { "epoch": 0.7173336408718718, "grad_norm": 1.7128480082317357, "learning_rate": 2.4739136623054773e-07, "loss": 0.6518, "step": 7775 }, { "epoch": 0.7173336408718718, "eval_GEN Loss": 0.43761587142944336, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32855305075645447, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7987380027770996, "eval_runtime": 57.2388, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7775 }, { "epoch": 0.7174259024333987, "grad_norm": 1.6132366770739184, "learning_rate": 2.4724145843426943e-07, "loss": 0.582, "step": 7776 }, { "epoch": 0.7175181639949256, "grad_norm": 2.396797864464258, "learning_rate": 2.470915848710653e-07, "loss": 0.5959, "step": 7777 }, { "epoch": 0.7176104255564525, "grad_norm": 1.964194416494418, "learning_rate": 2.4694174555451625e-07, "loss": 0.5564, "step": 7778 }, { "epoch": 0.7177026871179795, "grad_norm": 2.5421870933799644, "learning_rate": 2.467919404982013e-07, "loss": 0.6939, "step": 7779 }, { "epoch": 0.7177949486795064, "grad_norm": 1.7038951111608933, "learning_rate": 2.466421697156963e-07, "loss": 0.5537, "step": 7780 }, { "epoch": 0.7177949486795064, "eval_GEN Loss": 0.4374338686466217, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32918065786361694, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7962139248847961, "eval_runtime": 57.0135, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7780 }, { "epoch": 0.7178872102410333, "grad_norm": 2.140349465217066, "learning_rate": 2.4649243322057317e-07, "loss": 0.7058, "step": 7781 }, { "epoch": 0.7179794718025603, "grad_norm": 1.9497484163427357, "learning_rate": 2.4634273102640146e-07, "loss": 0.5791, "step": 7782 }, { "epoch": 0.7180717333640871, "grad_norm": 1.5985960439514801, "learning_rate": 2.4619306314674756e-07, "loss": 0.5364, "step": 7783 }, { "epoch": 0.7181639949256141, "grad_norm": 2.1428340819044753, "learning_rate": 2.460434295951747e-07, "loss": 0.6931, "step": 7784 }, { "epoch": 0.7182562564871411, "grad_norm": 1.5574534928611243, "learning_rate": 2.4589383038524256e-07, "loss": 0.6128, "step": 7785 }, { "epoch": 0.7182562564871411, "eval_GEN Loss": 0.43879592418670654, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32590150833129883, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7963641881942749, "eval_runtime": 57.1677, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7785 }, { "epoch": 0.718348518048668, "grad_norm": 1.8215332232507295, "learning_rate": 2.457442655305082e-07, "loss": 0.6924, "step": 7786 }, { "epoch": 0.7184407796101949, "grad_norm": 3.0113510439204387, "learning_rate": 2.4559473504452544e-07, "loss": 0.7204, "step": 7787 }, { "epoch": 0.7185330411717218, "grad_norm": 1.5117274024599168, "learning_rate": 2.4544523894084524e-07, "loss": 0.6191, "step": 7788 }, { "epoch": 0.7186253027332488, "grad_norm": 1.8680624846897973, "learning_rate": 2.452957772330147e-07, "loss": 0.5921, "step": 7789 }, { "epoch": 0.7187175642947757, "grad_norm": 2.308298603265699, "learning_rate": 2.4514634993457845e-07, "loss": 0.6172, "step": 7790 }, { "epoch": 0.7187175642947757, "eval_GEN Loss": 0.43740183115005493, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32071515917778015, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.79296875, "eval_runtime": 57.3061, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7790 }, { "epoch": 0.7188098258563026, "grad_norm": 1.8533952796826174, "learning_rate": 2.4499695705907786e-07, "loss": 0.6555, "step": 7791 }, { "epoch": 0.7189020874178296, "grad_norm": 2.899782548753045, "learning_rate": 2.4484759862005146e-07, "loss": 0.8563, "step": 7792 }, { "epoch": 0.7189943489793564, "grad_norm": 1.6859376497995313, "learning_rate": 2.446982746310338e-07, "loss": 0.5065, "step": 7793 }, { "epoch": 0.7190866105408834, "grad_norm": 1.8017383872800925, "learning_rate": 2.44548985105557e-07, "loss": 0.6328, "step": 7794 }, { "epoch": 0.7191788721024104, "grad_norm": 1.5656716537536342, "learning_rate": 2.4439973005715034e-07, "loss": 0.563, "step": 7795 }, { "epoch": 0.7191788721024104, "eval_GEN Loss": 0.4376770853996277, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3178326487541199, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7947115302085876, "eval_runtime": 57.2306, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7795 }, { "epoch": 0.7192711336639372, "grad_norm": 1.7110800889203437, "learning_rate": 2.442505094993389e-07, "loss": 0.6575, "step": 7796 }, { "epoch": 0.7193633952254642, "grad_norm": 1.9129948709403208, "learning_rate": 2.441013234456457e-07, "loss": 0.5196, "step": 7797 }, { "epoch": 0.7194556567869911, "grad_norm": 1.4624215556913518, "learning_rate": 2.4395217190959003e-07, "loss": 0.3296, "step": 7798 }, { "epoch": 0.7195479183485181, "grad_norm": 2.36429651850057, "learning_rate": 2.438030549046886e-07, "loss": 0.7013, "step": 7799 }, { "epoch": 0.719640179910045, "grad_norm": 1.629943728352188, "learning_rate": 2.4365397244445407e-07, "loss": 0.5773, "step": 7800 }, { "epoch": 0.719640179910045, "eval_GEN Loss": 0.43740856647491455, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3175562620162964, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7977464199066162, "eval_runtime": 57.1627, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7800 }, { "epoch": 0.7197324414715719, "grad_norm": 1.958798091277567, "learning_rate": 2.4350492454239686e-07, "loss": 0.7097, "step": 7801 }, { "epoch": 0.7198247030330989, "grad_norm": 2.6646590140577406, "learning_rate": 2.433559112120238e-07, "loss": 0.7839, "step": 7802 }, { "epoch": 0.7199169645946257, "grad_norm": 2.5674117445484335, "learning_rate": 2.432069324668391e-07, "loss": 0.8423, "step": 7803 }, { "epoch": 0.7200092261561527, "grad_norm": 3.2634947035335844, "learning_rate": 2.430579883203428e-07, "loss": 0.7508, "step": 7804 }, { "epoch": 0.7201014877176796, "grad_norm": 3.1155253241452026, "learning_rate": 2.4290907878603285e-07, "loss": 0.7446, "step": 7805 }, { "epoch": 0.7201014877176796, "eval_GEN Loss": 0.4376136362552643, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3184812068939209, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7963942289352417, "eval_runtime": 57.2644, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7805 }, { "epoch": 0.7201937492792065, "grad_norm": 1.3883785195796086, "learning_rate": 2.4276020387740377e-07, "loss": 0.5595, "step": 7806 }, { "epoch": 0.7202860108407335, "grad_norm": 3.101362262763052, "learning_rate": 2.4261136360794656e-07, "loss": 0.7846, "step": 7807 }, { "epoch": 0.7203782724022604, "grad_norm": 2.535071713102246, "learning_rate": 2.424625579911494e-07, "loss": 0.6802, "step": 7808 }, { "epoch": 0.7204705339637874, "grad_norm": 2.063603989311089, "learning_rate": 2.4231378704049736e-07, "loss": 0.6229, "step": 7809 }, { "epoch": 0.7205627955253142, "grad_norm": 1.6142890198132345, "learning_rate": 2.4216505076947246e-07, "loss": 0.6661, "step": 7810 }, { "epoch": 0.7205627955253142, "eval_GEN Loss": 0.43712830543518066, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3228866755962372, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7954927682876587, "eval_runtime": 57.2127, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7810 }, { "epoch": 0.7206550570868412, "grad_norm": 3.675453802168607, "learning_rate": 2.420163491915529e-07, "loss": 0.6634, "step": 7811 }, { "epoch": 0.7207473186483682, "grad_norm": 2.4228618758737226, "learning_rate": 2.4186768232021497e-07, "loss": 0.7033, "step": 7812 }, { "epoch": 0.720839580209895, "grad_norm": 1.9801546254367008, "learning_rate": 2.417190501689306e-07, "loss": 0.6351, "step": 7813 }, { "epoch": 0.720931841771422, "grad_norm": 3.1258273061704527, "learning_rate": 2.415704527511693e-07, "loss": 0.6364, "step": 7814 }, { "epoch": 0.7210241033329489, "grad_norm": 3.244345611091845, "learning_rate": 2.4142189008039695e-07, "loss": 0.8941, "step": 7815 }, { "epoch": 0.7210241033329489, "eval_GEN Loss": 0.43811658024787903, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33160629868507385, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.7996394038200378, "eval_runtime": 57.364, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7815 }, { "epoch": 0.7211163648944758, "grad_norm": 1.7950696987016082, "learning_rate": 2.412733621700767e-07, "loss": 0.6361, "step": 7816 }, { "epoch": 0.7212086264560028, "grad_norm": 2.090828388261856, "learning_rate": 2.411248690336683e-07, "loss": 0.7585, "step": 7817 }, { "epoch": 0.7213008880175297, "grad_norm": 2.401857337999073, "learning_rate": 2.409764106846285e-07, "loss": 0.6344, "step": 7818 }, { "epoch": 0.7213931495790566, "grad_norm": 2.3841789440363663, "learning_rate": 2.408279871364111e-07, "loss": 0.7313, "step": 7819 }, { "epoch": 0.7214854111405835, "grad_norm": 2.3271127214155025, "learning_rate": 2.4067959840246594e-07, "loss": 0.8227, "step": 7820 }, { "epoch": 0.7214854111405835, "eval_GEN Loss": 0.43861937522888184, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.33730021119117737, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8033052682876587, "eval_runtime": 57.2793, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7820 }, { "epoch": 0.7215776727021105, "grad_norm": 1.5785679587853012, "learning_rate": 2.405312444962408e-07, "loss": 0.4835, "step": 7821 }, { "epoch": 0.7216699342636375, "grad_norm": 1.8932513028735107, "learning_rate": 2.403829254311789e-07, "loss": 0.6533, "step": 7822 }, { "epoch": 0.7217621958251643, "grad_norm": 1.9984465118762624, "learning_rate": 2.4023464122072215e-07, "loss": 0.711, "step": 7823 }, { "epoch": 0.7218544573866913, "grad_norm": 2.4285733870000157, "learning_rate": 2.4008639187830775e-07, "loss": 0.5703, "step": 7824 }, { "epoch": 0.7219467189482182, "grad_norm": 2.0059998393729757, "learning_rate": 2.399381774173704e-07, "loss": 0.7633, "step": 7825 }, { "epoch": 0.7219467189482182, "eval_GEN Loss": 0.4383153021335602, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3362383544445038, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.800510823726654, "eval_runtime": 56.9901, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 7825 }, { "epoch": 0.7220389805097451, "grad_norm": 1.998944884977911, "learning_rate": 2.397899978513412e-07, "loss": 0.7504, "step": 7826 }, { "epoch": 0.7221312420712721, "grad_norm": 1.7019848523343066, "learning_rate": 2.396418531936492e-07, "loss": 0.6694, "step": 7827 }, { "epoch": 0.722223503632799, "grad_norm": 2.027978522468343, "learning_rate": 2.3949374345771867e-07, "loss": 0.6586, "step": 7828 }, { "epoch": 0.7223157651943259, "grad_norm": 2.21544160492201, "learning_rate": 2.3934566865697203e-07, "loss": 0.5989, "step": 7829 }, { "epoch": 0.7224080267558528, "grad_norm": 2.013721309071023, "learning_rate": 2.3919762880482804e-07, "loss": 0.6408, "step": 7830 }, { "epoch": 0.7224080267558528, "eval_GEN Loss": 0.4379677474498749, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3338964879512787, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.802463948726654, "eval_runtime": 57.1137, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7830 }, { "epoch": 0.7225002883173798, "grad_norm": 2.818561085273852, "learning_rate": 2.3904962391470206e-07, "loss": 0.8818, "step": 7831 }, { "epoch": 0.7225925498789068, "grad_norm": 1.6641266063613558, "learning_rate": 2.3890165400000685e-07, "loss": 0.5388, "step": 7832 }, { "epoch": 0.7226848114404336, "grad_norm": 2.052279037071331, "learning_rate": 2.3875371907415105e-07, "loss": 0.6597, "step": 7833 }, { "epoch": 0.7227770730019606, "grad_norm": 1.4084856017894654, "learning_rate": 2.386058191505416e-07, "loss": 0.5814, "step": 7834 }, { "epoch": 0.7228693345634875, "grad_norm": 2.168255339815319, "learning_rate": 2.384579542425808e-07, "loss": 0.6132, "step": 7835 }, { "epoch": 0.7228693345634875, "eval_GEN Loss": 0.4382684528827667, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32752904295921326, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8008413314819336, "eval_runtime": 57.0252, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7835 }, { "epoch": 0.7229615961250144, "grad_norm": 1.5495384053713488, "learning_rate": 2.383101243636686e-07, "loss": 0.6008, "step": 7836 }, { "epoch": 0.7230538576865413, "grad_norm": 1.5333215763153376, "learning_rate": 2.3816232952720155e-07, "loss": 0.5376, "step": 7837 }, { "epoch": 0.7231461192480683, "grad_norm": 1.849977289903219, "learning_rate": 2.3801456974657333e-07, "loss": 0.5292, "step": 7838 }, { "epoch": 0.7232383808095952, "grad_norm": 1.272146629609333, "learning_rate": 2.3786684503517377e-07, "loss": 0.45, "step": 7839 }, { "epoch": 0.7233306423711221, "grad_norm": 2.2996086331324657, "learning_rate": 2.3771915540639004e-07, "loss": 0.5635, "step": 7840 }, { "epoch": 0.7233306423711221, "eval_GEN Loss": 0.4380802512168884, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.322937935590744, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8024939894676208, "eval_runtime": 57.1252, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7840 }, { "epoch": 0.7234229039326491, "grad_norm": 1.3764340102882446, "learning_rate": 2.3757150087360624e-07, "loss": 0.5288, "step": 7841 }, { "epoch": 0.7235151654941759, "grad_norm": 1.631670574485566, "learning_rate": 2.3742388145020266e-07, "loss": 0.5416, "step": 7842 }, { "epoch": 0.7236074270557029, "grad_norm": 2.0396449301264568, "learning_rate": 2.37276297149557e-07, "loss": 0.6469, "step": 7843 }, { "epoch": 0.7236996886172299, "grad_norm": 2.326643858307957, "learning_rate": 2.3712874798504356e-07, "loss": 0.6561, "step": 7844 }, { "epoch": 0.7237919501787567, "grad_norm": 2.2171201780490404, "learning_rate": 2.3698123397003372e-07, "loss": 0.6078, "step": 7845 }, { "epoch": 0.7237919501787567, "eval_GEN Loss": 0.4381980001926422, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3233911991119385, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8072716593742371, "eval_runtime": 57.2874, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7845 }, { "epoch": 0.7238842117402837, "grad_norm": 1.759138292198411, "learning_rate": 2.3683375511789494e-07, "loss": 0.5668, "step": 7846 }, { "epoch": 0.7239764733018106, "grad_norm": 1.6521050777069064, "learning_rate": 2.3668631144199232e-07, "loss": 0.6111, "step": 7847 }, { "epoch": 0.7240687348633376, "grad_norm": 2.1227329568794753, "learning_rate": 2.3653890295568736e-07, "loss": 0.4512, "step": 7848 }, { "epoch": 0.7241609964248645, "grad_norm": 2.0547489960075933, "learning_rate": 2.363915296723386e-07, "loss": 0.837, "step": 7849 }, { "epoch": 0.7242532579863914, "grad_norm": 2.15706904690181, "learning_rate": 2.3624419160530098e-07, "loss": 0.7889, "step": 7850 }, { "epoch": 0.7242532579863914, "eval_GEN Loss": 0.4382028877735138, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3253610134124756, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8104267120361328, "eval_runtime": 57.185, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7850 }, { "epoch": 0.7243455195479184, "grad_norm": 1.5751767421914469, "learning_rate": 2.3609688876792657e-07, "loss": 0.5596, "step": 7851 }, { "epoch": 0.7244377811094452, "grad_norm": 1.8937441603846947, "learning_rate": 2.359496211735645e-07, "loss": 0.7366, "step": 7852 }, { "epoch": 0.7245300426709722, "grad_norm": 1.4026969315433986, "learning_rate": 2.358023888355599e-07, "loss": 0.6111, "step": 7853 }, { "epoch": 0.7246223042324992, "grad_norm": 1.533610504466345, "learning_rate": 2.3565519176725545e-07, "loss": 0.5524, "step": 7854 }, { "epoch": 0.724714565794026, "grad_norm": 1.765534501247701, "learning_rate": 2.3550802998199036e-07, "loss": 0.567, "step": 7855 }, { "epoch": 0.724714565794026, "eval_GEN Loss": 0.4391516447067261, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32879018783569336, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8138822317123413, "eval_runtime": 57.0405, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7855 }, { "epoch": 0.724806827355553, "grad_norm": 2.3906642669974887, "learning_rate": 2.3536090349310084e-07, "loss": 0.747, "step": 7856 }, { "epoch": 0.7248990889170799, "grad_norm": 1.9091155248871776, "learning_rate": 2.3521381231391937e-07, "loss": 0.5408, "step": 7857 }, { "epoch": 0.7249913504786069, "grad_norm": 2.3402407359988375, "learning_rate": 2.350667564577757e-07, "loss": 0.81, "step": 7858 }, { "epoch": 0.7250836120401338, "grad_norm": 2.4876480650790085, "learning_rate": 2.3491973593799643e-07, "loss": 0.6959, "step": 7859 }, { "epoch": 0.7251758736016607, "grad_norm": 3.5781744310262775, "learning_rate": 2.3477275076790477e-07, "loss": 0.663, "step": 7860 }, { "epoch": 0.7251758736016607, "eval_GEN Loss": 0.43791428208351135, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32916125655174255, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8124399185180664, "eval_runtime": 57.2658, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7860 }, { "epoch": 0.7252681351631877, "grad_norm": 1.9440432464097173, "learning_rate": 2.346258009608203e-07, "loss": 0.6763, "step": 7861 }, { "epoch": 0.7253603967247145, "grad_norm": 1.6111408831114344, "learning_rate": 2.3447888653006067e-07, "loss": 0.605, "step": 7862 }, { "epoch": 0.7254526582862415, "grad_norm": 1.6231426303594592, "learning_rate": 2.3433200748893882e-07, "loss": 0.5967, "step": 7863 }, { "epoch": 0.7255449198477685, "grad_norm": 1.8799477955613646, "learning_rate": 2.341851638507655e-07, "loss": 0.5115, "step": 7864 }, { "epoch": 0.7256371814092953, "grad_norm": 2.128015210954018, "learning_rate": 2.340383556288476e-07, "loss": 0.6695, "step": 7865 }, { "epoch": 0.7256371814092953, "eval_GEN Loss": 0.43884578347206116, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.33447861671447754, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8198016881942749, "eval_runtime": 57.1842, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7865 }, { "epoch": 0.7257294429708223, "grad_norm": 1.8930517508531786, "learning_rate": 2.3389158283648933e-07, "loss": 0.6658, "step": 7866 }, { "epoch": 0.7258217045323492, "grad_norm": 2.7365094185712, "learning_rate": 2.3374484548699164e-07, "loss": 0.666, "step": 7867 }, { "epoch": 0.7259139660938762, "grad_norm": 2.552648748973824, "learning_rate": 2.3359814359365145e-07, "loss": 0.6417, "step": 7868 }, { "epoch": 0.726006227655403, "grad_norm": 2.893674948030201, "learning_rate": 2.33451477169764e-07, "loss": 0.809, "step": 7869 }, { "epoch": 0.72609848921693, "grad_norm": 1.796438287571219, "learning_rate": 2.3330484622861979e-07, "loss": 0.6265, "step": 7870 }, { "epoch": 0.72609848921693, "eval_GEN Loss": 0.4378489553928375, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3374446928501129, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8216646909713745, "eval_runtime": 57.204, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7870 }, { "epoch": 0.726190750778457, "grad_norm": 1.856822129003823, "learning_rate": 2.3315825078350715e-07, "loss": 0.684, "step": 7871 }, { "epoch": 0.7262830123399838, "grad_norm": 2.8014301799286687, "learning_rate": 2.330116908477102e-07, "loss": 0.812, "step": 7872 }, { "epoch": 0.7263752739015108, "grad_norm": 2.110884757357625, "learning_rate": 2.328651664345112e-07, "loss": 0.5113, "step": 7873 }, { "epoch": 0.7264675354630377, "grad_norm": 1.9597403654139829, "learning_rate": 2.327186775571879e-07, "loss": 0.6769, "step": 7874 }, { "epoch": 0.7265597970245646, "grad_norm": 2.4564673674090396, "learning_rate": 2.3257222422901544e-07, "loss": 0.7778, "step": 7875 }, { "epoch": 0.7265597970245646, "eval_GEN Loss": 0.4387342631816864, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3413580358028412, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8151742815971375, "eval_runtime": 57.3536, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7875 }, { "epoch": 0.7266520585860916, "grad_norm": 1.4398884778654524, "learning_rate": 2.3242580646326596e-07, "loss": 0.6496, "step": 7876 }, { "epoch": 0.7267443201476185, "grad_norm": 2.4662728193551873, "learning_rate": 2.3227942427320758e-07, "loss": 0.6793, "step": 7877 }, { "epoch": 0.7268365817091454, "grad_norm": 1.6410831585271053, "learning_rate": 2.3213307767210613e-07, "loss": 0.5302, "step": 7878 }, { "epoch": 0.7269288432706723, "grad_norm": 1.9992706295086222, "learning_rate": 2.3198676667322319e-07, "loss": 0.6335, "step": 7879 }, { "epoch": 0.7270211048321993, "grad_norm": 1.9370482110799545, "learning_rate": 2.3184049128981846e-07, "loss": 0.5378, "step": 7880 }, { "epoch": 0.7270211048321993, "eval_GEN Loss": 0.43872544169425964, "eval_GEN top-5 accuracy": 0.9850942569048663, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34563493728637695, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8196213841438293, "eval_runtime": 57.4099, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 7880 }, { "epoch": 0.7271133663937263, "grad_norm": 1.8486333693789636, "learning_rate": 2.3169425153514705e-07, "loss": 0.7393, "step": 7881 }, { "epoch": 0.7272056279552531, "grad_norm": 2.386887345593943, "learning_rate": 2.3154804742246156e-07, "loss": 0.8329, "step": 7882 }, { "epoch": 0.7272978895167801, "grad_norm": 2.189772673352762, "learning_rate": 2.3140187896501138e-07, "loss": 0.6204, "step": 7883 }, { "epoch": 0.727390151078307, "grad_norm": 2.5246779973619518, "learning_rate": 2.3125574617604272e-07, "loss": 0.686, "step": 7884 }, { "epoch": 0.7274824126398339, "grad_norm": 1.7252448191024186, "learning_rate": 2.311096490687978e-07, "loss": 0.5659, "step": 7885 }, { "epoch": 0.7274824126398339, "eval_GEN Loss": 0.4390948414802551, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34675663709640503, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8180288672447205, "eval_runtime": 57.1411, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7885 }, { "epoch": 0.7275746742013609, "grad_norm": 1.6458912772046916, "learning_rate": 2.3096358765651654e-07, "loss": 0.4828, "step": 7886 }, { "epoch": 0.7276669357628878, "grad_norm": 1.6115765306877137, "learning_rate": 2.3081756195243534e-07, "loss": 0.6378, "step": 7887 }, { "epoch": 0.7277591973244147, "grad_norm": 1.6784459088828625, "learning_rate": 2.3067157196978697e-07, "loss": 0.4691, "step": 7888 }, { "epoch": 0.7278514588859416, "grad_norm": 1.897975619926399, "learning_rate": 2.305256177218014e-07, "loss": 0.6077, "step": 7889 }, { "epoch": 0.7279437204474686, "grad_norm": 1.5455513109164465, "learning_rate": 2.3037969922170528e-07, "loss": 0.6557, "step": 7890 }, { "epoch": 0.7279437204474686, "eval_GEN Loss": 0.43964895606040955, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3534965515136719, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8227463960647583, "eval_runtime": 57.2866, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7890 }, { "epoch": 0.7280359820089956, "grad_norm": 2.5726048985180188, "learning_rate": 2.302338164827222e-07, "loss": 0.7312, "step": 7891 }, { "epoch": 0.7281282435705224, "grad_norm": 2.005950536872293, "learning_rate": 2.3008796951807183e-07, "loss": 0.5365, "step": 7892 }, { "epoch": 0.7282205051320494, "grad_norm": 2.2148986651311113, "learning_rate": 2.2994215834097118e-07, "loss": 0.5103, "step": 7893 }, { "epoch": 0.7283127666935763, "grad_norm": 2.0909658505690514, "learning_rate": 2.29796382964634e-07, "loss": 0.6589, "step": 7894 }, { "epoch": 0.7284050282551032, "grad_norm": 1.8209161796751325, "learning_rate": 2.2965064340227093e-07, "loss": 0.5728, "step": 7895 }, { "epoch": 0.7284050282551032, "eval_GEN Loss": 0.4392683207988739, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3518878221511841, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8183894157409668, "eval_runtime": 57.1708, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7895 }, { "epoch": 0.7284972898166302, "grad_norm": 1.7771325797293933, "learning_rate": 2.2950493966708856e-07, "loss": 0.6256, "step": 7896 }, { "epoch": 0.7285895513781571, "grad_norm": 2.388703911583078, "learning_rate": 2.293592717722911e-07, "loss": 0.8155, "step": 7897 }, { "epoch": 0.728681812939684, "grad_norm": 1.7006391721321144, "learning_rate": 2.2921363973107924e-07, "loss": 0.6226, "step": 7898 }, { "epoch": 0.7287740745012109, "grad_norm": 1.9569142659365577, "learning_rate": 2.2906804355665043e-07, "loss": 0.7833, "step": 7899 }, { "epoch": 0.7288663360627379, "grad_norm": 2.7529071324196046, "learning_rate": 2.2892248326219862e-07, "loss": 0.7558, "step": 7900 }, { "epoch": 0.7288663360627379, "eval_GEN Loss": 0.44006234407424927, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3524196445941925, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8178185224533081, "eval_runtime": 57.1085, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7900 }, { "epoch": 0.7289585976242647, "grad_norm": 2.2482431297171037, "learning_rate": 2.2877695886091478e-07, "loss": 0.956, "step": 7901 }, { "epoch": 0.7290508591857917, "grad_norm": 1.6834070523669256, "learning_rate": 2.286314703659867e-07, "loss": 0.6984, "step": 7902 }, { "epoch": 0.7291431207473187, "grad_norm": 3.66646045518242, "learning_rate": 2.2848601779059856e-07, "loss": 0.7585, "step": 7903 }, { "epoch": 0.7292353823088455, "grad_norm": 1.577887930481479, "learning_rate": 2.2834060114793158e-07, "loss": 0.4779, "step": 7904 }, { "epoch": 0.7293276438703725, "grad_norm": 3.40385967552502, "learning_rate": 2.2819522045116365e-07, "loss": 0.9212, "step": 7905 }, { "epoch": 0.7293276438703725, "eval_GEN Loss": 0.440186083316803, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3521534204483032, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8187800645828247, "eval_runtime": 57.3504, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7905 }, { "epoch": 0.7294199054318994, "grad_norm": 2.4773407762679818, "learning_rate": 2.280498757134697e-07, "loss": 0.7846, "step": 7906 }, { "epoch": 0.7295121669934264, "grad_norm": 1.6307001970075596, "learning_rate": 2.2790456694802039e-07, "loss": 0.5999, "step": 7907 }, { "epoch": 0.7296044285549533, "grad_norm": 1.3288212241076722, "learning_rate": 2.2775929416798466e-07, "loss": 0.388, "step": 7908 }, { "epoch": 0.7296966901164802, "grad_norm": 1.9079321406837688, "learning_rate": 2.2761405738652674e-07, "loss": 0.7814, "step": 7909 }, { "epoch": 0.7297889516780072, "grad_norm": 1.9736257934130268, "learning_rate": 2.274688566168086e-07, "loss": 0.7086, "step": 7910 }, { "epoch": 0.7297889516780072, "eval_GEN Loss": 0.43979600071907043, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3530125021934509, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8177283406257629, "eval_runtime": 56.9939, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7910 }, { "epoch": 0.729881213239534, "grad_norm": 2.650141256770645, "learning_rate": 2.2732369187198823e-07, "loss": 0.6345, "step": 7911 }, { "epoch": 0.729973474801061, "grad_norm": 2.422310251219888, "learning_rate": 2.271785631652209e-07, "loss": 0.5986, "step": 7912 }, { "epoch": 0.730065736362588, "grad_norm": 2.759432447499375, "learning_rate": 2.270334705096585e-07, "loss": 0.7175, "step": 7913 }, { "epoch": 0.7301579979241148, "grad_norm": 2.3273729744479175, "learning_rate": 2.26888413918449e-07, "loss": 0.7228, "step": 7914 }, { "epoch": 0.7302502594856418, "grad_norm": 2.3462816346290185, "learning_rate": 2.2674339340473855e-07, "loss": 0.5391, "step": 7915 }, { "epoch": 0.7302502594856418, "eval_GEN Loss": 0.44117215275764465, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3532792925834656, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8220552802085876, "eval_runtime": 57.2345, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7915 }, { "epoch": 0.7303425210471687, "grad_norm": 2.2031841039786806, "learning_rate": 2.2659840898166836e-07, "loss": 0.6471, "step": 7916 }, { "epoch": 0.7304347826086957, "grad_norm": 1.7922977144338739, "learning_rate": 2.264534606623777e-07, "loss": 0.6535, "step": 7917 }, { "epoch": 0.7305270441702226, "grad_norm": 2.7083299409845245, "learning_rate": 2.2630854846000133e-07, "loss": 0.6726, "step": 7918 }, { "epoch": 0.7306193057317495, "grad_norm": 2.5468607357497604, "learning_rate": 2.2616367238767228e-07, "loss": 0.7653, "step": 7919 }, { "epoch": 0.7307115672932765, "grad_norm": 2.2393888394541226, "learning_rate": 2.260188324585188e-07, "loss": 0.6942, "step": 7920 }, { "epoch": 0.7307115672932765, "eval_GEN Loss": 0.43999242782592773, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3557075262069702, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8200120329856873, "eval_runtime": 56.7766, "eval_samples_per_second": 1.145, "eval_steps_per_second": 0.088, "step": 7920 }, { "epoch": 0.7308038288548033, "grad_norm": 1.9428687628507841, "learning_rate": 2.2587402868566692e-07, "loss": 0.5973, "step": 7921 }, { "epoch": 0.7308960904163303, "grad_norm": 2.5143742803173406, "learning_rate": 2.2572926108223863e-07, "loss": 0.626, "step": 7922 }, { "epoch": 0.7309883519778573, "grad_norm": 1.806520432905869, "learning_rate": 2.2558452966135306e-07, "loss": 0.5361, "step": 7923 }, { "epoch": 0.7310806135393841, "grad_norm": 1.8087776060800513, "learning_rate": 2.2543983443612638e-07, "loss": 0.7539, "step": 7924 }, { "epoch": 0.7311728751009111, "grad_norm": 1.4229098554861215, "learning_rate": 2.2529517541967042e-07, "loss": 0.5379, "step": 7925 }, { "epoch": 0.7311728751009111, "eval_GEN Loss": 0.4412521719932556, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.36358290910720825, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8250600695610046, "eval_runtime": 57.1539, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7925 }, { "epoch": 0.731265136662438, "grad_norm": 2.689805975601732, "learning_rate": 2.2515055262509522e-07, "loss": 0.729, "step": 7926 }, { "epoch": 0.731357398223965, "grad_norm": 2.530293763575933, "learning_rate": 2.2500596606550607e-07, "loss": 0.6083, "step": 7927 }, { "epoch": 0.7314496597854919, "grad_norm": 1.8540071272463365, "learning_rate": 2.248614157540061e-07, "loss": 0.6501, "step": 7928 }, { "epoch": 0.7315419213470188, "grad_norm": 2.791756857041487, "learning_rate": 2.2471690170369403e-07, "loss": 1.0178, "step": 7929 }, { "epoch": 0.7316341829085458, "grad_norm": 1.773036641000174, "learning_rate": 2.2457242392766684e-07, "loss": 0.6487, "step": 7930 }, { "epoch": 0.7316341829085458, "eval_GEN Loss": 0.44059255719184875, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.366232305765152, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8267728090286255, "eval_runtime": 57.1059, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 7930 }, { "epoch": 0.7317264444700726, "grad_norm": 1.67854708871025, "learning_rate": 2.2442798243901664e-07, "loss": 0.6609, "step": 7931 }, { "epoch": 0.7318187060315996, "grad_norm": 2.557784314341645, "learning_rate": 2.2428357725083316e-07, "loss": 0.8389, "step": 7932 }, { "epoch": 0.7319109675931265, "grad_norm": 1.4092539483006314, "learning_rate": 2.241392083762027e-07, "loss": 0.5454, "step": 7933 }, { "epoch": 0.7320032291546534, "grad_norm": 1.7271788221952598, "learning_rate": 2.239948758282083e-07, "loss": 0.7131, "step": 7934 }, { "epoch": 0.7320954907161804, "grad_norm": 1.959504194443559, "learning_rate": 2.2385057961992932e-07, "loss": 0.7353, "step": 7935 }, { "epoch": 0.7320954907161804, "eval_GEN Loss": 0.441094309091568, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM Loss": 0.3644280433654785, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8248798251152039, "eval_runtime": 57.2336, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7935 }, { "epoch": 0.7321877522777073, "grad_norm": 2.5807945424572103, "learning_rate": 2.2370631976444215e-07, "loss": 0.8417, "step": 7936 }, { "epoch": 0.7322800138392342, "grad_norm": 2.3451478079044774, "learning_rate": 2.2356209627482014e-07, "loss": 0.563, "step": 7937 }, { "epoch": 0.7323722754007611, "grad_norm": 1.279503420718096, "learning_rate": 2.2341790916413268e-07, "loss": 0.5134, "step": 7938 }, { "epoch": 0.7324645369622881, "grad_norm": 2.1587876805343824, "learning_rate": 2.2327375844544633e-07, "loss": 0.6883, "step": 7939 }, { "epoch": 0.7325567985238151, "grad_norm": 1.8822836213363, "learning_rate": 2.231296441318243e-07, "loss": 0.6945, "step": 7940 }, { "epoch": 0.7325567985238151, "eval_GEN Loss": 0.4392783045768738, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3580546975135803, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8224759697914124, "eval_runtime": 57.1938, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7940 }, { "epoch": 0.7326490600853419, "grad_norm": 2.6882801650831802, "learning_rate": 2.229855662363268e-07, "loss": 0.9527, "step": 7941 }, { "epoch": 0.7327413216468689, "grad_norm": 2.659029065724765, "learning_rate": 2.2284152477200976e-07, "loss": 0.6902, "step": 7942 }, { "epoch": 0.7328335832083958, "grad_norm": 1.7647190680700415, "learning_rate": 2.2269751975192677e-07, "loss": 0.7222, "step": 7943 }, { "epoch": 0.7329258447699227, "grad_norm": 1.9725941376479896, "learning_rate": 2.2255355118912783e-07, "loss": 0.5789, "step": 7944 }, { "epoch": 0.7330181063314497, "grad_norm": 3.8237429793542272, "learning_rate": 2.2240961909665965e-07, "loss": 0.9767, "step": 7945 }, { "epoch": 0.7330181063314497, "eval_GEN Loss": 0.4389013946056366, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3570839762687683, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8211839199066162, "eval_runtime": 57.06, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 7945 }, { "epoch": 0.7331103678929766, "grad_norm": 1.6094792540686016, "learning_rate": 2.2226572348756533e-07, "loss": 0.6489, "step": 7946 }, { "epoch": 0.7332026294545035, "grad_norm": 2.4747319462549235, "learning_rate": 2.2212186437488507e-07, "loss": 0.7141, "step": 7947 }, { "epoch": 0.7332948910160304, "grad_norm": 2.2225879351578337, "learning_rate": 2.2197804177165577e-07, "loss": 0.7061, "step": 7948 }, { "epoch": 0.7333871525775574, "grad_norm": 1.6225206798612546, "learning_rate": 2.2183425569091045e-07, "loss": 0.5236, "step": 7949 }, { "epoch": 0.7334794141390844, "grad_norm": 1.722035499193365, "learning_rate": 2.2169050614567956e-07, "loss": 0.6438, "step": 7950 }, { "epoch": 0.7334794141390844, "eval_GEN Loss": 0.43925827741622925, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3566788136959076, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8207031488418579, "eval_runtime": 57.1518, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7950 }, { "epoch": 0.7335716757006112, "grad_norm": 2.0030607566373186, "learning_rate": 2.215467931489898e-07, "loss": 0.5538, "step": 7951 }, { "epoch": 0.7336639372621382, "grad_norm": 2.101861456868141, "learning_rate": 2.2140311671386485e-07, "loss": 0.7728, "step": 7952 }, { "epoch": 0.733756198823665, "grad_norm": 1.5648777607884994, "learning_rate": 2.212594768533246e-07, "loss": 0.605, "step": 7953 }, { "epoch": 0.733848460385192, "grad_norm": 2.8189140499840613, "learning_rate": 2.2111587358038597e-07, "loss": 0.8804, "step": 7954 }, { "epoch": 0.733940721946719, "grad_norm": 1.596710431311532, "learning_rate": 2.2097230690806262e-07, "loss": 0.6903, "step": 7955 }, { "epoch": 0.733940721946719, "eval_GEN Loss": 0.43953731656074524, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.35482725501060486, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8190204501152039, "eval_runtime": 57.1692, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 7955 }, { "epoch": 0.7340329835082459, "grad_norm": 1.996263338210039, "learning_rate": 2.20828776849365e-07, "loss": 0.7172, "step": 7956 }, { "epoch": 0.7341252450697728, "grad_norm": 1.4753417945859393, "learning_rate": 2.2068528341729964e-07, "loss": 0.6415, "step": 7957 }, { "epoch": 0.7342175066312997, "grad_norm": 2.2967058904247684, "learning_rate": 2.2054182662487018e-07, "loss": 0.6464, "step": 7958 }, { "epoch": 0.7343097681928267, "grad_norm": 1.627645520787659, "learning_rate": 2.2039840648507732e-07, "loss": 0.6246, "step": 7959 }, { "epoch": 0.7344020297543536, "grad_norm": 2.3284552465821666, "learning_rate": 2.2025502301091745e-07, "loss": 0.6349, "step": 7960 }, { "epoch": 0.7344020297543536, "eval_GEN Loss": 0.4401329457759857, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3480963408946991, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8192307949066162, "eval_runtime": 57.3629, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7960 }, { "epoch": 0.7344942913158805, "grad_norm": 2.475650230817161, "learning_rate": 2.2011167621538454e-07, "loss": 0.6499, "step": 7961 }, { "epoch": 0.7345865528774075, "grad_norm": 1.868066971396064, "learning_rate": 2.1996836611146877e-07, "loss": 0.5169, "step": 7962 }, { "epoch": 0.7346788144389343, "grad_norm": 2.295767611312265, "learning_rate": 2.1982509271215744e-07, "loss": 0.646, "step": 7963 }, { "epoch": 0.7347710760004613, "grad_norm": 1.6826770750608961, "learning_rate": 2.1968185603043347e-07, "loss": 0.56, "step": 7964 }, { "epoch": 0.7348633375619882, "grad_norm": 2.1926034929465543, "learning_rate": 2.1953865607927817e-07, "loss": 0.7633, "step": 7965 }, { "epoch": 0.7348633375619882, "eval_GEN Loss": 0.43896815180778503, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34418657422065735, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8180589079856873, "eval_runtime": 57.0324, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 7965 }, { "epoch": 0.7349555991235152, "grad_norm": 2.571377629004295, "learning_rate": 2.1939549287166787e-07, "loss": 0.7524, "step": 7966 }, { "epoch": 0.7350478606850421, "grad_norm": 3.5513056020232443, "learning_rate": 2.192523664205766e-07, "loss": 0.917, "step": 7967 }, { "epoch": 0.735140122246569, "grad_norm": 2.8800962966687282, "learning_rate": 2.1910927673897436e-07, "loss": 0.9761, "step": 7968 }, { "epoch": 0.735232383808096, "grad_norm": 2.2546294707801513, "learning_rate": 2.1896622383982837e-07, "loss": 0.5211, "step": 7969 }, { "epoch": 0.7353246453696228, "grad_norm": 2.7589928686020126, "learning_rate": 2.1882320773610224e-07, "loss": 0.5752, "step": 7970 }, { "epoch": 0.7353246453696228, "eval_GEN Loss": 0.43903622031211853, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34562739729881287, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8188701868057251, "eval_runtime": 57.2631, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7970 }, { "epoch": 0.7354169069311498, "grad_norm": 1.5463494375457296, "learning_rate": 2.1868022844075638e-07, "loss": 0.719, "step": 7971 }, { "epoch": 0.7355091684926768, "grad_norm": 1.621789964515967, "learning_rate": 2.1853728596674797e-07, "loss": 0.7158, "step": 7972 }, { "epoch": 0.7356014300542036, "grad_norm": 1.746903501024696, "learning_rate": 2.1839438032703025e-07, "loss": 0.8234, "step": 7973 }, { "epoch": 0.7356936916157306, "grad_norm": 1.8494244752564273, "learning_rate": 2.1825151153455404e-07, "loss": 0.4436, "step": 7974 }, { "epoch": 0.7357859531772575, "grad_norm": 2.254473364385892, "learning_rate": 2.1810867960226564e-07, "loss": 0.6034, "step": 7975 }, { "epoch": 0.7357859531772575, "eval_GEN Loss": 0.4394301474094391, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.34757712483406067, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8208833932876587, "eval_runtime": 57.3739, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7975 }, { "epoch": 0.7358782147387845, "grad_norm": 1.8547993867929344, "learning_rate": 2.1796588454310965e-07, "loss": 0.5982, "step": 7976 }, { "epoch": 0.7359704763003114, "grad_norm": 2.041324949634301, "learning_rate": 2.1782312637002556e-07, "loss": 0.6966, "step": 7977 }, { "epoch": 0.7360627378618383, "grad_norm": 1.6485361514736159, "learning_rate": 2.1768040509595093e-07, "loss": 0.7311, "step": 7978 }, { "epoch": 0.7361549994233653, "grad_norm": 1.7711470832865897, "learning_rate": 2.175377207338187e-07, "loss": 0.6589, "step": 7979 }, { "epoch": 0.7362472609848921, "grad_norm": 2.4551125108980654, "learning_rate": 2.1739507329655997e-07, "loss": 0.6037, "step": 7980 }, { "epoch": 0.7362472609848921, "eval_GEN Loss": 0.4381187856197357, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34427329897880554, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8170071840286255, "eval_runtime": 57.2607, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 7980 }, { "epoch": 0.7363395225464191, "grad_norm": 1.6542337751732537, "learning_rate": 2.1725246279710107e-07, "loss": 0.6153, "step": 7981 }, { "epoch": 0.7364317841079461, "grad_norm": 2.390067310333501, "learning_rate": 2.1710988924836585e-07, "loss": 0.6448, "step": 7982 }, { "epoch": 0.7365240456694729, "grad_norm": 1.6378131678405312, "learning_rate": 2.169673526632747e-07, "loss": 0.6149, "step": 7983 }, { "epoch": 0.7366163072309999, "grad_norm": 1.762845264536676, "learning_rate": 2.1682485305474406e-07, "loss": 0.7267, "step": 7984 }, { "epoch": 0.7367085687925268, "grad_norm": 1.6730143843556873, "learning_rate": 2.1668239043568788e-07, "loss": 0.6733, "step": 7985 }, { "epoch": 0.7367085687925268, "eval_GEN Loss": 0.4375797212123871, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34300416707992554, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8179687261581421, "eval_runtime": 57.3018, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 7985 }, { "epoch": 0.7368008303540537, "grad_norm": 4.366056890973289, "learning_rate": 2.1653996481901586e-07, "loss": 0.8108, "step": 7986 }, { "epoch": 0.7368930919155807, "grad_norm": 3.286007039577742, "learning_rate": 2.1639757621763548e-07, "loss": 0.6503, "step": 7987 }, { "epoch": 0.7369853534771076, "grad_norm": 2.7444610647246805, "learning_rate": 2.162552246444497e-07, "loss": 0.8093, "step": 7988 }, { "epoch": 0.7370776150386346, "grad_norm": 1.800917562336719, "learning_rate": 2.1611291011235886e-07, "loss": 0.6856, "step": 7989 }, { "epoch": 0.7371698766001614, "grad_norm": 1.9278075510775292, "learning_rate": 2.159706326342597e-07, "loss": 0.5085, "step": 7990 }, { "epoch": 0.7371698766001614, "eval_GEN Loss": 0.4386669397354126, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.34374362230300903, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8210336565971375, "eval_runtime": 57.3901, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 7990 }, { "epoch": 0.7372621381616884, "grad_norm": 3.7844447114330007, "learning_rate": 2.1582839222304586e-07, "loss": 1.0033, "step": 7991 }, { "epoch": 0.7373543997232154, "grad_norm": 1.829202270938417, "learning_rate": 2.1568618889160695e-07, "loss": 0.586, "step": 7992 }, { "epoch": 0.7374466612847422, "grad_norm": 2.019940678471704, "learning_rate": 2.1554402265282985e-07, "loss": 0.6818, "step": 7993 }, { "epoch": 0.7375389228462692, "grad_norm": 1.8755963299126046, "learning_rate": 2.1540189351959812e-07, "loss": 0.5694, "step": 7994 }, { "epoch": 0.7376311844077961, "grad_norm": 1.8571807790913137, "learning_rate": 2.152598015047913e-07, "loss": 0.6849, "step": 7995 }, { "epoch": 0.7376311844077961, "eval_GEN Loss": 0.4382859170436859, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3435203731060028, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.819411039352417, "eval_runtime": 57.2006, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 7995 }, { "epoch": 0.737723445969323, "grad_norm": 1.889308194118825, "learning_rate": 2.151177466212863e-07, "loss": 0.6402, "step": 7996 }, { "epoch": 0.7378157075308499, "grad_norm": 2.2337534517132513, "learning_rate": 2.1497572888195617e-07, "loss": 0.5861, "step": 7997 }, { "epoch": 0.7379079690923769, "grad_norm": 1.4460265399807637, "learning_rate": 2.1483374829967111e-07, "loss": 0.5322, "step": 7998 }, { "epoch": 0.7380002306539039, "grad_norm": 2.0308827691794904, "learning_rate": 2.1469180488729717e-07, "loss": 0.7742, "step": 7999 }, { "epoch": 0.7380924922154307, "grad_norm": 2.47631028217819, "learning_rate": 2.145498986576977e-07, "loss": 0.6599, "step": 8000 }, { "epoch": 0.7380924922154307, "eval_GEN Loss": 0.4389457106590271, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3427395224571228, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8228966593742371, "eval_runtime": 57.1832, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8000 }, { "epoch": 0.7381847537769577, "grad_norm": 2.046362642796398, "learning_rate": 2.1440802962373248e-07, "loss": 0.8098, "step": 8001 }, { "epoch": 0.7382770153384846, "grad_norm": 1.4435512934544006, "learning_rate": 2.142661977982581e-07, "loss": 0.4291, "step": 8002 }, { "epoch": 0.7383692769000115, "grad_norm": 2.012431486065352, "learning_rate": 2.141244031941272e-07, "loss": 0.5144, "step": 8003 }, { "epoch": 0.7384615384615385, "grad_norm": 2.4961006175960203, "learning_rate": 2.1398264582418955e-07, "loss": 0.564, "step": 8004 }, { "epoch": 0.7385538000230654, "grad_norm": 1.9107634355678826, "learning_rate": 2.1384092570129154e-07, "loss": 0.7258, "step": 8005 }, { "epoch": 0.7385538000230654, "eval_GEN Loss": 0.4390805661678314, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.3428064286708832, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8217848539352417, "eval_runtime": 57.2996, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8005 }, { "epoch": 0.7386460615845923, "grad_norm": 3.300990362770836, "learning_rate": 2.136992428382762e-07, "loss": 0.8439, "step": 8006 }, { "epoch": 0.7387383231461192, "grad_norm": 1.866461873185808, "learning_rate": 2.1355759724798275e-07, "loss": 0.5885, "step": 8007 }, { "epoch": 0.7388305847076462, "grad_norm": 2.649056466220046, "learning_rate": 2.1341598894324739e-07, "loss": 0.7351, "step": 8008 }, { "epoch": 0.7389228462691732, "grad_norm": 1.9463865941665526, "learning_rate": 2.1327441793690313e-07, "loss": 0.66, "step": 8009 }, { "epoch": 0.7390151078307, "grad_norm": 1.7308664482373413, "learning_rate": 2.1313288424177895e-07, "loss": 0.5243, "step": 8010 }, { "epoch": 0.7390151078307, "eval_GEN Loss": 0.438196063041687, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3405686616897583, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8198317289352417, "eval_runtime": 57.1945, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8010 }, { "epoch": 0.739107369392227, "grad_norm": 2.4641760795452083, "learning_rate": 2.1299138787070114e-07, "loss": 0.8057, "step": 8011 }, { "epoch": 0.7391996309537539, "grad_norm": 1.6580597712329912, "learning_rate": 2.1284992883649226e-07, "loss": 0.6231, "step": 8012 }, { "epoch": 0.7392918925152808, "grad_norm": 2.039429562212772, "learning_rate": 2.127085071519718e-07, "loss": 0.7599, "step": 8013 }, { "epoch": 0.7393841540768078, "grad_norm": 2.139268994274617, "learning_rate": 2.1256712282995493e-07, "loss": 0.8077, "step": 8014 }, { "epoch": 0.7394764156383347, "grad_norm": 3.8546857783259916, "learning_rate": 2.12425775883255e-07, "loss": 0.7647, "step": 8015 }, { "epoch": 0.7394764156383347, "eval_GEN Loss": 0.4373180866241455, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33909299969673157, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.818629801273346, "eval_runtime": 56.0357, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 8015 }, { "epoch": 0.7395686771998616, "grad_norm": 1.5267552119279062, "learning_rate": 2.122844663246805e-07, "loss": 0.6688, "step": 8016 }, { "epoch": 0.7396609387613885, "grad_norm": 1.3726202160537173, "learning_rate": 2.1214319416703745e-07, "loss": 0.6024, "step": 8017 }, { "epoch": 0.7397532003229155, "grad_norm": 1.8981332852684052, "learning_rate": 2.1200195942312777e-07, "loss": 0.687, "step": 8018 }, { "epoch": 0.7398454618844424, "grad_norm": 1.6907693097207817, "learning_rate": 2.1186076210575059e-07, "loss": 0.5601, "step": 8019 }, { "epoch": 0.7399377234459693, "grad_norm": 2.500785683234993, "learning_rate": 2.1171960222770168e-07, "loss": 0.8809, "step": 8020 }, { "epoch": 0.7399377234459693, "eval_GEN Loss": 0.43813613057136536, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33785414695739746, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8186598420143127, "eval_runtime": 56.0686, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 8020 }, { "epoch": 0.7400299850074963, "grad_norm": 1.5531614873419142, "learning_rate": 2.1157847980177246e-07, "loss": 0.5164, "step": 8021 }, { "epoch": 0.7401222465690231, "grad_norm": 2.2291870878467837, "learning_rate": 2.1143739484075264e-07, "loss": 0.685, "step": 8022 }, { "epoch": 0.7402145081305501, "grad_norm": 3.4359162360062476, "learning_rate": 2.1129634735742678e-07, "loss": 0.6744, "step": 8023 }, { "epoch": 0.7403067696920771, "grad_norm": 2.1713903897707545, "learning_rate": 2.111553373645773e-07, "loss": 0.651, "step": 8024 }, { "epoch": 0.740399031253604, "grad_norm": 1.6030929478297355, "learning_rate": 2.1101436487498219e-07, "loss": 0.7317, "step": 8025 }, { "epoch": 0.740399031253604, "eval_GEN Loss": 0.4377763271331787, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3350926637649536, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8161057829856873, "eval_runtime": 56.2439, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8025 }, { "epoch": 0.7404912928151309, "grad_norm": 3.3167236432131766, "learning_rate": 2.1087342990141729e-07, "loss": 0.6856, "step": 8026 }, { "epoch": 0.7405835543766578, "grad_norm": 1.721118821582812, "learning_rate": 2.1073253245665387e-07, "loss": 0.639, "step": 8027 }, { "epoch": 0.7406758159381848, "grad_norm": 2.1007891221866966, "learning_rate": 2.1059167255346042e-07, "loss": 0.7395, "step": 8028 }, { "epoch": 0.7407680774997116, "grad_norm": 1.544269901723135, "learning_rate": 2.104508502046021e-07, "loss": 0.5851, "step": 8029 }, { "epoch": 0.7408603390612386, "grad_norm": 2.1170742843213497, "learning_rate": 2.1031006542284002e-07, "loss": 0.8782, "step": 8030 }, { "epoch": 0.7408603390612386, "eval_GEN Loss": 0.43792131543159485, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.33655041456222534, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8161959052085876, "eval_runtime": 56.2732, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 8030 }, { "epoch": 0.7409526006227656, "grad_norm": 1.8703040574857739, "learning_rate": 2.101693182209328e-07, "loss": 0.6904, "step": 8031 }, { "epoch": 0.7410448621842924, "grad_norm": 1.4845020025912739, "learning_rate": 2.1002860861163446e-07, "loss": 0.5255, "step": 8032 }, { "epoch": 0.7411371237458194, "grad_norm": 1.7674399991708978, "learning_rate": 2.0988793660769718e-07, "loss": 0.607, "step": 8033 }, { "epoch": 0.7412293853073463, "grad_norm": 2.3930408278805624, "learning_rate": 2.097473022218683e-07, "loss": 0.6166, "step": 8034 }, { "epoch": 0.7413216468688733, "grad_norm": 2.098339855135153, "learning_rate": 2.0960670546689273e-07, "loss": 0.6446, "step": 8035 }, { "epoch": 0.7413216468688733, "eval_GEN Loss": 0.43794283270835876, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3342767357826233, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8165865540504456, "eval_runtime": 56.2295, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8035 }, { "epoch": 0.7414139084304002, "grad_norm": 1.65683171783807, "learning_rate": 2.0946614635551088e-07, "loss": 0.6083, "step": 8036 }, { "epoch": 0.7415061699919271, "grad_norm": 2.6148783603934556, "learning_rate": 2.0932562490046131e-07, "loss": 0.7316, "step": 8037 }, { "epoch": 0.7415984315534541, "grad_norm": 2.604222643075845, "learning_rate": 2.0918514111447776e-07, "loss": 0.6588, "step": 8038 }, { "epoch": 0.7416906931149809, "grad_norm": 2.100779011760131, "learning_rate": 2.0904469501029125e-07, "loss": 0.6301, "step": 8039 }, { "epoch": 0.7417829546765079, "grad_norm": 2.6197449153139893, "learning_rate": 2.0890428660062932e-07, "loss": 0.8319, "step": 8040 }, { "epoch": 0.7417829546765079, "eval_GEN Loss": 0.4380934536457062, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3357158303260803, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8197416067123413, "eval_runtime": 56.2081, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8040 }, { "epoch": 0.7418752162380349, "grad_norm": 2.2560699126716752, "learning_rate": 2.087639158982157e-07, "loss": 0.6266, "step": 8041 }, { "epoch": 0.7419674777995617, "grad_norm": 2.9450846403192426, "learning_rate": 2.0862358291577123e-07, "loss": 0.6564, "step": 8042 }, { "epoch": 0.7420597393610887, "grad_norm": 1.7818301512941401, "learning_rate": 2.0848328766601304e-07, "loss": 0.6447, "step": 8043 }, { "epoch": 0.7421520009226156, "grad_norm": 1.8039239720617395, "learning_rate": 2.0834303016165508e-07, "loss": 0.7254, "step": 8044 }, { "epoch": 0.7422442624841425, "grad_norm": 3.6483484112245925, "learning_rate": 2.082028104154074e-07, "loss": 0.7985, "step": 8045 }, { "epoch": 0.7422442624841425, "eval_GEN Loss": 0.438777893781662, "eval_GEN top-5 accuracy": 0.9846558526961858, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 Neg": 0.625, "eval_PRM Loss": 0.33837246894836426, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8205228447914124, "eval_runtime": 56.3607, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8045 }, { "epoch": 0.7423365240456695, "grad_norm": 1.7675062463399174, "learning_rate": 2.0806262843997713e-07, "loss": 0.613, "step": 8046 }, { "epoch": 0.7424287856071964, "grad_norm": 2.080071802524963, "learning_rate": 2.0792248424806766e-07, "loss": 0.729, "step": 8047 }, { "epoch": 0.7425210471687234, "grad_norm": 1.4287188444031464, "learning_rate": 2.0778237785237936e-07, "loss": 0.5894, "step": 8048 }, { "epoch": 0.7426133087302502, "grad_norm": 2.230440212887735, "learning_rate": 2.0764230926560853e-07, "loss": 0.8056, "step": 8049 }, { "epoch": 0.7427055702917772, "grad_norm": 2.399450863678101, "learning_rate": 2.075022785004486e-07, "loss": 0.7342, "step": 8050 }, { "epoch": 0.7427055702917772, "eval_GEN Loss": 0.43929818272590637, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3406790494918823, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8148738145828247, "eval_runtime": 56.2515, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8050 }, { "epoch": 0.7427978318533042, "grad_norm": 1.383050681853717, "learning_rate": 2.0736228556958927e-07, "loss": 0.5219, "step": 8051 }, { "epoch": 0.742890093414831, "grad_norm": 2.2549497727394416, "learning_rate": 2.0722233048571723e-07, "loss": 0.6587, "step": 8052 }, { "epoch": 0.742982354976358, "grad_norm": 1.7942750217348034, "learning_rate": 2.0708241326151498e-07, "loss": 0.8211, "step": 8053 }, { "epoch": 0.7430746165378849, "grad_norm": 2.110293135239807, "learning_rate": 2.069425339096623e-07, "loss": 0.7003, "step": 8054 }, { "epoch": 0.7431668780994118, "grad_norm": 2.360835885004535, "learning_rate": 2.0680269244283533e-07, "loss": 0.6667, "step": 8055 }, { "epoch": 0.7431668780994118, "eval_GEN Loss": 0.4388917088508606, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3457129895687103, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8139122724533081, "eval_runtime": 56.1323, "eval_samples_per_second": 1.158, "eval_steps_per_second": 0.089, "step": 8055 }, { "epoch": 0.7432591396609388, "grad_norm": 2.555591559327794, "learning_rate": 2.0666288887370648e-07, "loss": 0.6572, "step": 8056 }, { "epoch": 0.7433514012224657, "grad_norm": 1.5847481045384113, "learning_rate": 2.0652312321494512e-07, "loss": 0.5159, "step": 8057 }, { "epoch": 0.7434436627839927, "grad_norm": 2.139446448486914, "learning_rate": 2.0638339547921702e-07, "loss": 0.7057, "step": 8058 }, { "epoch": 0.7435359243455195, "grad_norm": 2.2098488875808484, "learning_rate": 2.0624370567918473e-07, "loss": 0.525, "step": 8059 }, { "epoch": 0.7436281859070465, "grad_norm": 2.4693250508394065, "learning_rate": 2.0610405382750657e-07, "loss": 0.7677, "step": 8060 }, { "epoch": 0.7436281859070465, "eval_GEN Loss": 0.438445508480072, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3457964062690735, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8094651699066162, "eval_runtime": 56.2412, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8060 }, { "epoch": 0.7437204474685734, "grad_norm": 1.8921055947067549, "learning_rate": 2.0596443993683878e-07, "loss": 0.623, "step": 8061 }, { "epoch": 0.7438127090301003, "grad_norm": 2.7387342484668946, "learning_rate": 2.0582486401983287e-07, "loss": 0.6772, "step": 8062 }, { "epoch": 0.7439049705916273, "grad_norm": 2.4492641103068253, "learning_rate": 2.0568532608913775e-07, "loss": 0.8234, "step": 8063 }, { "epoch": 0.7439972321531542, "grad_norm": 1.9049972739013983, "learning_rate": 2.0554582615739816e-07, "loss": 0.6912, "step": 8064 }, { "epoch": 0.7440894937146811, "grad_norm": 3.0339665163374105, "learning_rate": 2.0540636423725605e-07, "loss": 0.5529, "step": 8065 }, { "epoch": 0.7440894937146811, "eval_GEN Loss": 0.43823832273483276, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3451066315174103, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8099158406257629, "eval_runtime": 56.2565, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 8065 }, { "epoch": 0.744181755276208, "grad_norm": 1.6359129446390865, "learning_rate": 2.0526694034134994e-07, "loss": 0.6651, "step": 8066 }, { "epoch": 0.744274016837735, "grad_norm": 2.4577499843953126, "learning_rate": 2.0512755448231407e-07, "loss": 0.7118, "step": 8067 }, { "epoch": 0.744366278399262, "grad_norm": 1.5296619477610705, "learning_rate": 2.0498820667278013e-07, "loss": 0.6314, "step": 8068 }, { "epoch": 0.7444585399607888, "grad_norm": 2.98935448447665, "learning_rate": 2.0484889692537598e-07, "loss": 0.6932, "step": 8069 }, { "epoch": 0.7445508015223158, "grad_norm": 2.6135173648679255, "learning_rate": 2.0470962525272634e-07, "loss": 0.6794, "step": 8070 }, { "epoch": 0.7445508015223158, "eval_GEN Loss": 0.43753138184547424, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3442704975605011, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.809645414352417, "eval_runtime": 56.211, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8070 }, { "epoch": 0.7446430630838426, "grad_norm": 2.200643484787776, "learning_rate": 2.0457039166745164e-07, "loss": 0.6883, "step": 8071 }, { "epoch": 0.7447353246453696, "grad_norm": 2.458626325816072, "learning_rate": 2.0443119618217017e-07, "loss": 0.7375, "step": 8072 }, { "epoch": 0.7448275862068966, "grad_norm": 2.7162349129538264, "learning_rate": 2.042920388094955e-07, "loss": 0.6705, "step": 8073 }, { "epoch": 0.7449198477684235, "grad_norm": 1.6051753846061199, "learning_rate": 2.041529195620387e-07, "loss": 0.4827, "step": 8074 }, { "epoch": 0.7450121093299504, "grad_norm": 1.5373864492957319, "learning_rate": 2.0401383845240653e-07, "loss": 0.5302, "step": 8075 }, { "epoch": 0.7450121093299504, "eval_GEN Loss": 0.4376084506511688, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.33912861347198486, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8088040947914124, "eval_runtime": 56.3313, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 8075 }, { "epoch": 0.7451043708914773, "grad_norm": 2.416557237685905, "learning_rate": 2.0387479549320292e-07, "loss": 0.6882, "step": 8076 }, { "epoch": 0.7451966324530043, "grad_norm": 1.6397212972146815, "learning_rate": 2.0373579069702825e-07, "loss": 0.5739, "step": 8077 }, { "epoch": 0.7452888940145312, "grad_norm": 2.0324572130996548, "learning_rate": 2.0359682407647928e-07, "loss": 0.5816, "step": 8078 }, { "epoch": 0.7453811555760581, "grad_norm": 1.7887536683774683, "learning_rate": 2.0345789564414964e-07, "loss": 0.5513, "step": 8079 }, { "epoch": 0.7454734171375851, "grad_norm": 2.009685914124151, "learning_rate": 2.0331900541262883e-07, "loss": 0.6496, "step": 8080 }, { "epoch": 0.7454734171375851, "eval_GEN Loss": 0.4374493658542633, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33356618881225586, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8133413195610046, "eval_runtime": 57.1914, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8080 }, { "epoch": 0.7455656786991119, "grad_norm": 3.9802073019643194, "learning_rate": 2.0318015339450366e-07, "loss": 0.7408, "step": 8081 }, { "epoch": 0.7456579402606389, "grad_norm": 2.396547249591225, "learning_rate": 2.030413396023565e-07, "loss": 0.713, "step": 8082 }, { "epoch": 0.7457502018221659, "grad_norm": 3.195937280893646, "learning_rate": 2.029025640487678e-07, "loss": 0.6676, "step": 8083 }, { "epoch": 0.7458424633836928, "grad_norm": 1.8267052095609593, "learning_rate": 2.0276382674631293e-07, "loss": 0.5352, "step": 8084 }, { "epoch": 0.7459347249452197, "grad_norm": 2.557676803607631, "learning_rate": 2.0262512770756465e-07, "loss": 0.6206, "step": 8085 }, { "epoch": 0.7459347249452197, "eval_GEN Loss": 0.43800053000450134, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3274078667163849, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8116586804389954, "eval_runtime": 57.2001, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8085 }, { "epoch": 0.7460269865067466, "grad_norm": 2.3680728706233185, "learning_rate": 2.024864669450921e-07, "loss": 0.7487, "step": 8086 }, { "epoch": 0.7461192480682736, "grad_norm": 1.6864861372373663, "learning_rate": 2.0234784447146126e-07, "loss": 0.5152, "step": 8087 }, { "epoch": 0.7462115096298004, "grad_norm": 2.039144785605029, "learning_rate": 2.022092602992337e-07, "loss": 0.6738, "step": 8088 }, { "epoch": 0.7463037711913274, "grad_norm": 3.430485308791236, "learning_rate": 2.020707144409685e-07, "loss": 0.8198, "step": 8089 }, { "epoch": 0.7463960327528544, "grad_norm": 1.898287002787234, "learning_rate": 2.0193220690922112e-07, "loss": 0.5669, "step": 8090 }, { "epoch": 0.7463960327528544, "eval_GEN Loss": 0.43749722838401794, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3259943723678589, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8110576868057251, "eval_runtime": 57.0274, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 8090 }, { "epoch": 0.7464882943143812, "grad_norm": 1.5078621754336834, "learning_rate": 2.0179373771654277e-07, "loss": 0.489, "step": 8091 }, { "epoch": 0.7465805558759082, "grad_norm": 1.4271414973155998, "learning_rate": 2.016553068754821e-07, "loss": 0.6413, "step": 8092 }, { "epoch": 0.7466728174374351, "grad_norm": 1.9109265795612174, "learning_rate": 2.0151691439858387e-07, "loss": 0.6093, "step": 8093 }, { "epoch": 0.746765078998962, "grad_norm": 2.3801957781280403, "learning_rate": 2.0137856029838963e-07, "loss": 0.6118, "step": 8094 }, { "epoch": 0.746857340560489, "grad_norm": 1.844754434448371, "learning_rate": 2.012402445874369e-07, "loss": 0.5635, "step": 8095 }, { "epoch": 0.746857340560489, "eval_GEN Loss": 0.4379826486110687, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.327656626701355, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8125600814819336, "eval_runtime": 57.0091, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 8095 }, { "epoch": 0.7469496021220159, "grad_norm": 1.9626721501204354, "learning_rate": 2.0110196727826013e-07, "loss": 0.5343, "step": 8096 }, { "epoch": 0.7470418636835429, "grad_norm": 1.8532899432597953, "learning_rate": 2.0096372838339032e-07, "loss": 0.6118, "step": 8097 }, { "epoch": 0.7471341252450697, "grad_norm": 2.755702644268455, "learning_rate": 2.0082552791535508e-07, "loss": 0.7845, "step": 8098 }, { "epoch": 0.7472263868065967, "grad_norm": 3.1959674823034425, "learning_rate": 2.00687365886678e-07, "loss": 0.5663, "step": 8099 }, { "epoch": 0.7473186483681237, "grad_norm": 1.7569827449382927, "learning_rate": 2.0054924230987968e-07, "loss": 0.7188, "step": 8100 }, { "epoch": 0.7473186483681237, "eval_GEN Loss": 0.43827423453330994, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3293844163417816, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8154146671295166, "eval_runtime": 57.3889, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 8100 }, { "epoch": 0.7474109099296505, "grad_norm": 1.4728977093573952, "learning_rate": 2.0041115719747733e-07, "loss": 0.4483, "step": 8101 }, { "epoch": 0.7475031714911775, "grad_norm": 1.5725359997412163, "learning_rate": 2.00273110561984e-07, "loss": 0.5922, "step": 8102 }, { "epoch": 0.7475954330527044, "grad_norm": 1.894855495549885, "learning_rate": 2.0013510241590997e-07, "loss": 0.527, "step": 8103 }, { "epoch": 0.7476876946142313, "grad_norm": 1.819342552795827, "learning_rate": 1.9999713277176167e-07, "loss": 0.7112, "step": 8104 }, { "epoch": 0.7477799561757583, "grad_norm": 1.5224013345878789, "learning_rate": 1.998592016420424e-07, "loss": 0.5681, "step": 8105 }, { "epoch": 0.7477799561757583, "eval_GEN Loss": 0.4382474422454834, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.32867980003356934, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.818088948726654, "eval_runtime": 57.1212, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8105 }, { "epoch": 0.7478722177372852, "grad_norm": 2.7119973016328864, "learning_rate": 1.9972130903925122e-07, "loss": 0.9509, "step": 8106 }, { "epoch": 0.7479644792988122, "grad_norm": 3.2796993156631404, "learning_rate": 1.995834549758844e-07, "loss": 0.8072, "step": 8107 }, { "epoch": 0.748056740860339, "grad_norm": 1.9734621452797734, "learning_rate": 1.994456394644345e-07, "loss": 0.6788, "step": 8108 }, { "epoch": 0.748149002421866, "grad_norm": 2.223812678196682, "learning_rate": 1.993078625173908e-07, "loss": 0.6738, "step": 8109 }, { "epoch": 0.748241263983393, "grad_norm": 1.9069377581348363, "learning_rate": 1.9917012414723852e-07, "loss": 0.5967, "step": 8110 }, { "epoch": 0.748241263983393, "eval_GEN Loss": 0.4375027120113373, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9101796407185628, "eval_PRM F1 AUC": 0.7839182818229439, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3254123330116272, "eval_PRM NPV": 0.6818181818181818, "eval_PRM Precision": 0.9047619047619048, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8170071840286255, "eval_runtime": 57.1679, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8110 }, { "epoch": 0.7483335255449198, "grad_norm": 2.6679946582291354, "learning_rate": 1.9903242436645979e-07, "loss": 0.9168, "step": 8111 }, { "epoch": 0.7484257871064468, "grad_norm": 1.9011141982821456, "learning_rate": 1.988947631875334e-07, "loss": 0.7708, "step": 8112 }, { "epoch": 0.7485180486679737, "grad_norm": 1.9422400615245567, "learning_rate": 1.9875714062293417e-07, "loss": 0.4816, "step": 8113 }, { "epoch": 0.7486103102295006, "grad_norm": 3.128276242763716, "learning_rate": 1.986195566851337e-07, "loss": 0.5929, "step": 8114 }, { "epoch": 0.7487025717910276, "grad_norm": 2.0296861526726095, "learning_rate": 1.984820113866002e-07, "loss": 0.7423, "step": 8115 }, { "epoch": 0.7487025717910276, "eval_GEN Loss": 0.43707072734832764, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3247678875923157, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8149038553237915, "eval_runtime": 57.0847, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8115 }, { "epoch": 0.7487948333525545, "grad_norm": 1.7650998711611063, "learning_rate": 1.9834450473979833e-07, "loss": 0.608, "step": 8116 }, { "epoch": 0.7488870949140815, "grad_norm": 3.3512376202599805, "learning_rate": 1.982070367571886e-07, "loss": 0.8236, "step": 8117 }, { "epoch": 0.7489793564756083, "grad_norm": 1.5055120640141137, "learning_rate": 1.9806960745122936e-07, "loss": 0.5343, "step": 8118 }, { "epoch": 0.7490716180371353, "grad_norm": 2.3032769890997997, "learning_rate": 1.979322168343741e-07, "loss": 0.715, "step": 8119 }, { "epoch": 0.7491638795986622, "grad_norm": 2.2780968906468004, "learning_rate": 1.9779486491907383e-07, "loss": 0.7181, "step": 8120 }, { "epoch": 0.7491638795986622, "eval_GEN Loss": 0.43772652745246887, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.32814422249794006, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8181790709495544, "eval_runtime": 56.0472, "eval_samples_per_second": 1.16, "eval_steps_per_second": 0.089, "step": 8120 }, { "epoch": 0.7492561411601891, "grad_norm": 2.2256089852294663, "learning_rate": 1.9765755171777492e-07, "loss": 0.6781, "step": 8121 }, { "epoch": 0.7493484027217161, "grad_norm": 2.5383621554907574, "learning_rate": 1.9752027724292167e-07, "loss": 0.7185, "step": 8122 }, { "epoch": 0.749440664283243, "grad_norm": 1.7246551487518726, "learning_rate": 1.973830415069536e-07, "loss": 0.7201, "step": 8123 }, { "epoch": 0.7495329258447699, "grad_norm": 2.0374755417494868, "learning_rate": 1.9724584452230736e-07, "loss": 0.7134, "step": 8124 }, { "epoch": 0.7496251874062968, "grad_norm": 1.4236599160542456, "learning_rate": 1.971086863014162e-07, "loss": 0.6043, "step": 8125 }, { "epoch": 0.7496251874062968, "eval_GEN Loss": 0.43690600991249084, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3260045647621155, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8136118054389954, "eval_runtime": 57.0876, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8125 }, { "epoch": 0.7497174489678238, "grad_norm": 2.562846910082985, "learning_rate": 1.9697156685670917e-07, "loss": 0.7861, "step": 8126 }, { "epoch": 0.7498097105293507, "grad_norm": 2.313736803892231, "learning_rate": 1.9683448620061273e-07, "loss": 0.8796, "step": 8127 }, { "epoch": 0.7499019720908776, "grad_norm": 2.293759244770071, "learning_rate": 1.9669744434554868e-07, "loss": 0.7058, "step": 8128 }, { "epoch": 0.7499942336524046, "grad_norm": 1.3754331815280063, "learning_rate": 1.9656044130393675e-07, "loss": 0.5356, "step": 8129 }, { "epoch": 0.7500864952139314, "grad_norm": 1.962934078325475, "learning_rate": 1.9642347708819182e-07, "loss": 0.7177, "step": 8130 }, { "epoch": 0.7500864952139314, "eval_GEN Loss": 0.4379958510398865, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3294261693954468, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8137620091438293, "eval_runtime": 56.3322, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 8130 }, { "epoch": 0.7501787567754584, "grad_norm": 2.972603253965086, "learning_rate": 1.9628655171072618e-07, "loss": 0.6343, "step": 8131 }, { "epoch": 0.7502710183369854, "grad_norm": 2.2217585323038938, "learning_rate": 1.9614966518394763e-07, "loss": 0.7406, "step": 8132 }, { "epoch": 0.7503632798985123, "grad_norm": 1.645296969658462, "learning_rate": 1.9601281752026184e-07, "loss": 0.4993, "step": 8133 }, { "epoch": 0.7504555414600392, "grad_norm": 2.5592340930225337, "learning_rate": 1.9587600873206956e-07, "loss": 0.8165, "step": 8134 }, { "epoch": 0.7505478030215661, "grad_norm": 1.6644559201766844, "learning_rate": 1.9573923883176888e-07, "loss": 0.5512, "step": 8135 }, { "epoch": 0.7505478030215661, "eval_GEN Loss": 0.43803995847702026, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.33369556069374084, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8110276460647583, "eval_runtime": 56.2602, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 8135 }, { "epoch": 0.7506400645830931, "grad_norm": 2.048929582328461, "learning_rate": 1.9560250783175416e-07, "loss": 0.7053, "step": 8136 }, { "epoch": 0.75073232614462, "grad_norm": 2.1544022530798803, "learning_rate": 1.9546581574441586e-07, "loss": 0.4976, "step": 8137 }, { "epoch": 0.7508245877061469, "grad_norm": 1.5903508942360953, "learning_rate": 1.953291625821417e-07, "loss": 0.5678, "step": 8138 }, { "epoch": 0.7509168492676739, "grad_norm": 2.0460725407348925, "learning_rate": 1.951925483573147e-07, "loss": 0.627, "step": 8139 }, { "epoch": 0.7510091108292007, "grad_norm": 2.666972928588087, "learning_rate": 1.9505597308231588e-07, "loss": 0.5111, "step": 8140 }, { "epoch": 0.7510091108292007, "eval_GEN Loss": 0.4382053017616272, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8957055214723927, "eval_PRM F1 AUC": 0.7875851231011, "eval_PRM F1 Neg": 0.6530612244897959, "eval_PRM Loss": 0.3347400426864624, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.9125, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.806911051273346, "eval_runtime": 56.2939, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 8140 }, { "epoch": 0.7511013723907277, "grad_norm": 2.076645467245927, "learning_rate": 1.949194367695214e-07, "loss": 0.7322, "step": 8141 }, { "epoch": 0.7511936339522547, "grad_norm": 2.23350516503174, "learning_rate": 1.9478293943130443e-07, "loss": 0.6807, "step": 8142 }, { "epoch": 0.7512858955137816, "grad_norm": 2.0607633677419237, "learning_rate": 1.946464810800347e-07, "loss": 0.6419, "step": 8143 }, { "epoch": 0.7513781570753085, "grad_norm": 3.4250614321352955, "learning_rate": 1.945100617280784e-07, "loss": 0.7383, "step": 8144 }, { "epoch": 0.7514704186368354, "grad_norm": 2.2411310402061186, "learning_rate": 1.9437368138779778e-07, "loss": 0.7196, "step": 8145 }, { "epoch": 0.7514704186368354, "eval_GEN Loss": 0.43878212571144104, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33480730652809143, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8104267120361328, "eval_runtime": 56.3671, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8145 }, { "epoch": 0.7515626801983624, "grad_norm": 1.9855397183650916, "learning_rate": 1.9423734007155193e-07, "loss": 0.6166, "step": 8146 }, { "epoch": 0.7516549417598893, "grad_norm": 1.3654175189651319, "learning_rate": 1.9410103779169652e-07, "loss": 0.5052, "step": 8147 }, { "epoch": 0.7517472033214162, "grad_norm": 3.196947218243195, "learning_rate": 1.9396477456058314e-07, "loss": 0.697, "step": 8148 }, { "epoch": 0.7518394648829432, "grad_norm": 2.2891326997740706, "learning_rate": 1.9382855039056034e-07, "loss": 0.654, "step": 8149 }, { "epoch": 0.75193172644447, "grad_norm": 1.671297561832475, "learning_rate": 1.9369236529397296e-07, "loss": 0.5895, "step": 8150 }, { "epoch": 0.75193172644447, "eval_GEN Loss": 0.438138484954834, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33412107825279236, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8099459409713745, "eval_runtime": 56.2249, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8150 }, { "epoch": 0.752023988005997, "grad_norm": 1.5972797600702555, "learning_rate": 1.9355621928316263e-07, "loss": 0.5336, "step": 8151 }, { "epoch": 0.7521162495675239, "grad_norm": 2.0861859648284504, "learning_rate": 1.9342011237046646e-07, "loss": 0.7205, "step": 8152 }, { "epoch": 0.7522085111290508, "grad_norm": 2.3948060388795667, "learning_rate": 1.9328404456821916e-07, "loss": 0.6371, "step": 8153 }, { "epoch": 0.7523007726905778, "grad_norm": 1.9474863520137902, "learning_rate": 1.9314801588875115e-07, "loss": 0.648, "step": 8154 }, { "epoch": 0.7523930342521047, "grad_norm": 1.830823253726022, "learning_rate": 1.9301202634439e-07, "loss": 0.5667, "step": 8155 }, { "epoch": 0.7523930342521047, "eval_GEN Loss": 0.43860065937042236, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32936906814575195, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8112680315971375, "eval_runtime": 56.2991, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 8155 }, { "epoch": 0.7524852958136317, "grad_norm": 3.4474425910418596, "learning_rate": 1.928760759474587e-07, "loss": 0.9126, "step": 8156 }, { "epoch": 0.7525775573751585, "grad_norm": 1.5853072861959285, "learning_rate": 1.9274016471027758e-07, "loss": 0.6144, "step": 8157 }, { "epoch": 0.7526698189366855, "grad_norm": 1.7568088644826867, "learning_rate": 1.9260429264516315e-07, "loss": 0.519, "step": 8158 }, { "epoch": 0.7527620804982125, "grad_norm": 5.243899838599277, "learning_rate": 1.924684597644285e-07, "loss": 0.9248, "step": 8159 }, { "epoch": 0.7528543420597393, "grad_norm": 2.0224130357082766, "learning_rate": 1.9233266608038267e-07, "loss": 0.6452, "step": 8160 }, { "epoch": 0.7528543420597393, "eval_GEN Loss": 0.438906192779541, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3249794542789459, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8107572197914124, "eval_runtime": 56.3026, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 8160 }, { "epoch": 0.7529466036212663, "grad_norm": 2.494416966332092, "learning_rate": 1.9219691160533162e-07, "loss": 0.7626, "step": 8161 }, { "epoch": 0.7530388651827932, "grad_norm": 2.238419829247673, "learning_rate": 1.9206119635157798e-07, "loss": 0.6789, "step": 8162 }, { "epoch": 0.7531311267443201, "grad_norm": 1.4293740946408875, "learning_rate": 1.9192552033141985e-07, "loss": 0.619, "step": 8163 }, { "epoch": 0.7532233883058471, "grad_norm": 1.4320119516656236, "learning_rate": 1.9178988355715278e-07, "loss": 0.5286, "step": 8164 }, { "epoch": 0.753315649867374, "grad_norm": 2.2169591900059924, "learning_rate": 1.916542860410684e-07, "loss": 0.8095, "step": 8165 }, { "epoch": 0.753315649867374, "eval_GEN Loss": 0.43889397382736206, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3234950602054596, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8128004670143127, "eval_runtime": 57.1965, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8165 }, { "epoch": 0.753407911428901, "grad_norm": 1.8468418030434832, "learning_rate": 1.9151872779545486e-07, "loss": 0.6031, "step": 8166 }, { "epoch": 0.7535001729904278, "grad_norm": 1.7930127299253587, "learning_rate": 1.9138320883259614e-07, "loss": 0.7274, "step": 8167 }, { "epoch": 0.7535924345519548, "grad_norm": 2.195065698804633, "learning_rate": 1.91247729164774e-07, "loss": 0.4106, "step": 8168 }, { "epoch": 0.7536846961134818, "grad_norm": 3.915332031883535, "learning_rate": 1.9111228880426513e-07, "loss": 0.8491, "step": 8169 }, { "epoch": 0.7537769576750086, "grad_norm": 1.4910921470369811, "learning_rate": 1.9097688776334375e-07, "loss": 0.6475, "step": 8170 }, { "epoch": 0.7537769576750086, "eval_GEN Loss": 0.43803247809410095, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM Loss": 0.3234235346317291, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8128906488418579, "eval_runtime": 57.1133, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8170 }, { "epoch": 0.7538692192365356, "grad_norm": 8.033970320884695, "learning_rate": 1.9084152605427987e-07, "loss": 0.9438, "step": 8171 }, { "epoch": 0.7539614807980625, "grad_norm": 1.7472973229593507, "learning_rate": 1.907062036893402e-07, "loss": 0.6628, "step": 8172 }, { "epoch": 0.7540537423595894, "grad_norm": 2.0789904028158968, "learning_rate": 1.905709206807882e-07, "loss": 0.8565, "step": 8173 }, { "epoch": 0.7541460039211164, "grad_norm": 1.3324444577229646, "learning_rate": 1.9043567704088273e-07, "loss": 0.632, "step": 8174 }, { "epoch": 0.7542382654826433, "grad_norm": 1.7418046641663827, "learning_rate": 1.903004727818806e-07, "loss": 0.5506, "step": 8175 }, { "epoch": 0.7542382654826433, "eval_GEN Loss": 0.4385905861854553, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3232262134552002, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8116586804389954, "eval_runtime": 57.3486, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 8175 }, { "epoch": 0.7543305270441703, "grad_norm": 3.368744474042066, "learning_rate": 1.9016530791603364e-07, "loss": 0.808, "step": 8176 }, { "epoch": 0.7544227886056971, "grad_norm": 1.853650962209374, "learning_rate": 1.900301824555912e-07, "loss": 0.53, "step": 8177 }, { "epoch": 0.7545150501672241, "grad_norm": 1.6351667240723926, "learning_rate": 1.8989509641279783e-07, "loss": 0.7042, "step": 8178 }, { "epoch": 0.7546073117287511, "grad_norm": 2.323942146429441, "learning_rate": 1.8976004979989609e-07, "loss": 0.6409, "step": 8179 }, { "epoch": 0.7546995732902779, "grad_norm": 2.165945590879932, "learning_rate": 1.896250426291235e-07, "loss": 0.6778, "step": 8180 }, { "epoch": 0.7546995732902779, "eval_GEN Loss": 0.4374694228172302, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3219458758831024, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8118990659713745, "eval_runtime": 57.1781, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8180 }, { "epoch": 0.7547918348518049, "grad_norm": 1.5605508355915254, "learning_rate": 1.8949007491271486e-07, "loss": 0.6377, "step": 8181 }, { "epoch": 0.7548840964133318, "grad_norm": 1.827579655499966, "learning_rate": 1.893551466629013e-07, "loss": 0.4943, "step": 8182 }, { "epoch": 0.7549763579748587, "grad_norm": 1.5836242574208046, "learning_rate": 1.8922025789190987e-07, "loss": 0.5565, "step": 8183 }, { "epoch": 0.7550686195363856, "grad_norm": 2.4700738400367555, "learning_rate": 1.8908540861196484e-07, "loss": 0.6452, "step": 8184 }, { "epoch": 0.7551608810979126, "grad_norm": 2.705722850117915, "learning_rate": 1.8895059883528577e-07, "loss": 0.7939, "step": 8185 }, { "epoch": 0.7551608810979126, "eval_GEN Loss": 0.4376782476902008, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3206431269645691, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.814723551273346, "eval_runtime": 57.3005, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8185 }, { "epoch": 0.7552531426594395, "grad_norm": 2.4482922484362706, "learning_rate": 1.888158285740902e-07, "loss": 0.6221, "step": 8186 }, { "epoch": 0.7553454042209664, "grad_norm": 3.0645389011012094, "learning_rate": 1.8868109784059063e-07, "loss": 0.5994, "step": 8187 }, { "epoch": 0.7554376657824934, "grad_norm": 2.5908299195296007, "learning_rate": 1.8854640664699697e-07, "loss": 0.5444, "step": 8188 }, { "epoch": 0.7555299273440202, "grad_norm": 1.9003117869305253, "learning_rate": 1.8841175500551452e-07, "loss": 0.779, "step": 8189 }, { "epoch": 0.7556221889055472, "grad_norm": 3.0093003180869555, "learning_rate": 1.8827714292834641e-07, "loss": 0.9755, "step": 8190 }, { "epoch": 0.7556221889055472, "eval_GEN Loss": 0.43781667947769165, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3237549662590027, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8136418461799622, "eval_runtime": 57.0923, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8190 }, { "epoch": 0.7557144504670742, "grad_norm": 2.1606590175731495, "learning_rate": 1.8814257042769083e-07, "loss": 0.816, "step": 8191 }, { "epoch": 0.7558067120286011, "grad_norm": 2.6779679090882813, "learning_rate": 1.880080375157431e-07, "loss": 0.7089, "step": 8192 }, { "epoch": 0.755898973590128, "grad_norm": 1.5044975988519134, "learning_rate": 1.8787354420469493e-07, "loss": 0.5146, "step": 8193 }, { "epoch": 0.7559912351516549, "grad_norm": 1.5400466735987737, "learning_rate": 1.8773909050673438e-07, "loss": 0.7386, "step": 8194 }, { "epoch": 0.7560834967131819, "grad_norm": 2.0511800085918144, "learning_rate": 1.876046764340455e-07, "loss": 0.5611, "step": 8195 }, { "epoch": 0.7560834967131819, "eval_GEN Loss": 0.4371638894081116, "eval_GEN top-5 accuracy": 0.9842174484875055, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3270287811756134, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.814182698726654, "eval_runtime": 57.1499, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8195 }, { "epoch": 0.7561757582747088, "grad_norm": 1.830482752662486, "learning_rate": 1.8747030199880932e-07, "loss": 0.6229, "step": 8196 }, { "epoch": 0.7562680198362357, "grad_norm": 1.575552056570911, "learning_rate": 1.8733596721320324e-07, "loss": 0.6058, "step": 8197 }, { "epoch": 0.7563602813977627, "grad_norm": 1.484434733286002, "learning_rate": 1.872016720894005e-07, "loss": 0.5576, "step": 8198 }, { "epoch": 0.7564525429592895, "grad_norm": 1.7404912444185128, "learning_rate": 1.870674166395714e-07, "loss": 0.5417, "step": 8199 }, { "epoch": 0.7565448045208165, "grad_norm": 2.219276109078023, "learning_rate": 1.8693320087588224e-07, "loss": 0.7904, "step": 8200 }, { "epoch": 0.7565448045208165, "eval_GEN Loss": 0.43733733892440796, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3274691104888916, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8154447078704834, "eval_runtime": 57.2948, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8200 }, { "epoch": 0.7566370660823435, "grad_norm": 1.990742240863556, "learning_rate": 1.8679902481049617e-07, "loss": 0.6803, "step": 8201 }, { "epoch": 0.7567293276438704, "grad_norm": 2.2082003963052057, "learning_rate": 1.8666488845557204e-07, "loss": 0.6498, "step": 8202 }, { "epoch": 0.7568215892053973, "grad_norm": 2.2948319224915252, "learning_rate": 1.8653079182326568e-07, "loss": 0.7013, "step": 8203 }, { "epoch": 0.7569138507669242, "grad_norm": 2.8825580244406157, "learning_rate": 1.863967349257291e-07, "loss": 0.8275, "step": 8204 }, { "epoch": 0.7570061123284512, "grad_norm": 2.8470844173152567, "learning_rate": 1.8626271777511091e-07, "loss": 0.8384, "step": 8205 }, { "epoch": 0.7570061123284512, "eval_GEN Loss": 0.4373073875904083, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3294365406036377, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8153846263885498, "eval_runtime": 57.1783, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8205 }, { "epoch": 0.7570983738899781, "grad_norm": 2.2569978453999244, "learning_rate": 1.861287403835557e-07, "loss": 0.685, "step": 8206 }, { "epoch": 0.757190635451505, "grad_norm": 1.4528624641898435, "learning_rate": 1.8599480276320484e-07, "loss": 0.5781, "step": 8207 }, { "epoch": 0.757282897013032, "grad_norm": 1.9613279830749017, "learning_rate": 1.8586090492619614e-07, "loss": 0.6101, "step": 8208 }, { "epoch": 0.7573751585745588, "grad_norm": 2.148904098235707, "learning_rate": 1.8572704688466322e-07, "loss": 0.6492, "step": 8209 }, { "epoch": 0.7574674201360858, "grad_norm": 2.2957582713385913, "learning_rate": 1.8559322865073676e-07, "loss": 0.7122, "step": 8210 }, { "epoch": 0.7574674201360858, "eval_GEN Loss": 0.43786996603012085, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33256739377975464, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8177884817123413, "eval_runtime": 57.1288, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8210 }, { "epoch": 0.7575596816976128, "grad_norm": 1.884201162019472, "learning_rate": 1.8545945023654352e-07, "loss": 0.5853, "step": 8211 }, { "epoch": 0.7576519432591396, "grad_norm": 2.81984339813274, "learning_rate": 1.8532571165420697e-07, "loss": 0.6783, "step": 8212 }, { "epoch": 0.7577442048206666, "grad_norm": 1.8838870983932998, "learning_rate": 1.8519201291584611e-07, "loss": 0.6529, "step": 8213 }, { "epoch": 0.7578364663821935, "grad_norm": 1.5530182917049125, "learning_rate": 1.850583540335777e-07, "loss": 0.6243, "step": 8214 }, { "epoch": 0.7579287279437205, "grad_norm": 1.572203527105495, "learning_rate": 1.8492473501951354e-07, "loss": 0.5611, "step": 8215 }, { "epoch": 0.7579287279437205, "eval_GEN Loss": 0.43775320053100586, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33665090799331665, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8170071840286255, "eval_runtime": 57.4703, "eval_samples_per_second": 1.131, "eval_steps_per_second": 0.087, "step": 8215 }, { "epoch": 0.7580209895052473, "grad_norm": 2.286631626256343, "learning_rate": 1.8479115588576277e-07, "loss": 0.6011, "step": 8216 }, { "epoch": 0.7581132510667743, "grad_norm": 2.4478322244554764, "learning_rate": 1.8465761664443013e-07, "loss": 0.7873, "step": 8217 }, { "epoch": 0.7582055126283013, "grad_norm": 1.903439605557677, "learning_rate": 1.845241173076174e-07, "loss": 0.7388, "step": 8218 }, { "epoch": 0.7582977741898281, "grad_norm": 2.041344841872222, "learning_rate": 1.8439065788742265e-07, "loss": 0.7076, "step": 8219 }, { "epoch": 0.7583900357513551, "grad_norm": 2.891270946057163, "learning_rate": 1.8425723839593983e-07, "loss": 0.7134, "step": 8220 }, { "epoch": 0.7583900357513551, "eval_GEN Loss": 0.4384649395942688, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33613020181655884, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8136118054389954, "eval_runtime": 57.1885, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8220 }, { "epoch": 0.758482297312882, "grad_norm": 3.1648237209455163, "learning_rate": 1.841238588452598e-07, "loss": 0.948, "step": 8221 }, { "epoch": 0.7585745588744089, "grad_norm": 1.7815661906254787, "learning_rate": 1.839905192474696e-07, "loss": 0.724, "step": 8222 }, { "epoch": 0.7586668204359359, "grad_norm": 2.771119683016551, "learning_rate": 1.8385721961465298e-07, "loss": 0.8302, "step": 8223 }, { "epoch": 0.7587590819974628, "grad_norm": 1.5625814787470726, "learning_rate": 1.8372395995888907e-07, "loss": 0.6038, "step": 8224 }, { "epoch": 0.7588513435589898, "grad_norm": 1.7086084281182554, "learning_rate": 1.8359074029225488e-07, "loss": 0.7567, "step": 8225 }, { "epoch": 0.7588513435589898, "eval_GEN Loss": 0.43825268745422363, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3394263684749603, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8124699592590332, "eval_runtime": 57.0153, "eval_samples_per_second": 1.14, "eval_steps_per_second": 0.088, "step": 8225 }, { "epoch": 0.7589436051205166, "grad_norm": 1.5802578950042516, "learning_rate": 1.8345756062682235e-07, "loss": 0.6181, "step": 8226 }, { "epoch": 0.7590358666820436, "grad_norm": 1.4094208330255162, "learning_rate": 1.833244209746609e-07, "loss": 0.4553, "step": 8227 }, { "epoch": 0.7591281282435706, "grad_norm": 2.483271576075489, "learning_rate": 1.8319132134783542e-07, "loss": 0.9047, "step": 8228 }, { "epoch": 0.7592203898050974, "grad_norm": 2.6079528145313624, "learning_rate": 1.8305826175840785e-07, "loss": 0.6971, "step": 8229 }, { "epoch": 0.7593126513666244, "grad_norm": 1.9136803225857668, "learning_rate": 1.829252422184362e-07, "loss": 0.6827, "step": 8230 }, { "epoch": 0.7593126513666244, "eval_GEN Loss": 0.43885141611099243, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3431844115257263, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8128004670143127, "eval_runtime": 57.0821, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8230 }, { "epoch": 0.7594049129281513, "grad_norm": 1.8948853318288048, "learning_rate": 1.8279226273997495e-07, "loss": 0.6771, "step": 8231 }, { "epoch": 0.7594971744896782, "grad_norm": 2.0779454408170666, "learning_rate": 1.8265932333507507e-07, "loss": 0.6318, "step": 8232 }, { "epoch": 0.7595894360512052, "grad_norm": 1.3407990519749158, "learning_rate": 1.825264240157834e-07, "loss": 0.3697, "step": 8233 }, { "epoch": 0.7596816976127321, "grad_norm": 2.2254668422340016, "learning_rate": 1.8239356479414383e-07, "loss": 0.652, "step": 8234 }, { "epoch": 0.759773959174259, "grad_norm": 2.264349906447949, "learning_rate": 1.8226074568219572e-07, "loss": 0.5831, "step": 8235 }, { "epoch": 0.759773959174259, "eval_GEN Loss": 0.4385720491409302, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33926352858543396, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8097355961799622, "eval_runtime": 57.064, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8235 }, { "epoch": 0.7598662207357859, "grad_norm": 1.4866265842667665, "learning_rate": 1.8212796669197606e-07, "loss": 0.5652, "step": 8236 }, { "epoch": 0.7599584822973129, "grad_norm": 1.541014514551838, "learning_rate": 1.81995227835517e-07, "loss": 0.6142, "step": 8237 }, { "epoch": 0.7600507438588399, "grad_norm": 2.544310617066871, "learning_rate": 1.818625291248477e-07, "loss": 0.8006, "step": 8238 }, { "epoch": 0.7601430054203667, "grad_norm": 1.7078983021879433, "learning_rate": 1.8172987057199347e-07, "loss": 0.5723, "step": 8239 }, { "epoch": 0.7602352669818937, "grad_norm": 2.136765879874219, "learning_rate": 1.8159725218897633e-07, "loss": 0.6226, "step": 8240 }, { "epoch": 0.7602352669818937, "eval_GEN Loss": 0.4385659396648407, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3363415598869324, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.807812511920929, "eval_runtime": 57.3201, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8240 }, { "epoch": 0.7603275285434206, "grad_norm": 2.2352305370219714, "learning_rate": 1.814646739878139e-07, "loss": 0.8419, "step": 8241 }, { "epoch": 0.7604197901049475, "grad_norm": 2.3832863516149656, "learning_rate": 1.8133213598052083e-07, "loss": 0.5329, "step": 8242 }, { "epoch": 0.7605120516664745, "grad_norm": 1.8954006314126364, "learning_rate": 1.811996381791082e-07, "loss": 0.5403, "step": 8243 }, { "epoch": 0.7606043132280014, "grad_norm": 3.463722040012396, "learning_rate": 1.8106718059558262e-07, "loss": 0.741, "step": 8244 }, { "epoch": 0.7606965747895283, "grad_norm": 3.0961446296268917, "learning_rate": 1.8093476324194814e-07, "loss": 0.9304, "step": 8245 }, { "epoch": 0.7606965747895283, "eval_GEN Loss": 0.43846753239631653, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33185768127441406, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8073017001152039, "eval_runtime": 57.3557, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 8245 }, { "epoch": 0.7607888363510552, "grad_norm": 1.6849284375726148, "learning_rate": 1.8080238613020406e-07, "loss": 0.6292, "step": 8246 }, { "epoch": 0.7608810979125822, "grad_norm": 1.4149034904358442, "learning_rate": 1.8067004927234717e-07, "loss": 0.4749, "step": 8247 }, { "epoch": 0.760973359474109, "grad_norm": 1.9034093201789444, "learning_rate": 1.805377526803697e-07, "loss": 0.7024, "step": 8248 }, { "epoch": 0.761065621035636, "grad_norm": 1.9956541828146832, "learning_rate": 1.8040549636626068e-07, "loss": 0.7499, "step": 8249 }, { "epoch": 0.761157882597163, "grad_norm": 2.3071420881629234, "learning_rate": 1.802732803420054e-07, "loss": 0.7609, "step": 8250 }, { "epoch": 0.761157882597163, "eval_GEN Loss": 0.43767455220222473, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32756683230400085, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8034254908561707, "eval_runtime": 57.234, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8250 }, { "epoch": 0.7612501441586899, "grad_norm": 1.821724255001341, "learning_rate": 1.8014110461958563e-07, "loss": 0.6312, "step": 8251 }, { "epoch": 0.7613424057202168, "grad_norm": 1.9333450081787655, "learning_rate": 1.8000896921097897e-07, "loss": 0.4861, "step": 8252 }, { "epoch": 0.7614346672817437, "grad_norm": 2.233090262614207, "learning_rate": 1.7987687412815993e-07, "loss": 0.5331, "step": 8253 }, { "epoch": 0.7615269288432707, "grad_norm": 1.976959279189809, "learning_rate": 1.7974481938309945e-07, "loss": 0.6455, "step": 8254 }, { "epoch": 0.7616191904047976, "grad_norm": 2.1688407358944657, "learning_rate": 1.7961280498776407e-07, "loss": 0.6123, "step": 8255 }, { "epoch": 0.7616191904047976, "eval_GEN Loss": 0.43802475929260254, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3238299787044525, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8028244972229004, "eval_runtime": 57.2428, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8255 }, { "epoch": 0.7617114519663245, "grad_norm": 1.9954839365828536, "learning_rate": 1.7948083095411732e-07, "loss": 0.5842, "step": 8256 }, { "epoch": 0.7618037135278515, "grad_norm": 2.3345562264838877, "learning_rate": 1.793488972941189e-07, "loss": 0.6911, "step": 8257 }, { "epoch": 0.7618959750893783, "grad_norm": 1.5903935306849335, "learning_rate": 1.7921700401972512e-07, "loss": 0.5255, "step": 8258 }, { "epoch": 0.7619882366509053, "grad_norm": 1.5003652577376045, "learning_rate": 1.7908515114288788e-07, "loss": 0.5228, "step": 8259 }, { "epoch": 0.7620804982124323, "grad_norm": 1.86462840780629, "learning_rate": 1.789533386755562e-07, "loss": 0.7521, "step": 8260 }, { "epoch": 0.7620804982124323, "eval_GEN Loss": 0.43785980343818665, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3219125270843506, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7980769276618958, "eval_runtime": 57.1359, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8260 }, { "epoch": 0.7621727597739592, "grad_norm": 2.1960856120932624, "learning_rate": 1.7882156662967497e-07, "loss": 0.6195, "step": 8261 }, { "epoch": 0.7622650213354861, "grad_norm": 2.642364438225876, "learning_rate": 1.786898350171859e-07, "loss": 0.6844, "step": 8262 }, { "epoch": 0.762357282897013, "grad_norm": 1.4632291931302062, "learning_rate": 1.7855814385002625e-07, "loss": 0.6735, "step": 8263 }, { "epoch": 0.76244954445854, "grad_norm": 1.7104199335211858, "learning_rate": 1.7842649314013035e-07, "loss": 0.6198, "step": 8264 }, { "epoch": 0.7625418060200669, "grad_norm": 1.7806305777236608, "learning_rate": 1.7829488289942873e-07, "loss": 0.7442, "step": 8265 }, { "epoch": 0.7625418060200669, "eval_GEN Loss": 0.438467800617218, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32416972517967224, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7995492815971375, "eval_runtime": 57.1028, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8265 }, { "epoch": 0.7626340675815938, "grad_norm": 2.291011574498238, "learning_rate": 1.7816331313984782e-07, "loss": 0.7297, "step": 8266 }, { "epoch": 0.7627263291431208, "grad_norm": 2.0909503836661223, "learning_rate": 1.7803178387331074e-07, "loss": 0.5498, "step": 8267 }, { "epoch": 0.7628185907046476, "grad_norm": 1.4003997743937395, "learning_rate": 1.7790029511173694e-07, "loss": 0.5343, "step": 8268 }, { "epoch": 0.7629108522661746, "grad_norm": 2.218181244532342, "learning_rate": 1.7776884686704236e-07, "loss": 0.683, "step": 8269 }, { "epoch": 0.7630031138277016, "grad_norm": 1.9700208719765857, "learning_rate": 1.776374391511384e-07, "loss": 0.7764, "step": 8270 }, { "epoch": 0.7630031138277016, "eval_GEN Loss": 0.43810564279556274, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3245636224746704, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7960035800933838, "eval_runtime": 57.3638, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 8270 }, { "epoch": 0.7630953753892284, "grad_norm": 1.5076569400462998, "learning_rate": 1.775060719759343e-07, "loss": 0.5122, "step": 8271 }, { "epoch": 0.7631876369507554, "grad_norm": 1.9779932706778272, "learning_rate": 1.7737474535333414e-07, "loss": 0.7084, "step": 8272 }, { "epoch": 0.7632798985122823, "grad_norm": 1.5579212637178808, "learning_rate": 1.7724345929523928e-07, "loss": 0.5244, "step": 8273 }, { "epoch": 0.7633721600738093, "grad_norm": 2.1808486530513873, "learning_rate": 1.7711221381354657e-07, "loss": 0.4962, "step": 8274 }, { "epoch": 0.7634644216353362, "grad_norm": 3.02719055087357, "learning_rate": 1.7698100892015033e-07, "loss": 0.8914, "step": 8275 }, { "epoch": 0.7634644216353362, "eval_GEN Loss": 0.43785977363586426, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32250526547431946, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7964242696762085, "eval_runtime": 57.2249, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8275 }, { "epoch": 0.7635566831968631, "grad_norm": 1.921213946046325, "learning_rate": 1.7684984462694019e-07, "loss": 0.6641, "step": 8276 }, { "epoch": 0.7636489447583901, "grad_norm": 1.6748521459232537, "learning_rate": 1.7671872094580268e-07, "loss": 0.5046, "step": 8277 }, { "epoch": 0.7637412063199169, "grad_norm": 1.6660397805500087, "learning_rate": 1.7658763788862e-07, "loss": 0.5397, "step": 8278 }, { "epoch": 0.7638334678814439, "grad_norm": 1.7141744767879774, "learning_rate": 1.7645659546727146e-07, "loss": 0.6602, "step": 8279 }, { "epoch": 0.7639257294429708, "grad_norm": 1.8907723990300103, "learning_rate": 1.763255936936325e-07, "loss": 0.5191, "step": 8280 }, { "epoch": 0.7639257294429708, "eval_GEN Loss": 0.43798375129699707, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32135316729545593, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7966346144676208, "eval_runtime": 57.2126, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8280 }, { "epoch": 0.7640179910044977, "grad_norm": 3.2580389591975285, "learning_rate": 1.7619463257957394e-07, "loss": 0.6454, "step": 8281 }, { "epoch": 0.7641102525660247, "grad_norm": 2.0359536438614985, "learning_rate": 1.7606371213696475e-07, "loss": 0.68, "step": 8282 }, { "epoch": 0.7642025141275516, "grad_norm": 2.129728830177697, "learning_rate": 1.759328323776683e-07, "loss": 0.5765, "step": 8283 }, { "epoch": 0.7642947756890786, "grad_norm": 1.6590959039815458, "learning_rate": 1.758019933135456e-07, "loss": 0.7585, "step": 8284 }, { "epoch": 0.7643870372506054, "grad_norm": 2.1108773646124277, "learning_rate": 1.7567119495645303e-07, "loss": 0.596, "step": 8285 }, { "epoch": 0.7643870372506054, "eval_GEN Loss": 0.43841058015823364, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32289302349090576, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7970853447914124, "eval_runtime": 57.1234, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8285 }, { "epoch": 0.7644792988121324, "grad_norm": 1.6884251048709182, "learning_rate": 1.7554043731824435e-07, "loss": 0.5846, "step": 8286 }, { "epoch": 0.7645715603736594, "grad_norm": 2.6149975975123656, "learning_rate": 1.7540972041076855e-07, "loss": 0.7654, "step": 8287 }, { "epoch": 0.7646638219351862, "grad_norm": 2.7575079065921346, "learning_rate": 1.7527904424587147e-07, "loss": 0.6285, "step": 8288 }, { "epoch": 0.7647560834967132, "grad_norm": 1.5927801074916808, "learning_rate": 1.7514840883539553e-07, "loss": 0.574, "step": 8289 }, { "epoch": 0.7648483450582401, "grad_norm": 2.531706917702764, "learning_rate": 1.7501781419117862e-07, "loss": 0.684, "step": 8290 }, { "epoch": 0.7648483450582401, "eval_GEN Loss": 0.4375576376914978, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3262816369533539, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7969350814819336, "eval_runtime": 57.3825, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 8290 }, { "epoch": 0.764940606619767, "grad_norm": 2.523066169523741, "learning_rate": 1.7488726032505592e-07, "loss": 0.6462, "step": 8291 }, { "epoch": 0.765032868181294, "grad_norm": 2.049705113808892, "learning_rate": 1.7475674724885774e-07, "loss": 0.5563, "step": 8292 }, { "epoch": 0.7651251297428209, "grad_norm": 3.7666279719419586, "learning_rate": 1.7462627497441223e-07, "loss": 0.741, "step": 8293 }, { "epoch": 0.7652173913043478, "grad_norm": 1.2070141574497335, "learning_rate": 1.7449584351354235e-07, "loss": 0.5176, "step": 8294 }, { "epoch": 0.7653096528658747, "grad_norm": 2.0720065202046904, "learning_rate": 1.7436545287806833e-07, "loss": 0.6577, "step": 8295 }, { "epoch": 0.7653096528658747, "eval_GEN Loss": 0.4376376271247864, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33136820793151855, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8005709052085876, "eval_runtime": 57.0695, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8295 }, { "epoch": 0.7654019144274017, "grad_norm": 2.534985333684985, "learning_rate": 1.7423510307980617e-07, "loss": 0.614, "step": 8296 }, { "epoch": 0.7654941759889287, "grad_norm": 1.7155556919402226, "learning_rate": 1.7410479413056876e-07, "loss": 0.6143, "step": 8297 }, { "epoch": 0.7655864375504555, "grad_norm": 1.9054694146289868, "learning_rate": 1.7397452604216437e-07, "loss": 0.6292, "step": 8298 }, { "epoch": 0.7656786991119825, "grad_norm": 1.2697254504909397, "learning_rate": 1.7384429882639838e-07, "loss": 0.5893, "step": 8299 }, { "epoch": 0.7657709606735094, "grad_norm": 3.9375745056563884, "learning_rate": 1.7371411249507239e-07, "loss": 0.6973, "step": 8300 }, { "epoch": 0.7657709606735094, "eval_GEN Loss": 0.4385286271572113, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3311026692390442, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7992488145828247, "eval_runtime": 57.2947, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8300 }, { "epoch": 0.7658632222350363, "grad_norm": 2.451367622567154, "learning_rate": 1.7358396705998363e-07, "loss": 0.7062, "step": 8301 }, { "epoch": 0.7659554837965633, "grad_norm": 2.153462114573505, "learning_rate": 1.7345386253292628e-07, "loss": 0.7774, "step": 8302 }, { "epoch": 0.7660477453580902, "grad_norm": 1.5213113925819575, "learning_rate": 1.733237989256907e-07, "loss": 0.5484, "step": 8303 }, { "epoch": 0.7661400069196171, "grad_norm": 2.319329368478793, "learning_rate": 1.7319377625006357e-07, "loss": 0.6809, "step": 8304 }, { "epoch": 0.766232268481144, "grad_norm": 2.03446723011652, "learning_rate": 1.730637945178274e-07, "loss": 0.6864, "step": 8305 }, { "epoch": 0.766232268481144, "eval_GEN Loss": 0.43720242381095886, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33146587014198303, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7989482879638672, "eval_runtime": 57.2952, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8305 }, { "epoch": 0.766324530042671, "grad_norm": 2.2360873467646707, "learning_rate": 1.7293385374076163e-07, "loss": 0.677, "step": 8306 }, { "epoch": 0.766416791604198, "grad_norm": 1.640909979412779, "learning_rate": 1.7280395393064148e-07, "loss": 0.7212, "step": 8307 }, { "epoch": 0.7665090531657248, "grad_norm": 1.707021713677753, "learning_rate": 1.7267409509923902e-07, "loss": 0.6332, "step": 8308 }, { "epoch": 0.7666013147272518, "grad_norm": 2.184972177288169, "learning_rate": 1.7254427725832182e-07, "loss": 0.7477, "step": 8309 }, { "epoch": 0.7666935762887787, "grad_norm": 1.9613813994730138, "learning_rate": 1.7241450041965444e-07, "loss": 0.5088, "step": 8310 }, { "epoch": 0.7666935762887787, "eval_GEN Loss": 0.4370870590209961, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33012357354164124, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7983773946762085, "eval_runtime": 56.2095, "eval_samples_per_second": 1.156, "eval_steps_per_second": 0.089, "step": 8310 }, { "epoch": 0.7667858378503056, "grad_norm": 1.6294882681153042, "learning_rate": 1.7228476459499737e-07, "loss": 0.5669, "step": 8311 }, { "epoch": 0.7668780994118325, "grad_norm": 1.7308193507597405, "learning_rate": 1.7215506979610775e-07, "loss": 0.5513, "step": 8312 }, { "epoch": 0.7669703609733595, "grad_norm": 1.7037928557868551, "learning_rate": 1.7202541603473823e-07, "loss": 0.5679, "step": 8313 }, { "epoch": 0.7670626225348864, "grad_norm": 1.800807772559463, "learning_rate": 1.7189580332263852e-07, "loss": 0.574, "step": 8314 }, { "epoch": 0.7671548840964133, "grad_norm": 2.087675601421281, "learning_rate": 1.7176623167155453e-07, "loss": 0.4702, "step": 8315 }, { "epoch": 0.7671548840964133, "eval_GEN Loss": 0.43705663084983826, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32644426822662354, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7972355484962463, "eval_runtime": 56.394, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8315 }, { "epoch": 0.7672471456579403, "grad_norm": 2.0720751570272395, "learning_rate": 1.7163670109322788e-07, "loss": 0.6726, "step": 8316 }, { "epoch": 0.7673394072194671, "grad_norm": 2.1112560810941314, "learning_rate": 1.7150721159939688e-07, "loss": 0.637, "step": 8317 }, { "epoch": 0.7674316687809941, "grad_norm": 1.7357405093574738, "learning_rate": 1.7137776320179628e-07, "loss": 0.6472, "step": 8318 }, { "epoch": 0.7675239303425211, "grad_norm": 2.170909751044219, "learning_rate": 1.7124835591215688e-07, "loss": 0.5077, "step": 8319 }, { "epoch": 0.767616191904048, "grad_norm": 1.8845324058657804, "learning_rate": 1.711189897422054e-07, "loss": 0.6107, "step": 8320 }, { "epoch": 0.767616191904048, "eval_GEN Loss": 0.4362417459487915, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32475900650024414, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8017127513885498, "eval_runtime": 56.3864, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8320 }, { "epoch": 0.7677084534655749, "grad_norm": 1.870535957332796, "learning_rate": 1.7098966470366581e-07, "loss": 0.5703, "step": 8321 }, { "epoch": 0.7678007150271018, "grad_norm": 2.1470771644709643, "learning_rate": 1.708603808082572e-07, "loss": 0.5576, "step": 8322 }, { "epoch": 0.7678929765886288, "grad_norm": 1.4219593292717811, "learning_rate": 1.7073113806769598e-07, "loss": 0.5006, "step": 8323 }, { "epoch": 0.7679852381501557, "grad_norm": 2.282387400868935, "learning_rate": 1.706019364936938e-07, "loss": 0.7921, "step": 8324 }, { "epoch": 0.7680774997116826, "grad_norm": 1.7554333353213587, "learning_rate": 1.7047277609795944e-07, "loss": 0.627, "step": 8325 }, { "epoch": 0.7680774997116826, "eval_GEN Loss": 0.43732336163520813, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32204967737197876, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8031851053237915, "eval_runtime": 56.4892, "eval_samples_per_second": 1.151, "eval_steps_per_second": 0.089, "step": 8325 }, { "epoch": 0.7681697612732096, "grad_norm": 1.5384279897725803, "learning_rate": 1.703436568921977e-07, "loss": 0.5447, "step": 8326 }, { "epoch": 0.7682620228347364, "grad_norm": 3.280690874099196, "learning_rate": 1.7021457888810899e-07, "loss": 0.7083, "step": 8327 }, { "epoch": 0.7683542843962634, "grad_norm": 1.6220413781801875, "learning_rate": 1.7008554209739138e-07, "loss": 0.5266, "step": 8328 }, { "epoch": 0.7684465459577904, "grad_norm": 1.6431476463025578, "learning_rate": 1.6995654653173786e-07, "loss": 0.5451, "step": 8329 }, { "epoch": 0.7685388075193172, "grad_norm": 1.6839927832947659, "learning_rate": 1.6982759220283848e-07, "loss": 0.6133, "step": 8330 }, { "epoch": 0.7685388075193172, "eval_GEN Loss": 0.4367929697036743, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3219328224658966, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8060697317123413, "eval_runtime": 57.3969, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 8330 }, { "epoch": 0.7686310690808442, "grad_norm": 2.275767607172405, "learning_rate": 1.6969867912237875e-07, "loss": 0.664, "step": 8331 }, { "epoch": 0.7687233306423711, "grad_norm": 1.4429000670947283, "learning_rate": 1.695698073020418e-07, "loss": 0.555, "step": 8332 }, { "epoch": 0.7688155922038981, "grad_norm": 2.3238769005877624, "learning_rate": 1.694409767535056e-07, "loss": 0.5864, "step": 8333 }, { "epoch": 0.768907853765425, "grad_norm": 2.244473418439422, "learning_rate": 1.6931218748844527e-07, "loss": 0.8236, "step": 8334 }, { "epoch": 0.7690001153269519, "grad_norm": 2.719566919628414, "learning_rate": 1.6918343951853162e-07, "loss": 0.6925, "step": 8335 }, { "epoch": 0.7690001153269519, "eval_GEN Loss": 0.43657976388931274, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3214704394340515, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8061298131942749, "eval_runtime": 56.2595, "eval_samples_per_second": 1.155, "eval_steps_per_second": 0.089, "step": 8335 }, { "epoch": 0.7690923768884789, "grad_norm": 3.0241117935590003, "learning_rate": 1.6905473285543213e-07, "loss": 0.6244, "step": 8336 }, { "epoch": 0.7691846384500057, "grad_norm": 2.910706588146261, "learning_rate": 1.6892606751081065e-07, "loss": 0.8693, "step": 8337 }, { "epoch": 0.7692769000115327, "grad_norm": 2.219825575192377, "learning_rate": 1.6879744349632639e-07, "loss": 0.597, "step": 8338 }, { "epoch": 0.7693691615730597, "grad_norm": 1.846161085710625, "learning_rate": 1.686688608236362e-07, "loss": 0.4265, "step": 8339 }, { "epoch": 0.7694614231345865, "grad_norm": 1.6455526191437773, "learning_rate": 1.68540319504392e-07, "loss": 0.4324, "step": 8340 }, { "epoch": 0.7694614231345865, "eval_GEN Loss": 0.4368555247783661, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.322213739156723, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.810546875, "eval_runtime": 56.1859, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 8340 }, { "epoch": 0.7695536846961135, "grad_norm": 2.648950878280339, "learning_rate": 1.6841181955024273e-07, "loss": 0.608, "step": 8341 }, { "epoch": 0.7696459462576404, "grad_norm": 1.5826036840823006, "learning_rate": 1.6828336097283265e-07, "loss": 0.4892, "step": 8342 }, { "epoch": 0.7697382078191674, "grad_norm": 1.398968822676665, "learning_rate": 1.6815494378380362e-07, "loss": 0.4792, "step": 8343 }, { "epoch": 0.7698304693806942, "grad_norm": 1.7652701011123493, "learning_rate": 1.6802656799479254e-07, "loss": 0.6713, "step": 8344 }, { "epoch": 0.7699227309422212, "grad_norm": 2.1731594772090803, "learning_rate": 1.6789823361743314e-07, "loss": 0.7616, "step": 8345 }, { "epoch": 0.7699227309422212, "eval_GEN Loss": 0.4365482032299042, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3192671537399292, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8060095906257629, "eval_runtime": 56.0617, "eval_samples_per_second": 1.159, "eval_steps_per_second": 0.089, "step": 8345 }, { "epoch": 0.7700149925037482, "grad_norm": 2.1022556469438376, "learning_rate": 1.6776994066335525e-07, "loss": 0.6401, "step": 8346 }, { "epoch": 0.770107254065275, "grad_norm": 2.029000468908562, "learning_rate": 1.6764168914418525e-07, "loss": 0.5976, "step": 8347 }, { "epoch": 0.770199515626802, "grad_norm": 1.5181528260333752, "learning_rate": 1.6751347907154505e-07, "loss": 0.5589, "step": 8348 }, { "epoch": 0.7702917771883289, "grad_norm": 2.2228278566981956, "learning_rate": 1.6738531045705352e-07, "loss": 0.5058, "step": 8349 }, { "epoch": 0.7703840387498558, "grad_norm": 1.7034511406522683, "learning_rate": 1.6725718331232564e-07, "loss": 0.5903, "step": 8350 }, { "epoch": 0.7703840387498558, "eval_GEN Loss": 0.43636012077331543, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM Loss": 0.3203793168067932, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.8072415590286255, "eval_runtime": 56.3808, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8350 }, { "epoch": 0.7704763003113828, "grad_norm": 1.632665546663161, "learning_rate": 1.6712909764897215e-07, "loss": 0.6977, "step": 8351 }, { "epoch": 0.7705685618729097, "grad_norm": 1.982626210912946, "learning_rate": 1.6700105347860046e-07, "loss": 0.6542, "step": 8352 }, { "epoch": 0.7706608234344366, "grad_norm": 2.9119023476571306, "learning_rate": 1.668730508128142e-07, "loss": 0.8019, "step": 8353 }, { "epoch": 0.7707530849959635, "grad_norm": 2.1527651541270507, "learning_rate": 1.667450896632134e-07, "loss": 0.6951, "step": 8354 }, { "epoch": 0.7708453465574905, "grad_norm": 1.378400074754103, "learning_rate": 1.666171700413937e-07, "loss": 0.6934, "step": 8355 }, { "epoch": 0.7708453465574905, "eval_GEN Loss": 0.4366629719734192, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32200103998184204, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.807421863079071, "eval_runtime": 57.2637, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 8355 }, { "epoch": 0.7709376081190175, "grad_norm": 2.823441276217777, "learning_rate": 1.6648929195894752e-07, "loss": 0.7409, "step": 8356 }, { "epoch": 0.7710298696805443, "grad_norm": 1.7250256966745947, "learning_rate": 1.6636145542746346e-07, "loss": 0.6483, "step": 8357 }, { "epoch": 0.7711221312420713, "grad_norm": 2.338909810861704, "learning_rate": 1.6623366045852637e-07, "loss": 0.6899, "step": 8358 }, { "epoch": 0.7712143928035982, "grad_norm": 1.8442653032938252, "learning_rate": 1.6610590706371694e-07, "loss": 0.6754, "step": 8359 }, { "epoch": 0.7713066543651251, "grad_norm": 1.8907550850965666, "learning_rate": 1.6597819525461244e-07, "loss": 0.7978, "step": 8360 }, { "epoch": 0.7713066543651251, "eval_GEN Loss": 0.43636590242385864, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3241529166698456, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8064002394676208, "eval_runtime": 57.3246, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8360 }, { "epoch": 0.7713989159266521, "grad_norm": 1.5793724762861654, "learning_rate": 1.6585052504278664e-07, "loss": 0.6265, "step": 8361 }, { "epoch": 0.771491177488179, "grad_norm": 2.087958438419085, "learning_rate": 1.6572289643980873e-07, "loss": 0.7591, "step": 8362 }, { "epoch": 0.7715834390497059, "grad_norm": 2.0497378358065563, "learning_rate": 1.6559530945724488e-07, "loss": 0.555, "step": 8363 }, { "epoch": 0.7716757006112328, "grad_norm": 2.3256796400582527, "learning_rate": 1.6546776410665725e-07, "loss": 0.7177, "step": 8364 }, { "epoch": 0.7717679621727598, "grad_norm": 2.2482047375774874, "learning_rate": 1.6534026039960432e-07, "loss": 0.7282, "step": 8365 }, { "epoch": 0.7717679621727598, "eval_GEN Loss": 0.4359719753265381, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32440218329429626, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8025540709495544, "eval_runtime": 56.3484, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 8365 }, { "epoch": 0.7718602237342868, "grad_norm": 1.563584061329305, "learning_rate": 1.652127983476403e-07, "loss": 0.4654, "step": 8366 }, { "epoch": 0.7719524852958136, "grad_norm": 2.101999722687526, "learning_rate": 1.650853779623162e-07, "loss": 0.6687, "step": 8367 }, { "epoch": 0.7720447468573406, "grad_norm": 3.310132225936115, "learning_rate": 1.6495799925517911e-07, "loss": 0.6755, "step": 8368 }, { "epoch": 0.7721370084188675, "grad_norm": 1.7662118972156842, "learning_rate": 1.6483066223777239e-07, "loss": 0.6065, "step": 8369 }, { "epoch": 0.7722292699803944, "grad_norm": 2.6422076421316345, "learning_rate": 1.6470336692163518e-07, "loss": 0.7107, "step": 8370 }, { "epoch": 0.7722292699803944, "eval_GEN Loss": 0.4365704655647278, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3253695070743561, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8012920618057251, "eval_runtime": 56.3925, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8370 }, { "epoch": 0.7723215315419214, "grad_norm": 2.412151994403999, "learning_rate": 1.645761133183034e-07, "loss": 0.6442, "step": 8371 }, { "epoch": 0.7724137931034483, "grad_norm": 1.7765886718513895, "learning_rate": 1.6444890143930914e-07, "loss": 0.6753, "step": 8372 }, { "epoch": 0.7725060546649752, "grad_norm": 2.130094876698409, "learning_rate": 1.643217312961802e-07, "loss": 0.5409, "step": 8373 }, { "epoch": 0.7725983162265021, "grad_norm": 1.86187552346424, "learning_rate": 1.6419460290044106e-07, "loss": 0.5445, "step": 8374 }, { "epoch": 0.7726905777880291, "grad_norm": 1.9406735340389736, "learning_rate": 1.6406751626361225e-07, "loss": 0.5743, "step": 8375 }, { "epoch": 0.7726905777880291, "eval_GEN Loss": 0.43632611632347107, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32797861099243164, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.8006610870361328, "eval_runtime": 56.1907, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 8375 }, { "epoch": 0.7727828393495559, "grad_norm": 2.0153644614605932, "learning_rate": 1.6394047139721092e-07, "loss": 0.654, "step": 8376 }, { "epoch": 0.7728751009110829, "grad_norm": 2.645652324405637, "learning_rate": 1.6381346831274938e-07, "loss": 0.6343, "step": 8377 }, { "epoch": 0.7729673624726099, "grad_norm": 2.2872392688255547, "learning_rate": 1.6368650702173763e-07, "loss": 0.6506, "step": 8378 }, { "epoch": 0.7730596240341367, "grad_norm": 2.471728452312835, "learning_rate": 1.6355958753568052e-07, "loss": 0.6662, "step": 8379 }, { "epoch": 0.7731518855956637, "grad_norm": 1.6413580935229666, "learning_rate": 1.6343270986608013e-07, "loss": 0.6149, "step": 8380 }, { "epoch": 0.7731518855956637, "eval_GEN Loss": 0.4372888207435608, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32957908511161804, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7981069684028625, "eval_runtime": 56.3411, "eval_samples_per_second": 1.154, "eval_steps_per_second": 0.089, "step": 8380 }, { "epoch": 0.7732441471571906, "grad_norm": 1.83926053958227, "learning_rate": 1.6330587402443387e-07, "loss": 0.5811, "step": 8381 }, { "epoch": 0.7733364087187176, "grad_norm": 1.709832480091853, "learning_rate": 1.6317908002223602e-07, "loss": 0.5009, "step": 8382 }, { "epoch": 0.7734286702802445, "grad_norm": 2.0203237504155833, "learning_rate": 1.630523278709769e-07, "loss": 0.5465, "step": 8383 }, { "epoch": 0.7735209318417714, "grad_norm": 2.1510978093738493, "learning_rate": 1.6292561758214295e-07, "loss": 0.8014, "step": 8384 }, { "epoch": 0.7736131934032984, "grad_norm": 1.748037385470435, "learning_rate": 1.6279894916721704e-07, "loss": 0.7463, "step": 8385 }, { "epoch": 0.7736131934032984, "eval_GEN Loss": 0.4370570182800293, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33216702938079834, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7978065013885498, "eval_runtime": 56.4435, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 8385 }, { "epoch": 0.7737054549648252, "grad_norm": 2.069207962198144, "learning_rate": 1.6267232263767758e-07, "loss": 0.6089, "step": 8386 }, { "epoch": 0.7737977165263522, "grad_norm": 2.1148606221845445, "learning_rate": 1.6254573800500023e-07, "loss": 0.6534, "step": 8387 }, { "epoch": 0.7738899780878792, "grad_norm": 1.5103935617703588, "learning_rate": 1.6241919528065564e-07, "loss": 0.6036, "step": 8388 }, { "epoch": 0.773982239649406, "grad_norm": 1.6950361984446556, "learning_rate": 1.622926944761121e-07, "loss": 0.5449, "step": 8389 }, { "epoch": 0.774074501210933, "grad_norm": 2.7034609456927967, "learning_rate": 1.6216623560283264e-07, "loss": 0.773, "step": 8390 }, { "epoch": 0.774074501210933, "eval_GEN Loss": 0.43656986951828003, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33076009154319763, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7956730723381042, "eval_runtime": 56.1636, "eval_samples_per_second": 1.157, "eval_steps_per_second": 0.089, "step": 8390 }, { "epoch": 0.7741667627724599, "grad_norm": 2.3706798565284273, "learning_rate": 1.620398186722774e-07, "loss": 0.7273, "step": 8391 }, { "epoch": 0.7742590243339869, "grad_norm": 1.801212315803453, "learning_rate": 1.619134436959026e-07, "loss": 0.7376, "step": 8392 }, { "epoch": 0.7743512858955138, "grad_norm": 2.2091327411894373, "learning_rate": 1.6178711068516052e-07, "loss": 0.6799, "step": 8393 }, { "epoch": 0.7744435474570407, "grad_norm": 1.7759667041144558, "learning_rate": 1.6166081965149953e-07, "loss": 0.5389, "step": 8394 }, { "epoch": 0.7745358090185677, "grad_norm": 3.005567912940057, "learning_rate": 1.6153457060636423e-07, "loss": 0.909, "step": 8395 }, { "epoch": 0.7745358090185677, "eval_GEN Loss": 0.4366840422153473, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33229777216911316, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7965144515037537, "eval_runtime": 56.3742, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8395 }, { "epoch": 0.7746280705800945, "grad_norm": 1.919581087619379, "learning_rate": 1.6140836356119591e-07, "loss": 0.6555, "step": 8396 }, { "epoch": 0.7747203321416215, "grad_norm": 1.4784583574010643, "learning_rate": 1.612821985274312e-07, "loss": 0.6898, "step": 8397 }, { "epoch": 0.7748125937031485, "grad_norm": 2.2811783193897006, "learning_rate": 1.611560755165037e-07, "loss": 0.6329, "step": 8398 }, { "epoch": 0.7749048552646753, "grad_norm": 1.8856223825493281, "learning_rate": 1.610299945398424e-07, "loss": 0.6095, "step": 8399 }, { "epoch": 0.7749971168262023, "grad_norm": 1.534555832367856, "learning_rate": 1.6090395560887366e-07, "loss": 0.4561, "step": 8400 }, { "epoch": 0.7749971168262023, "eval_GEN Loss": 0.4371236264705658, "eval_GEN top-5 accuracy": 0.9829022358614643, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33130961656570435, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.797656238079071, "eval_runtime": 56.4154, "eval_samples_per_second": 1.152, "eval_steps_per_second": 0.089, "step": 8400 }, { "epoch": 0.7750893783877292, "grad_norm": 2.454928406056304, "learning_rate": 1.6077795873501881e-07, "loss": 0.6131, "step": 8401 }, { "epoch": 0.7751816399492562, "grad_norm": 1.5039487656523156, "learning_rate": 1.6065200392969596e-07, "loss": 0.5354, "step": 8402 }, { "epoch": 0.775273901510783, "grad_norm": 2.010154197211754, "learning_rate": 1.6052609120431946e-07, "loss": 0.8682, "step": 8403 }, { "epoch": 0.77536616307231, "grad_norm": 3.0199729574010226, "learning_rate": 1.6040022057029988e-07, "loss": 0.7326, "step": 8404 }, { "epoch": 0.775458424633837, "grad_norm": 2.4929222921214493, "learning_rate": 1.6027439203904336e-07, "loss": 0.6189, "step": 8405 }, { "epoch": 0.775458424633837, "eval_GEN Loss": 0.43548187613487244, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.33075666427612305, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7927283644676208, "eval_runtime": 57.1772, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8405 }, { "epoch": 0.7755506861953638, "grad_norm": 1.5760521723629257, "learning_rate": 1.6014860562195298e-07, "loss": 0.5906, "step": 8406 }, { "epoch": 0.7756429477568908, "grad_norm": 1.819018855560146, "learning_rate": 1.6002286133042777e-07, "loss": 0.5897, "step": 8407 }, { "epoch": 0.7757352093184177, "grad_norm": 2.2427989979178626, "learning_rate": 1.598971591758626e-07, "loss": 0.6323, "step": 8408 }, { "epoch": 0.7758274708799446, "grad_norm": 2.971123630184401, "learning_rate": 1.597714991696489e-07, "loss": 0.8218, "step": 8409 }, { "epoch": 0.7759197324414716, "grad_norm": 1.5886375418205465, "learning_rate": 1.5964588132317432e-07, "loss": 0.6229, "step": 8410 }, { "epoch": 0.7759197324414716, "eval_GEN Loss": 0.43598079681396484, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3324354588985443, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7974759340286255, "eval_runtime": 57.187, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8410 }, { "epoch": 0.7760119940029985, "grad_norm": 3.0988373331752075, "learning_rate": 1.5952030564782256e-07, "loss": 0.9405, "step": 8411 }, { "epoch": 0.7761042555645254, "grad_norm": 1.8283444389230543, "learning_rate": 1.5939477215497323e-07, "loss": 0.6484, "step": 8412 }, { "epoch": 0.7761965171260523, "grad_norm": 2.1726538469660026, "learning_rate": 1.592692808560025e-07, "loss": 0.7066, "step": 8413 }, { "epoch": 0.7762887786875793, "grad_norm": 2.3093499711298406, "learning_rate": 1.591438317622826e-07, "loss": 0.557, "step": 8414 }, { "epoch": 0.7763810402491063, "grad_norm": 1.8305854068291592, "learning_rate": 1.5901842488518212e-07, "loss": 0.5507, "step": 8415 }, { "epoch": 0.7763810402491063, "eval_GEN Loss": 0.43566375970840454, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3298782408237457, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7959434986114502, "eval_runtime": 57.3208, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8415 }, { "epoch": 0.7764733018106331, "grad_norm": 2.609164640974667, "learning_rate": 1.5889306023606527e-07, "loss": 0.8177, "step": 8416 }, { "epoch": 0.7765655633721601, "grad_norm": 2.0555377160793538, "learning_rate": 1.58767737826293e-07, "loss": 0.5983, "step": 8417 }, { "epoch": 0.776657824933687, "grad_norm": 1.2398433133818685, "learning_rate": 1.5864245766722214e-07, "loss": 0.396, "step": 8418 }, { "epoch": 0.7767500864952139, "grad_norm": 1.8688007746644697, "learning_rate": 1.5851721977020604e-07, "loss": 0.7133, "step": 8419 }, { "epoch": 0.7768423480567409, "grad_norm": 3.053504270685506, "learning_rate": 1.5839202414659354e-07, "loss": 0.8744, "step": 8420 }, { "epoch": 0.7768423480567409, "eval_GEN Loss": 0.4357409179210663, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3255630135536194, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7946814894676208, "eval_runtime": 57.0717, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8420 }, { "epoch": 0.7769346096182678, "grad_norm": 2.075738626393291, "learning_rate": 1.5826687080773028e-07, "loss": 0.5482, "step": 8421 }, { "epoch": 0.7770268711797947, "grad_norm": 2.1799876353530787, "learning_rate": 1.58141759764958e-07, "loss": 0.5394, "step": 8422 }, { "epoch": 0.7771191327413216, "grad_norm": 1.8528708632749227, "learning_rate": 1.5801669102961396e-07, "loss": 0.5852, "step": 8423 }, { "epoch": 0.7772113943028486, "grad_norm": 2.5462955358417476, "learning_rate": 1.5789166461303276e-07, "loss": 0.6367, "step": 8424 }, { "epoch": 0.7773036558643756, "grad_norm": 2.1919169175400004, "learning_rate": 1.5776668052654397e-07, "loss": 0.7394, "step": 8425 }, { "epoch": 0.7773036558643756, "eval_GEN Loss": 0.4357832968235016, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.3276459276676178, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.794140636920929, "eval_runtime": 57.4381, "eval_samples_per_second": 1.132, "eval_steps_per_second": 0.087, "step": 8425 }, { "epoch": 0.7773959174259024, "grad_norm": 2.406258853317111, "learning_rate": 1.5764173878147416e-07, "loss": 0.7939, "step": 8426 }, { "epoch": 0.7774881789874294, "grad_norm": 2.7606846408450245, "learning_rate": 1.5751683938914532e-07, "loss": 0.8564, "step": 8427 }, { "epoch": 0.7775804405489563, "grad_norm": 1.765638976619787, "learning_rate": 1.5739198236087666e-07, "loss": 0.5404, "step": 8428 }, { "epoch": 0.7776727021104832, "grad_norm": 2.4669027860241695, "learning_rate": 1.572671677079824e-07, "loss": 0.6651, "step": 8429 }, { "epoch": 0.7777649636720102, "grad_norm": 2.417401681053125, "learning_rate": 1.5714239544177384e-07, "loss": 0.8059, "step": 8430 }, { "epoch": 0.7777649636720102, "eval_GEN Loss": 0.43566399812698364, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32808634638786316, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7945011854171753, "eval_runtime": 57.2946, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8430 }, { "epoch": 0.7778572252335371, "grad_norm": 1.8004511005883805, "learning_rate": 1.570176655735576e-07, "loss": 0.7811, "step": 8431 }, { "epoch": 0.777949486795064, "grad_norm": 2.4099529180165153, "learning_rate": 1.5689297811463715e-07, "loss": 0.7216, "step": 8432 }, { "epoch": 0.7780417483565909, "grad_norm": 1.7697932532984162, "learning_rate": 1.56768333076312e-07, "loss": 0.742, "step": 8433 }, { "epoch": 0.7781340099181179, "grad_norm": 2.86734130069678, "learning_rate": 1.5664373046987716e-07, "loss": 0.8258, "step": 8434 }, { "epoch": 0.7782262714796447, "grad_norm": 1.3248291976713735, "learning_rate": 1.5651917030662503e-07, "loss": 0.5527, "step": 8435 }, { "epoch": 0.7782262714796447, "eval_GEN Loss": 0.4345187842845917, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.32732710242271423, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7926682829856873, "eval_runtime": 57.2382, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8435 }, { "epoch": 0.7783185330411717, "grad_norm": 2.3530330060096305, "learning_rate": 1.563946525978429e-07, "loss": 0.6324, "step": 8436 }, { "epoch": 0.7784107946026987, "grad_norm": 1.7469685136525641, "learning_rate": 1.5627017735481518e-07, "loss": 0.6074, "step": 8437 }, { "epoch": 0.7785030561642255, "grad_norm": 4.180933618359915, "learning_rate": 1.5614574458882133e-07, "loss": 0.8903, "step": 8438 }, { "epoch": 0.7785953177257525, "grad_norm": 1.5764636548428201, "learning_rate": 1.560213543111385e-07, "loss": 0.6509, "step": 8439 }, { "epoch": 0.7786875792872794, "grad_norm": 1.9622613144689192, "learning_rate": 1.5589700653303855e-07, "loss": 0.8077, "step": 8440 }, { "epoch": 0.7786875792872794, "eval_GEN Loss": 0.4354039132595062, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9024390243902439, "eval_PRM F1 AUC": 0.7936092194866422, "eval_PRM F1 Neg": 0.6666666666666666, "eval_PRM Loss": 0.327920526266098, "eval_PRM NPV": 0.64, "eval_PRM Precision": 0.9135802469135802, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7938100695610046, "eval_runtime": 57.112, "eval_samples_per_second": 1.138, "eval_steps_per_second": 0.088, "step": 8440 }, { "epoch": 0.7787798408488064, "grad_norm": 2.1625983523913, "learning_rate": 1.5577270126579023e-07, "loss": 0.598, "step": 8441 }, { "epoch": 0.7788721024103333, "grad_norm": 2.3081511161076502, "learning_rate": 1.5564843852065844e-07, "loss": 0.5846, "step": 8442 }, { "epoch": 0.7789643639718602, "grad_norm": 2.423641545959306, "learning_rate": 1.5552421830890382e-07, "loss": 0.7878, "step": 8443 }, { "epoch": 0.7790566255333872, "grad_norm": 1.1650994466303577, "learning_rate": 1.554000406417837e-07, "loss": 0.4173, "step": 8444 }, { "epoch": 0.779148887094914, "grad_norm": 1.8069209832255486, "learning_rate": 1.5527590553055062e-07, "loss": 0.4199, "step": 8445 }, { "epoch": 0.779148887094914, "eval_GEN Loss": 0.43526574969291687, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32563474774360657, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7942307591438293, "eval_runtime": 56.3842, "eval_samples_per_second": 1.153, "eval_steps_per_second": 0.089, "step": 8445 }, { "epoch": 0.779241148656441, "grad_norm": 2.0693549524086463, "learning_rate": 1.5515181298645467e-07, "loss": 0.5884, "step": 8446 }, { "epoch": 0.779333410217968, "grad_norm": 2.608434904625606, "learning_rate": 1.5502776302074086e-07, "loss": 0.865, "step": 8447 }, { "epoch": 0.7794256717794948, "grad_norm": 1.7899280858376254, "learning_rate": 1.5490375564465095e-07, "loss": 0.5205, "step": 8448 }, { "epoch": 0.7795179333410218, "grad_norm": 1.5995940750540711, "learning_rate": 1.5477979086942256e-07, "loss": 0.5967, "step": 8449 }, { "epoch": 0.7796101949025487, "grad_norm": 1.7945689867569454, "learning_rate": 1.546558687062899e-07, "loss": 0.6165, "step": 8450 }, { "epoch": 0.7796101949025487, "eval_GEN Loss": 0.4348452389240265, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3238103985786438, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7939603328704834, "eval_runtime": 57.2544, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 8450 }, { "epoch": 0.7797024564640757, "grad_norm": 2.207307700309632, "learning_rate": 1.5453198916648254e-07, "loss": 0.5056, "step": 8451 }, { "epoch": 0.7797947180256026, "grad_norm": 2.318646380103928, "learning_rate": 1.5440815226122688e-07, "loss": 0.734, "step": 8452 }, { "epoch": 0.7798869795871295, "grad_norm": 1.975864214164888, "learning_rate": 1.5428435800174537e-07, "loss": 0.6279, "step": 8453 }, { "epoch": 0.7799792411486565, "grad_norm": 2.111546802930889, "learning_rate": 1.5416060639925602e-07, "loss": 0.7407, "step": 8454 }, { "epoch": 0.7800715027101833, "grad_norm": 2.768733396803873, "learning_rate": 1.5403689746497364e-07, "loss": 0.8079, "step": 8455 }, { "epoch": 0.7800715027101833, "eval_GEN Loss": 0.4338414669036865, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3202202022075653, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7908653616905212, "eval_runtime": 57.2034, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8455 }, { "epoch": 0.7801637642717103, "grad_norm": 3.087517295963231, "learning_rate": 1.5391323121010896e-07, "loss": 0.5672, "step": 8456 }, { "epoch": 0.7802560258332373, "grad_norm": 2.308140592828051, "learning_rate": 1.5378960764586893e-07, "loss": 0.6422, "step": 8457 }, { "epoch": 0.7803482873947641, "grad_norm": 2.3212340936603155, "learning_rate": 1.5366602678345617e-07, "loss": 0.6882, "step": 8458 }, { "epoch": 0.7804405489562911, "grad_norm": 1.4858401972879265, "learning_rate": 1.5354248863406995e-07, "loss": 0.5245, "step": 8459 }, { "epoch": 0.780532810517818, "grad_norm": 1.3895377843735428, "learning_rate": 1.5341899320890552e-07, "loss": 0.5089, "step": 8460 }, { "epoch": 0.780532810517818, "eval_GEN Loss": 0.43400251865386963, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3228021562099457, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7951622605323792, "eval_runtime": 57.1615, "eval_samples_per_second": 1.137, "eval_steps_per_second": 0.087, "step": 8460 }, { "epoch": 0.780625072079345, "grad_norm": 2.43287510461366, "learning_rate": 1.5329554051915433e-07, "loss": 0.7847, "step": 8461 }, { "epoch": 0.7807173336408719, "grad_norm": 1.8202395165558156, "learning_rate": 1.531721305760036e-07, "loss": 0.5407, "step": 8462 }, { "epoch": 0.7808095952023988, "grad_norm": 2.125253751145254, "learning_rate": 1.5304876339063703e-07, "loss": 0.5581, "step": 8463 }, { "epoch": 0.7809018567639258, "grad_norm": 2.416374524819352, "learning_rate": 1.529254389742344e-07, "loss": 0.7278, "step": 8464 }, { "epoch": 0.7809941183254526, "grad_norm": 2.5091675371071345, "learning_rate": 1.5280215733797177e-07, "loss": 0.925, "step": 8465 }, { "epoch": 0.7809941183254526, "eval_GEN Loss": 0.4343210458755493, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3212469518184662, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7960637211799622, "eval_runtime": 57.2403, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8465 }, { "epoch": 0.7810863798869796, "grad_norm": 1.4489718916752958, "learning_rate": 1.5267891849302067e-07, "loss": 0.7478, "step": 8466 }, { "epoch": 0.7811786414485065, "grad_norm": 2.1050325239791565, "learning_rate": 1.5255572245054938e-07, "loss": 0.5855, "step": 8467 }, { "epoch": 0.7812709030100334, "grad_norm": 2.440869932847777, "learning_rate": 1.5243256922172239e-07, "loss": 0.775, "step": 8468 }, { "epoch": 0.7813631645715604, "grad_norm": 1.8062519451914112, "learning_rate": 1.5230945881769968e-07, "loss": 0.6174, "step": 8469 }, { "epoch": 0.7814554261330873, "grad_norm": 1.584341555063955, "learning_rate": 1.5218639124963776e-07, "loss": 0.7526, "step": 8470 }, { "epoch": 0.7814554261330873, "eval_GEN Loss": 0.43397843837738037, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3224678337574005, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7962740659713745, "eval_runtime": 57.2643, "eval_samples_per_second": 1.135, "eval_steps_per_second": 0.087, "step": 8470 }, { "epoch": 0.7815476876946142, "grad_norm": 1.9892205255928528, "learning_rate": 1.5206336652868928e-07, "loss": 0.679, "step": 8471 }, { "epoch": 0.7816399492561411, "grad_norm": 2.3807658449049507, "learning_rate": 1.5194038466600315e-07, "loss": 0.5927, "step": 8472 }, { "epoch": 0.7817322108176681, "grad_norm": 2.359705825709136, "learning_rate": 1.518174456727236e-07, "loss": 0.7308, "step": 8473 }, { "epoch": 0.7818244723791951, "grad_norm": 3.278155085145706, "learning_rate": 1.5169454955999232e-07, "loss": 0.879, "step": 8474 }, { "epoch": 0.7819167339407219, "grad_norm": 2.3238535609027586, "learning_rate": 1.5157169633894567e-07, "loss": 0.6518, "step": 8475 }, { "epoch": 0.7819167339407219, "eval_GEN Loss": 0.43384841084480286, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.324123352766037, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7957331538200378, "eval_runtime": 57.3092, "eval_samples_per_second": 1.134, "eval_steps_per_second": 0.087, "step": 8475 }, { "epoch": 0.7820089955022489, "grad_norm": 1.6792873894936133, "learning_rate": 1.5144888602071737e-07, "loss": 0.6335, "step": 8476 }, { "epoch": 0.7821012570637758, "grad_norm": 1.4885740189520988, "learning_rate": 1.5132611861643616e-07, "loss": 0.4749, "step": 8477 }, { "epoch": 0.7821935186253027, "grad_norm": 1.6940334695961665, "learning_rate": 1.5120339413722768e-07, "loss": 0.5082, "step": 8478 }, { "epoch": 0.7822857801868297, "grad_norm": 1.5820103337009979, "learning_rate": 1.510807125942136e-07, "loss": 0.6258, "step": 8479 }, { "epoch": 0.7823780417483566, "grad_norm": 2.5741502828695437, "learning_rate": 1.5095807399851086e-07, "loss": 0.5594, "step": 8480 }, { "epoch": 0.7823780417483566, "eval_GEN Loss": 0.43457165360450745, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.3251239061355591, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.793870210647583, "eval_runtime": 56.916, "eval_samples_per_second": 1.142, "eval_steps_per_second": 0.088, "step": 8480 }, { "epoch": 0.7824703033098835, "grad_norm": 2.004361870066249, "learning_rate": 1.5083547836123404e-07, "loss": 0.6361, "step": 8481 }, { "epoch": 0.7825625648714104, "grad_norm": 2.0751821048758905, "learning_rate": 1.5071292569349234e-07, "loss": 0.6794, "step": 8482 }, { "epoch": 0.7826548264329374, "grad_norm": 2.3503941692417873, "learning_rate": 1.50590416006392e-07, "loss": 0.6935, "step": 8483 }, { "epoch": 0.7827470879944644, "grad_norm": 2.7775134316779395, "learning_rate": 1.5046794931103454e-07, "loss": 0.7783, "step": 8484 }, { "epoch": 0.7828393495559912, "grad_norm": 1.8101691019615114, "learning_rate": 1.503455256185188e-07, "loss": 0.6455, "step": 8485 }, { "epoch": 0.7828393495559912, "eval_GEN Loss": 0.43448564410209656, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32665809988975525, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7944411039352417, "eval_runtime": 56.9786, "eval_samples_per_second": 1.141, "eval_steps_per_second": 0.088, "step": 8485 }, { "epoch": 0.7829316111175182, "grad_norm": 2.5234703535494116, "learning_rate": 1.5022314493993849e-07, "loss": 0.7019, "step": 8486 }, { "epoch": 0.783023872679045, "grad_norm": 1.668563896717364, "learning_rate": 1.5010080728638424e-07, "loss": 0.6153, "step": 8487 }, { "epoch": 0.783116134240572, "grad_norm": 1.925825092714134, "learning_rate": 1.4997851266894215e-07, "loss": 0.6094, "step": 8488 }, { "epoch": 0.783208395802099, "grad_norm": 1.481221464506428, "learning_rate": 1.49856261098695e-07, "loss": 0.576, "step": 8489 }, { "epoch": 0.7833006573636259, "grad_norm": 2.641590183649685, "learning_rate": 1.4973405258672129e-07, "loss": 1.0045, "step": 8490 }, { "epoch": 0.7833006573636259, "eval_GEN Loss": 0.43546396493911743, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32905712723731995, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.793749988079071, "eval_runtime": 57.0918, "eval_samples_per_second": 1.139, "eval_steps_per_second": 0.088, "step": 8490 }, { "epoch": 0.7833929189251528, "grad_norm": 2.2555101852496726, "learning_rate": 1.496118871440958e-07, "loss": 0.7047, "step": 8491 }, { "epoch": 0.7834851804866797, "grad_norm": 2.983415091979887, "learning_rate": 1.4948976478188956e-07, "loss": 0.7618, "step": 8492 }, { "epoch": 0.7835774420482067, "grad_norm": 2.590744665606835, "learning_rate": 1.493676855111692e-07, "loss": 0.644, "step": 8493 }, { "epoch": 0.7836697036097336, "grad_norm": 2.3065638789455982, "learning_rate": 1.4924564934299793e-07, "loss": 0.6444, "step": 8494 }, { "epoch": 0.7837619651712605, "grad_norm": 2.227353463982034, "learning_rate": 1.4912365628843447e-07, "loss": 0.8847, "step": 8495 }, { "epoch": 0.7837619651712605, "eval_GEN Loss": 0.4348280131816864, "eval_GEN top-5 accuracy": 0.9833406400701447, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.32969358563423157, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7927584052085876, "eval_runtime": 57.2277, "eval_samples_per_second": 1.136, "eval_steps_per_second": 0.087, "step": 8495 }, { "epoch": 0.7838542267327875, "grad_norm": 2.572387001506329, "learning_rate": 1.4900170635853467e-07, "loss": 0.6738, "step": 8496 }, { "epoch": 0.7839464882943143, "grad_norm": 1.9649865363409786, "learning_rate": 1.488797995643492e-07, "loss": 0.7222, "step": 8497 }, { "epoch": 0.7840387498558413, "grad_norm": 2.4339860211537307, "learning_rate": 1.4875793591692583e-07, "loss": 0.7584, "step": 8498 }, { "epoch": 0.7841310114173682, "grad_norm": 2.2221872186283447, "learning_rate": 1.4863611542730785e-07, "loss": 0.8218, "step": 8499 }, { "epoch": 0.7842232729788952, "grad_norm": 2.215116996980214, "learning_rate": 1.4851433810653508e-07, "loss": 0.8638, "step": 8500 }, { "epoch": 0.7842232729788952, "eval_GEN Loss": 0.43536677956581116, "eval_GEN top-5 accuracy": 0.9837790442788251, "eval_PRM Accuracy": 0.8584905660377359, "eval_PRM F1": 0.9090909090909091, "eval_PRM F1 AUC": 0.7996333158721844, "eval_PRM F1 Neg": 0.6808510638297872, "eval_PRM Loss": 0.33258911967277527, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.9146341463414634, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.7951322197914124, "eval_runtime": 57.3669, "eval_samples_per_second": 1.133, "eval_steps_per_second": 0.087, "step": 8500 } ], "logging_steps": 1, "max_steps": 10838, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": false }, "attributes": {} } }, "total_flos": 267795579617280.0, "train_batch_size": 2, "trial_name": null, "trial_params": null }