{ "best_metric": null, "best_model_checkpoint": null, "epoch": 0.9999678011398396, "eval_steps": 5, "global_step": 3882, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.5429544264012572, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.4157159328460693, "eval_runtime": 15.9699, "eval_samples_per_second": 2.755, "eval_steps_per_second": 0.188, "step": 0 }, { "epoch": 0.00025759088128280257, "grad_norm": 0.8051918506636666, "learning_rate": 2.570694087403599e-07, "loss": 2.3123, "step": 1 }, { "epoch": 0.0005151817625656051, "grad_norm": 0.6504008311511874, "learning_rate": 5.141388174807198e-07, "loss": 2.0026, "step": 2 }, { "epoch": 0.0007727726438484078, "grad_norm": 0.6831669558853579, "learning_rate": 7.712082262210797e-07, "loss": 2.273, "step": 3 }, { "epoch": 0.0010303635251312103, "grad_norm": 0.7544623732284279, "learning_rate": 1.0282776349614395e-06, "loss": 2.3691, "step": 4 }, { "epoch": 0.001287954406414013, "grad_norm": 0.8970171709833432, "learning_rate": 1.2853470437017995e-06, "loss": 2.4009, "step": 5 }, { "epoch": 0.001287954406414013, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.5392875851231012, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.423478603363037, "eval_runtime": 17.5437, "eval_samples_per_second": 2.508, "eval_steps_per_second": 0.171, "step": 5 }, { "epoch": 0.0015455452876968155, "grad_norm": 0.8330047843260688, "learning_rate": 1.5424164524421595e-06, "loss": 2.4836, "step": 6 }, { "epoch": 0.0018031361689796182, "grad_norm": 0.7964684277328417, "learning_rate": 1.7994858611825194e-06, "loss": 2.377, "step": 7 }, { "epoch": 0.0020607270502624206, "grad_norm": 0.7688399696495979, "learning_rate": 2.056555269922879e-06, "loss": 2.399, "step": 8 }, { "epoch": 0.002318317931545223, "grad_norm": 0.7883631693566643, "learning_rate": 2.313624678663239e-06, "loss": 2.3927, "step": 9 }, { "epoch": 0.002575908812828026, "grad_norm": 0.8206910541503305, "learning_rate": 2.570694087403599e-06, "loss": 2.5266, "step": 10 }, { "epoch": 0.002575908812828026, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.539287585123101, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.4073431491851807, "eval_runtime": 16.6728, "eval_samples_per_second": 2.639, "eval_steps_per_second": 0.18, "step": 10 }, { "epoch": 0.0028334996941108284, "grad_norm": 0.8369215273897154, "learning_rate": 2.8277634961439587e-06, "loss": 2.6343, "step": 11 }, { "epoch": 0.003091090575393631, "grad_norm": 0.7550418511394903, "learning_rate": 3.084832904884319e-06, "loss": 2.2193, "step": 12 }, { "epoch": 0.0033486814566764337, "grad_norm": 0.7637079998742741, "learning_rate": 3.3419023136246787e-06, "loss": 2.4411, "step": 13 }, { "epoch": 0.0036062723379592363, "grad_norm": 0.7743593751053474, "learning_rate": 3.598971722365039e-06, "loss": 2.4353, "step": 14 }, { "epoch": 0.003863863219242039, "grad_norm": 0.7500281156214608, "learning_rate": 3.856041131105398e-06, "loss": 2.0151, "step": 15 }, { "epoch": 0.003863863219242039, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.5358826610790991, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.3990285396575928, "eval_runtime": 16.9366, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 15 }, { "epoch": 0.004121454100524841, "grad_norm": 0.9354540659707624, "learning_rate": 4.113110539845758e-06, "loss": 2.774, "step": 16 }, { "epoch": 0.004379044981807644, "grad_norm": 0.7880083262169871, "learning_rate": 4.370179948586119e-06, "loss": 2.1761, "step": 17 }, { "epoch": 0.004636635863090446, "grad_norm": 0.8544310034985346, "learning_rate": 4.627249357326478e-06, "loss": 2.4548, "step": 18 }, { "epoch": 0.0048942267443732495, "grad_norm": 0.758651866184643, "learning_rate": 4.884318766066838e-06, "loss": 1.9793, "step": 19 }, { "epoch": 0.005151817625656052, "grad_norm": 0.9540683765325954, "learning_rate": 5.141388174807198e-06, "loss": 2.4581, "step": 20 }, { "epoch": 0.005151817625656052, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.5424305919329493, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.3500921726226807, "eval_runtime": 17.1383, "eval_samples_per_second": 2.567, "eval_steps_per_second": 0.175, "step": 20 }, { "epoch": 0.005409408506938855, "grad_norm": 0.9223911764470025, "learning_rate": 5.398457583547558e-06, "loss": 2.4388, "step": 21 }, { "epoch": 0.005666999388221657, "grad_norm": 0.9480623938341571, "learning_rate": 5.6555269922879175e-06, "loss": 2.5247, "step": 22 }, { "epoch": 0.00592459026950446, "grad_norm": 0.9032837632960887, "learning_rate": 5.912596401028278e-06, "loss": 2.1964, "step": 23 }, { "epoch": 0.006182181150787262, "grad_norm": 0.8802500159367916, "learning_rate": 6.169665809768638e-06, "loss": 2.3572, "step": 24 }, { "epoch": 0.006439772032070064, "grad_norm": 0.8590674687942792, "learning_rate": 6.426735218508998e-06, "loss": 2.3108, "step": 25 }, { "epoch": 0.006439772032070064, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.5390256678889471, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.2937705516815186, "eval_runtime": 17.5628, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 25 }, { "epoch": 0.006697362913352867, "grad_norm": 0.9133613529417643, "learning_rate": 6.683804627249357e-06, "loss": 2.247, "step": 26 }, { "epoch": 0.00695495379463567, "grad_norm": 1.0117622857576738, "learning_rate": 6.940874035989718e-06, "loss": 2.4818, "step": 27 }, { "epoch": 0.007212544675918473, "grad_norm": 0.8353370483325568, "learning_rate": 7.197943444730078e-06, "loss": 2.0124, "step": 28 }, { "epoch": 0.007470135557201275, "grad_norm": 0.896092221073639, "learning_rate": 7.4550128534704376e-06, "loss": 2.0647, "step": 29 }, { "epoch": 0.007727726438484078, "grad_norm": 0.9318348830048263, "learning_rate": 7.712082262210796e-06, "loss": 2.1209, "step": 30 }, { "epoch": 0.007727726438484078, "eval_PRM Accuracy": 0.2169811320754717, "eval_PRM F1": 0.0, "eval_PRM F1 AUC": 0.5, "eval_PRM F1 AUC (fixed)": 0.536668412781561, "eval_PRM F1 Neg": 0.35658914728682173, "eval_PRM NPV": 0.2169811320754717, "eval_PRM Precision": 0.0, "eval_PRM Recall": 0.0, "eval_PRM Specificty": 1.0, "eval_loss": 2.173092842102051, "eval_runtime": 17.0642, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 30 }, { "epoch": 0.00798531731976688, "grad_norm": 1.0558922414062275, "learning_rate": 7.969151670951156e-06, "loss": 2.2368, "step": 31 }, { "epoch": 0.008242908201049682, "grad_norm": 0.9362611865277034, "learning_rate": 8.226221079691516e-06, "loss": 1.9336, "step": 32 }, { "epoch": 0.008500499082332486, "grad_norm": 0.9108463665312627, "learning_rate": 8.483290488431877e-06, "loss": 1.8443, "step": 33 }, { "epoch": 0.008758089963615288, "grad_norm": 0.9079402465898436, "learning_rate": 8.740359897172237e-06, "loss": 1.9206, "step": 34 }, { "epoch": 0.00901568084489809, "grad_norm": 0.9037053465966511, "learning_rate": 8.997429305912597e-06, "loss": 1.8145, "step": 35 }, { "epoch": 0.00901568084489809, "eval_PRM Accuracy": 0.22641509433962265, "eval_PRM F1": 0.023809523809523808, "eval_PRM F1 AUC": 0.5060240963855421, "eval_PRM F1 AUC (fixed)": 0.5440020953378732, "eval_PRM F1 Neg": 0.359375, "eval_PRM NPV": 0.21904761904761905, "eval_PRM Precision": 1.0, "eval_PRM Recall": 0.012048192771084338, "eval_PRM Specificty": 1.0, "eval_loss": 1.998551845550537, "eval_runtime": 16.8543, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 35 }, { "epoch": 0.009273271726180893, "grad_norm": 1.0002437475971433, "learning_rate": 9.254498714652957e-06, "loss": 1.8602, "step": 36 }, { "epoch": 0.009530862607463695, "grad_norm": 0.8854871915785585, "learning_rate": 9.511568123393317e-06, "loss": 1.6786, "step": 37 }, { "epoch": 0.009788453488746499, "grad_norm": 1.3480807223592863, "learning_rate": 9.768637532133676e-06, "loss": 1.983, "step": 38 }, { "epoch": 0.010046044370029301, "grad_norm": 1.0498438068866873, "learning_rate": 1.0025706940874038e-05, "loss": 1.7863, "step": 39 }, { "epoch": 0.010303635251312103, "grad_norm": 0.8645566617587029, "learning_rate": 1.0282776349614396e-05, "loss": 1.5971, "step": 40 }, { "epoch": 0.010303635251312103, "eval_PRM Accuracy": 0.22641509433962265, "eval_PRM F1": 0.046511627906976744, "eval_PRM F1 AUC": 0.4903090623363018, "eval_PRM F1 AUC (fixed)": 0.5497642744892614, "eval_PRM F1 Neg": 0.3492063492063492, "eval_PRM NPV": 0.21359223300970873, "eval_PRM Precision": 0.6666666666666666, "eval_PRM Recall": 0.024096385542168676, "eval_PRM Specificty": 0.9565217391304348, "eval_loss": 1.7518699169158936, "eval_runtime": 16.9621, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 40 }, { "epoch": 0.010561226132594905, "grad_norm": 1.0979943699513763, "learning_rate": 1.0539845758354756e-05, "loss": 1.8441, "step": 41 }, { "epoch": 0.01081881701387771, "grad_norm": 0.9858112048400034, "learning_rate": 1.0796915167095115e-05, "loss": 1.4734, "step": 42 }, { "epoch": 0.011076407895160512, "grad_norm": 0.9826991597646841, "learning_rate": 1.1053984575835475e-05, "loss": 1.4919, "step": 43 }, { "epoch": 0.011333998776443314, "grad_norm": 0.9862761379290508, "learning_rate": 1.1311053984575835e-05, "loss": 1.4041, "step": 44 }, { "epoch": 0.011591589657726116, "grad_norm": 0.9104499793280701, "learning_rate": 1.1568123393316196e-05, "loss": 1.4358, "step": 45 }, { "epoch": 0.011591589657726116, "eval_PRM Accuracy": 0.25471698113207547, "eval_PRM F1": 0.11235955056179775, "eval_PRM F1 AUC": 0.5083813514929283, "eval_PRM F1 AUC (fixed)": 0.5531691985332635, "eval_PRM F1 Neg": 0.35772357723577236, "eval_PRM NPV": 0.22, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.060240963855421686, "eval_PRM Specificty": 0.9565217391304348, "eval_loss": 1.4646550416946411, "eval_runtime": 16.4245, "eval_samples_per_second": 2.679, "eval_steps_per_second": 0.183, "step": 45 }, { "epoch": 0.01184918053900892, "grad_norm": 0.8696901806982194, "learning_rate": 1.1825192802056556e-05, "loss": 1.2637, "step": 46 }, { "epoch": 0.012106771420291722, "grad_norm": 0.9364163540519426, "learning_rate": 1.2082262210796916e-05, "loss": 1.4164, "step": 47 }, { "epoch": 0.012364362301574524, "grad_norm": 0.8216872168739721, "learning_rate": 1.2339331619537276e-05, "loss": 1.1048, "step": 48 }, { "epoch": 0.012621953182857326, "grad_norm": 0.9035446323192594, "learning_rate": 1.2596401028277636e-05, "loss": 1.2616, "step": 49 }, { "epoch": 0.012879544064140129, "grad_norm": 0.5908342218030821, "learning_rate": 1.2853470437017995e-05, "loss": 0.9679, "step": 50 }, { "epoch": 0.012879544064140129, "eval_PRM Accuracy": 0.3490566037735849, "eval_PRM F1": 0.34285714285714286, "eval_PRM F1 AUC": 0.5214772132006286, "eval_PRM F1 AUC (fixed)": 0.5487166055526453, "eval_PRM F1 Neg": 0.35514018691588783, "eval_PRM NPV": 0.2261904761904762, "eval_PRM Precision": 0.8181818181818182, "eval_PRM Recall": 0.21686746987951808, "eval_PRM Specificty": 0.8260869565217391, "eval_loss": 1.152876377105713, "eval_runtime": 16.9732, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 50 }, { "epoch": 0.013137134945422933, "grad_norm": 0.7045028702966702, "learning_rate": 1.3110539845758355e-05, "loss": 1.1022, "step": 51 }, { "epoch": 0.013394725826705735, "grad_norm": 0.5388857735593554, "learning_rate": 1.3367609254498715e-05, "loss": 1.1006, "step": 52 }, { "epoch": 0.013652316707988537, "grad_norm": 0.5452779007768951, "learning_rate": 1.3624678663239075e-05, "loss": 0.947, "step": 53 }, { "epoch": 0.01390990758927134, "grad_norm": 0.6110093049693048, "learning_rate": 1.3881748071979436e-05, "loss": 0.9761, "step": 54 }, { "epoch": 0.014167498470554143, "grad_norm": 0.4850433742895813, "learning_rate": 1.4138817480719796e-05, "loss": 0.829, "step": 55 }, { "epoch": 0.014167498470554143, "eval_PRM Accuracy": 0.5, "eval_PRM F1": 0.6015037593984962, "eval_PRM F1 AUC": 0.5235725510738607, "eval_PRM F1 AUC (fixed)": 0.5581456259821896, "eval_PRM F1 Neg": 0.3291139240506329, "eval_PRM NPV": 0.23214285714285715, "eval_PRM Precision": 0.8, "eval_PRM Recall": 0.4819277108433735, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.9325727820396423, "eval_runtime": 17.1055, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 55 }, { "epoch": 0.014425089351836945, "grad_norm": 0.3359339613965973, "learning_rate": 1.4395886889460156e-05, "loss": 0.8123, "step": 56 }, { "epoch": 0.014682680233119748, "grad_norm": 0.3896172539980878, "learning_rate": 1.4652956298200515e-05, "loss": 0.757, "step": 57 }, { "epoch": 0.01494027111440255, "grad_norm": 0.19375563528447443, "learning_rate": 1.4910025706940875e-05, "loss": 0.7805, "step": 58 }, { "epoch": 0.015197861995685352, "grad_norm": 0.251097380622233, "learning_rate": 1.5167095115681235e-05, "loss": 0.7663, "step": 59 }, { "epoch": 0.015455452876968156, "grad_norm": 0.3421838491024599, "learning_rate": 1.5424164524421593e-05, "loss": 0.685, "step": 60 }, { "epoch": 0.015455452876968156, "eval_PRM Accuracy": 0.6320754716981132, "eval_PRM F1": 0.7607361963190185, "eval_PRM F1 AUC": 0.4821896280775274, "eval_PRM F1 AUC (fixed)": 0.5780513357778941, "eval_PRM F1 Neg": 0.20408163265306123, "eval_PRM NPV": 0.19230769230769232, "eval_PRM Precision": 0.775, "eval_PRM Recall": 0.7469879518072289, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.8294566869735718, "eval_runtime": 16.9927, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 60 }, { "epoch": 0.015713043758250958, "grad_norm": 0.2440925507542803, "learning_rate": 1.5681233933161953e-05, "loss": 0.5873, "step": 61 }, { "epoch": 0.01597063463953376, "grad_norm": 0.15104598040732764, "learning_rate": 1.5938303341902313e-05, "loss": 0.6311, "step": 62 }, { "epoch": 0.016228225520816562, "grad_norm": 0.3089989759736661, "learning_rate": 1.6195372750642672e-05, "loss": 0.8766, "step": 63 }, { "epoch": 0.016485816402099365, "grad_norm": 0.26484009633010885, "learning_rate": 1.6452442159383032e-05, "loss": 0.7188, "step": 64 }, { "epoch": 0.016743407283382167, "grad_norm": 0.2337554037482912, "learning_rate": 1.6709511568123395e-05, "loss": 0.788, "step": 65 }, { "epoch": 0.016743407283382167, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8457142857142858, "eval_PRM F1 AUC": 0.5544787847040336, "eval_PRM F1 AUC (fixed)": 0.5953378732320587, "eval_PRM F1 Neg": 0.2702702702702703, "eval_PRM NPV": 0.35714285714285715, "eval_PRM Precision": 0.8043478260869565, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.8297230005264282, "eval_runtime": 17.6404, "eval_samples_per_second": 2.494, "eval_steps_per_second": 0.17, "step": 65 }, { "epoch": 0.017000998164664972, "grad_norm": 0.1911808703380372, "learning_rate": 1.6966580976863755e-05, "loss": 0.6419, "step": 66 }, { "epoch": 0.017258589045947775, "grad_norm": 0.40995439764688685, "learning_rate": 1.7223650385604115e-05, "loss": 0.9034, "step": 67 }, { "epoch": 0.017516179927230577, "grad_norm": 0.48022926582155917, "learning_rate": 1.7480719794344475e-05, "loss": 0.8713, "step": 68 }, { "epoch": 0.01777377080851338, "grad_norm": 0.3650960041222673, "learning_rate": 1.7737789203084834e-05, "loss": 0.8209, "step": 69 }, { "epoch": 0.01803136168979618, "grad_norm": 0.5294308132341357, "learning_rate": 1.7994858611825194e-05, "loss": 0.8833, "step": 70 }, { "epoch": 0.01803136168979618, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8457142857142858, "eval_PRM F1 AUC": 0.5544787847040336, "eval_PRM F1 AUC (fixed)": 0.605552645364065, "eval_PRM F1 Neg": 0.2702702702702703, "eval_PRM NPV": 0.35714285714285715, "eval_PRM Precision": 0.8043478260869565, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.8277698755264282, "eval_runtime": 17.3953, "eval_samples_per_second": 2.529, "eval_steps_per_second": 0.172, "step": 70 }, { "epoch": 0.018288952571078983, "grad_norm": 0.29727869767430204, "learning_rate": 1.8251928020565554e-05, "loss": 0.7649, "step": 71 }, { "epoch": 0.018546543452361786, "grad_norm": 0.3811293140967061, "learning_rate": 1.8508997429305914e-05, "loss": 0.745, "step": 72 }, { "epoch": 0.018804134333644588, "grad_norm": 0.1474695447123835, "learning_rate": 1.8766066838046273e-05, "loss": 0.5767, "step": 73 }, { "epoch": 0.01906172521492739, "grad_norm": 0.16434763897841323, "learning_rate": 1.9023136246786633e-05, "loss": 0.6535, "step": 74 }, { "epoch": 0.019319316096210196, "grad_norm": 0.12518156340136305, "learning_rate": 1.9280205655526993e-05, "loss": 0.572, "step": 75 }, { "epoch": 0.019319316096210196, "eval_PRM Accuracy": 0.7264150943396226, "eval_PRM F1": 0.8323699421965318, "eval_PRM F1 AUC": 0.5424305919329492, "eval_PRM F1 AUC (fixed)": 0.6086956521739131, "eval_PRM F1 Neg": 0.2564102564102564, "eval_PRM NPV": 0.3125, "eval_PRM Precision": 0.8, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.8133878111839294, "eval_runtime": 17.1592, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 75 }, { "epoch": 0.019576906977492998, "grad_norm": 0.2861216290044323, "learning_rate": 1.9537275064267353e-05, "loss": 0.6898, "step": 76 }, { "epoch": 0.0198344978587758, "grad_norm": 0.19202267264915562, "learning_rate": 1.9794344473007716e-05, "loss": 0.6944, "step": 77 }, { "epoch": 0.020092088740058602, "grad_norm": 0.17177799421815249, "learning_rate": 2.0051413881748076e-05, "loss": 0.6358, "step": 78 }, { "epoch": 0.020349679621341404, "grad_norm": 0.4074744596049904, "learning_rate": 2.0308483290488432e-05, "loss": 0.907, "step": 79 }, { "epoch": 0.020607270502624207, "grad_norm": 0.20044860761151412, "learning_rate": 2.0565552699228792e-05, "loss": 0.7944, "step": 80 }, { "epoch": 0.020607270502624207, "eval_PRM Accuracy": 0.7075471698113207, "eval_PRM F1": 0.8187134502923976, "eval_PRM F1 AUC": 0.5303823991618648, "eval_PRM F1 AUC (fixed)": 0.6157674174960712, "eval_PRM F1 Neg": 0.24390243902439024, "eval_PRM NPV": 0.2777777777777778, "eval_PRM Precision": 0.7954545454545454, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.8000710010528564, "eval_runtime": 16.7799, "eval_samples_per_second": 2.622, "eval_steps_per_second": 0.179, "step": 80 }, { "epoch": 0.02086486138390701, "grad_norm": 0.13701795649516482, "learning_rate": 2.082262210796915e-05, "loss": 0.515, "step": 81 }, { "epoch": 0.02112245226518981, "grad_norm": 0.13006567894740256, "learning_rate": 2.107969151670951e-05, "loss": 0.6353, "step": 82 }, { "epoch": 0.021380043146472613, "grad_norm": 0.1518960998734976, "learning_rate": 2.133676092544987e-05, "loss": 0.6871, "step": 83 }, { "epoch": 0.02163763402775542, "grad_norm": 0.12490936231146701, "learning_rate": 2.159383033419023e-05, "loss": 0.6212, "step": 84 }, { "epoch": 0.02189522490903822, "grad_norm": 0.14481744514671652, "learning_rate": 2.185089974293059e-05, "loss": 0.6463, "step": 85 }, { "epoch": 0.02189522490903822, "eval_PRM Accuracy": 0.6698113207547169, "eval_PRM F1": 0.7904191616766467, "eval_PRM F1 AUC": 0.5062860136196962, "eval_PRM F1 AUC (fixed)": 0.6246726034573075, "eval_PRM F1 Neg": 0.2222222222222222, "eval_PRM NPV": 0.22727272727272727, "eval_PRM Precision": 0.7857142857142857, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7958984375, "eval_runtime": 16.6365, "eval_samples_per_second": 2.645, "eval_steps_per_second": 0.18, "step": 85 }, { "epoch": 0.022152815790321023, "grad_norm": 0.2761576885999609, "learning_rate": 2.210796915167095e-05, "loss": 0.7789, "step": 86 }, { "epoch": 0.022410406671603825, "grad_norm": 0.3076896950510689, "learning_rate": 2.236503856041131e-05, "loss": 0.8013, "step": 87 }, { "epoch": 0.022667997552886628, "grad_norm": 0.1381424015291319, "learning_rate": 2.262210796915167e-05, "loss": 0.6188, "step": 88 }, { "epoch": 0.02292558843416943, "grad_norm": 0.23919741447539714, "learning_rate": 2.2879177377892033e-05, "loss": 0.6455, "step": 89 }, { "epoch": 0.023183179315452232, "grad_norm": 0.1723837628396957, "learning_rate": 2.3136246786632393e-05, "loss": 0.7532, "step": 90 }, { "epoch": 0.023183179315452232, "eval_PRM Accuracy": 0.6226415094339622, "eval_PRM F1": 0.7530864197530864, "eval_PRM F1 AUC": 0.47616553169198533, "eval_PRM F1 AUC (fixed)": 0.6210057621791514, "eval_PRM F1 Neg": 0.2, "eval_PRM NPV": 0.18518518518518517, "eval_PRM Precision": 0.7721518987341772, "eval_PRM Recall": 0.7349397590361446, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.8022904992103577, "eval_runtime": 16.7896, "eval_samples_per_second": 2.621, "eval_steps_per_second": 0.179, "step": 90 }, { "epoch": 0.023440770196735034, "grad_norm": 0.2123413450675764, "learning_rate": 2.3393316195372753e-05, "loss": 0.6432, "step": 91 }, { "epoch": 0.02369836107801784, "grad_norm": 0.18069067070384887, "learning_rate": 2.3650385604113112e-05, "loss": 0.7004, "step": 92 }, { "epoch": 0.023955951959300642, "grad_norm": 0.1446062857149826, "learning_rate": 2.3907455012853472e-05, "loss": 0.6474, "step": 93 }, { "epoch": 0.024213542840583444, "grad_norm": 0.14091684315023018, "learning_rate": 2.4164524421593832e-05, "loss": 0.6335, "step": 94 }, { "epoch": 0.024471133721866246, "grad_norm": 0.20692690736920014, "learning_rate": 2.4421593830334192e-05, "loss": 0.6736, "step": 95 }, { "epoch": 0.024471133721866246, "eval_PRM Accuracy": 0.6320754716981132, "eval_PRM F1": 0.7607361963190185, "eval_PRM F1 AUC": 0.4821896280775274, "eval_PRM F1 AUC (fixed)": 0.641697223677318, "eval_PRM F1 Neg": 0.20408163265306123, "eval_PRM NPV": 0.19230769230769232, "eval_PRM Precision": 0.775, "eval_PRM Recall": 0.7469879518072289, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7978515625, "eval_runtime": 17.0287, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 95 }, { "epoch": 0.02472872460314905, "grad_norm": 0.15649382065534395, "learning_rate": 2.467866323907455e-05, "loss": 0.665, "step": 96 }, { "epoch": 0.02498631548443185, "grad_norm": 0.1373927352214366, "learning_rate": 2.493573264781491e-05, "loss": 0.7147, "step": 97 }, { "epoch": 0.025243906365714653, "grad_norm": 0.15331633330972608, "learning_rate": 2.519280205655527e-05, "loss": 0.6507, "step": 98 }, { "epoch": 0.025501497246997455, "grad_norm": 0.22498272198301814, "learning_rate": 2.5449871465295634e-05, "loss": 0.6591, "step": 99 }, { "epoch": 0.025759088128280257, "grad_norm": 0.13631404182762633, "learning_rate": 2.570694087403599e-05, "loss": 0.6483, "step": 100 }, { "epoch": 0.025759088128280257, "eval_PRM Accuracy": 0.6509433962264151, "eval_PRM F1": 0.7757575757575758, "eval_PRM F1 AUC": 0.49423782084861184, "eval_PRM F1 AUC (fixed)": 0.6623886851754844, "eval_PRM F1 Neg": 0.2127659574468085, "eval_PRM NPV": 0.20833333333333334, "eval_PRM Precision": 0.7804878048780488, "eval_PRM Recall": 0.7710843373493976, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7803621888160706, "eval_runtime": 17.4397, "eval_samples_per_second": 2.523, "eval_steps_per_second": 0.172, "step": 100 }, { "epoch": 0.026016679009563063, "grad_norm": 0.2751705039113178, "learning_rate": 2.5964010282776354e-05, "loss": 0.6051, "step": 101 }, { "epoch": 0.026274269890845865, "grad_norm": 0.15155637387832036, "learning_rate": 2.622107969151671e-05, "loss": 0.6747, "step": 102 }, { "epoch": 0.026531860772128667, "grad_norm": 0.1600464407078271, "learning_rate": 2.647814910025707e-05, "loss": 0.7006, "step": 103 }, { "epoch": 0.02678945165341147, "grad_norm": 0.23380101510045495, "learning_rate": 2.673521850899743e-05, "loss": 0.6907, "step": 104 }, { "epoch": 0.027047042534694272, "grad_norm": 0.14430711211952987, "learning_rate": 2.699228791773779e-05, "loss": 0.6556, "step": 105 }, { "epoch": 0.027047042534694272, "eval_PRM Accuracy": 0.7169811320754716, "eval_PRM F1": 0.8255813953488372, "eval_PRM F1 AUC": 0.536406495547407, "eval_PRM F1 AUC (fixed)": 0.6888423258250393, "eval_PRM F1 Neg": 0.25, "eval_PRM NPV": 0.29411764705882354, "eval_PRM Precision": 0.797752808988764, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7592329382896423, "eval_runtime": 17.1101, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 105 }, { "epoch": 0.027304633415977074, "grad_norm": 0.16994724470000197, "learning_rate": 2.724935732647815e-05, "loss": 0.698, "step": 106 }, { "epoch": 0.027562224297259876, "grad_norm": 0.16134048365075782, "learning_rate": 2.750642673521851e-05, "loss": 0.645, "step": 107 }, { "epoch": 0.02781981517854268, "grad_norm": 0.2653647834536006, "learning_rate": 2.7763496143958872e-05, "loss": 0.6954, "step": 108 }, { "epoch": 0.02807740605982548, "grad_norm": 0.17638241330703736, "learning_rate": 2.802056555269923e-05, "loss": 0.6819, "step": 109 }, { "epoch": 0.028334996941108286, "grad_norm": 0.16323739655136751, "learning_rate": 2.827763496143959e-05, "loss": 0.6447, "step": 110 }, { "epoch": 0.028334996941108286, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8390804597701149, "eval_PRM F1 AUC": 0.5484546883184913, "eval_PRM F1 AUC (fixed)": 0.6966998428496595, "eval_PRM F1 Neg": 0.2631578947368421, "eval_PRM NPV": 0.3333333333333333, "eval_PRM Precision": 0.8021978021978022, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.74609375, "eval_runtime": 17.0798, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 110 }, { "epoch": 0.02859258782239109, "grad_norm": 0.1506209775401672, "learning_rate": 2.8534704370179948e-05, "loss": 0.5765, "step": 111 }, { "epoch": 0.02885017870367389, "grad_norm": 0.14607815955008335, "learning_rate": 2.879177377892031e-05, "loss": 0.6372, "step": 112 }, { "epoch": 0.029107769584956693, "grad_norm": 0.11028879698713809, "learning_rate": 2.9048843187660668e-05, "loss": 0.6002, "step": 113 }, { "epoch": 0.029365360466239495, "grad_norm": 0.17922057240268474, "learning_rate": 2.930591259640103e-05, "loss": 0.5136, "step": 114 }, { "epoch": 0.029622951347522297, "grad_norm": 0.16959380501504184, "learning_rate": 2.9562982005141387e-05, "loss": 0.614, "step": 115 }, { "epoch": 0.029622951347522297, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8390804597701149, "eval_PRM F1 AUC": 0.5484546883184913, "eval_PRM F1 AUC (fixed)": 0.7035096909376637, "eval_PRM F1 Neg": 0.2631578947368421, "eval_PRM NPV": 0.3333333333333333, "eval_PRM Precision": 0.8021978021978022, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7341086864471436, "eval_runtime": 16.6553, "eval_samples_per_second": 2.642, "eval_steps_per_second": 0.18, "step": 115 }, { "epoch": 0.0298805422288051, "grad_norm": 0.2248300295432844, "learning_rate": 2.982005141388175e-05, "loss": 0.6829, "step": 116 }, { "epoch": 0.0301381331100879, "grad_norm": 0.22150232284273402, "learning_rate": 3.0077120822622107e-05, "loss": 0.744, "step": 117 }, { "epoch": 0.030395723991370704, "grad_norm": 0.18391270862872763, "learning_rate": 3.033419023136247e-05, "loss": 0.6808, "step": 118 }, { "epoch": 0.03065331487265351, "grad_norm": 0.1333747453787294, "learning_rate": 3.059125964010283e-05, "loss": 0.5939, "step": 119 }, { "epoch": 0.03091090575393631, "grad_norm": 0.17659651459174927, "learning_rate": 3.0848329048843186e-05, "loss": 0.5475, "step": 120 }, { "epoch": 0.03091090575393631, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8457142857142858, "eval_PRM F1 AUC": 0.5544787847040336, "eval_PRM F1 AUC (fixed)": 0.7027239392352016, "eval_PRM F1 Neg": 0.2702702702702703, "eval_PRM NPV": 0.35714285714285715, "eval_PRM Precision": 0.8043478260869565, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7189275622367859, "eval_runtime": 16.9517, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 120 }, { "epoch": 0.031168496635219114, "grad_norm": 0.3410385776056889, "learning_rate": 3.110539845758355e-05, "loss": 0.7182, "step": 121 }, { "epoch": 0.031426087516501916, "grad_norm": 0.18146873113010875, "learning_rate": 3.1362467866323906e-05, "loss": 0.6707, "step": 122 }, { "epoch": 0.03168367839778472, "grad_norm": 0.2941736631364027, "learning_rate": 3.161953727506427e-05, "loss": 0.698, "step": 123 }, { "epoch": 0.03194126927906752, "grad_norm": 0.25172749962097624, "learning_rate": 3.1876606683804625e-05, "loss": 0.7112, "step": 124 }, { "epoch": 0.032198860160350326, "grad_norm": 0.24241984717241033, "learning_rate": 3.213367609254499e-05, "loss": 0.7325, "step": 125 }, { "epoch": 0.032198860160350326, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8390804597701149, "eval_PRM F1 AUC": 0.5484546883184913, "eval_PRM F1 AUC (fixed)": 0.6938187532739655, "eval_PRM F1 Neg": 0.2631578947368421, "eval_PRM NPV": 0.3333333333333333, "eval_PRM Precision": 0.8021978021978022, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.7075639367103577, "eval_runtime": 17.1316, "eval_samples_per_second": 2.568, "eval_steps_per_second": 0.175, "step": 125 }, { "epoch": 0.032456451041633125, "grad_norm": 0.17583196123458156, "learning_rate": 3.2390745501285345e-05, "loss": 0.5292, "step": 126 }, { "epoch": 0.03271404192291593, "grad_norm": 0.12561830177028166, "learning_rate": 3.264781491002571e-05, "loss": 0.5689, "step": 127 }, { "epoch": 0.03297163280419873, "grad_norm": 0.18281597704970667, "learning_rate": 3.2904884318766064e-05, "loss": 0.5399, "step": 128 }, { "epoch": 0.033229223685481535, "grad_norm": 0.21751103957259843, "learning_rate": 3.316195372750643e-05, "loss": 0.5092, "step": 129 }, { "epoch": 0.033486814566764334, "grad_norm": 0.15791030517582452, "learning_rate": 3.341902313624679e-05, "loss": 0.5243, "step": 130 }, { "epoch": 0.033486814566764334, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8488372093023255, "eval_PRM F1 AUC": 0.5919329491880565, "eval_PRM F1 AUC (fixed)": 0.7014143530644317, "eval_PRM F1 Neg": 0.35, "eval_PRM NPV": 0.4117647058823529, "eval_PRM Precision": 0.8202247191011236, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.6996626257896423, "eval_runtime": 16.6179, "eval_samples_per_second": 2.648, "eval_steps_per_second": 0.181, "step": 130 }, { "epoch": 0.03374440544804714, "grad_norm": 0.1437017138457249, "learning_rate": 3.367609254498715e-05, "loss": 0.5331, "step": 131 }, { "epoch": 0.034001996329329945, "grad_norm": 0.14490805162968393, "learning_rate": 3.393316195372751e-05, "loss": 0.6, "step": 132 }, { "epoch": 0.034259587210612744, "grad_norm": 0.2251135432071761, "learning_rate": 3.419023136246787e-05, "loss": 0.4876, "step": 133 }, { "epoch": 0.03451717809189555, "grad_norm": 0.22587653677193498, "learning_rate": 3.444730077120823e-05, "loss": 0.556, "step": 134 }, { "epoch": 0.03477476897317835, "grad_norm": 0.199650036376783, "learning_rate": 3.470437017994859e-05, "loss": 0.5958, "step": 135 }, { "epoch": 0.03477476897317835, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8620689655172413, "eval_PRM F1 AUC": 0.603981141959141, "eval_PRM F1 AUC (fixed)": 0.6723415400733368, "eval_PRM F1 Neg": 0.3684210526315789, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.8241758241758241, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.689453125, "eval_runtime": 17.5521, "eval_samples_per_second": 2.507, "eval_steps_per_second": 0.171, "step": 135 }, { "epoch": 0.035032359854461154, "grad_norm": 0.19518494508973472, "learning_rate": 3.496143958868895e-05, "loss": 0.6123, "step": 136 }, { "epoch": 0.03528995073574395, "grad_norm": 0.1690993363301208, "learning_rate": 3.521850899742931e-05, "loss": 0.5544, "step": 137 }, { "epoch": 0.03554754161702676, "grad_norm": 0.1737907950562536, "learning_rate": 3.547557840616967e-05, "loss": 0.5001, "step": 138 }, { "epoch": 0.03580513249830956, "grad_norm": 0.1282392283643721, "learning_rate": 3.573264781491003e-05, "loss": 0.5336, "step": 139 }, { "epoch": 0.03606272337959236, "grad_norm": 0.21669075712521163, "learning_rate": 3.598971722365039e-05, "loss": 0.604, "step": 140 }, { "epoch": 0.03606272337959236, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.5822420115243583, "eval_PRM F1 AUC (fixed)": 0.6516500785751702, "eval_PRM F1 Neg": 0.32432432432432434, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8152173913043478, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.6690340638160706, "eval_runtime": 16.8763, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 140 }, { "epoch": 0.03632031426087517, "grad_norm": 0.1577628463312436, "learning_rate": 3.624678663239075e-05, "loss": 0.5477, "step": 141 }, { "epoch": 0.03657790514215797, "grad_norm": 0.1957385567890759, "learning_rate": 3.650385604113111e-05, "loss": 0.5437, "step": 142 }, { "epoch": 0.03683549602344077, "grad_norm": 0.34327815211208756, "learning_rate": 3.676092544987147e-05, "loss": 0.5953, "step": 143 }, { "epoch": 0.03709308690472357, "grad_norm": 0.11928570359797404, "learning_rate": 3.701799485861183e-05, "loss": 0.4962, "step": 144 }, { "epoch": 0.03735067778600638, "grad_norm": 0.16179316416758208, "learning_rate": 3.727506426735219e-05, "loss": 0.6005, "step": 145 }, { "epoch": 0.03735067778600638, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.5822420115243583, "eval_PRM F1 AUC (fixed)": 0.6301728653745416, "eval_PRM F1 Neg": 0.32432432432432434, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8152173913043478, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.6517223119735718, "eval_runtime": 17.0935, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.176, "step": 145 }, { "epoch": 0.037608268667289176, "grad_norm": 0.13622294794337028, "learning_rate": 3.753213367609255e-05, "loss": 0.5442, "step": 146 }, { "epoch": 0.03786585954857198, "grad_norm": 0.13886661014337287, "learning_rate": 3.7789203084832907e-05, "loss": 0.5566, "step": 147 }, { "epoch": 0.03812345042985478, "grad_norm": 0.145838887872212, "learning_rate": 3.8046272493573266e-05, "loss": 0.5534, "step": 148 }, { "epoch": 0.038381041311137586, "grad_norm": 0.18946670795108495, "learning_rate": 3.8303341902313626e-05, "loss": 0.6256, "step": 149 }, { "epoch": 0.03863863219242039, "grad_norm": 0.20180324974205688, "learning_rate": 3.8560411311053986e-05, "loss": 0.5303, "step": 150 }, { "epoch": 0.03863863219242039, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8505747126436781, "eval_PRM F1 AUC": 0.5762179151388162, "eval_PRM F1 AUC (fixed)": 0.6178627553693034, "eval_PRM F1 Neg": 0.3157894736842105, "eval_PRM NPV": 0.4, "eval_PRM Precision": 0.8131868131868132, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.6471946239471436, "eval_runtime": 17.1495, "eval_samples_per_second": 2.566, "eval_steps_per_second": 0.175, "step": 150 }, { "epoch": 0.03889622307370319, "grad_norm": 0.17344820652015194, "learning_rate": 3.8817480719794346e-05, "loss": 0.5943, "step": 151 }, { "epoch": 0.039153813954985996, "grad_norm": 0.20036484625544604, "learning_rate": 3.9074550128534705e-05, "loss": 0.64, "step": 152 }, { "epoch": 0.039411404836268794, "grad_norm": 0.16136704047855727, "learning_rate": 3.9331619537275065e-05, "loss": 0.5454, "step": 153 }, { "epoch": 0.0396689957175516, "grad_norm": 0.1777827118898286, "learning_rate": 3.958868894601543e-05, "loss": 0.6094, "step": 154 }, { "epoch": 0.0399265865988344, "grad_norm": 0.21171085806417575, "learning_rate": 3.9845758354755785e-05, "loss": 0.5181, "step": 155 }, { "epoch": 0.0399265865988344, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8457142857142858, "eval_PRM F1 AUC": 0.5544787847040336, "eval_PRM F1 AUC (fixed)": 0.6107909900471451, "eval_PRM F1 Neg": 0.2702702702702703, "eval_PRM NPV": 0.35714285714285715, "eval_PRM Precision": 0.8043478260869565, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6313032507896423, "eval_runtime": 16.9858, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 155 }, { "epoch": 0.040184177480117204, "grad_norm": 0.20510483630161375, "learning_rate": 4.010282776349615e-05, "loss": 0.5175, "step": 156 }, { "epoch": 0.0404417683614, "grad_norm": 0.18133337619171275, "learning_rate": 4.0359897172236504e-05, "loss": 0.5717, "step": 157 }, { "epoch": 0.04069935924268281, "grad_norm": 0.1871920902034855, "learning_rate": 4.0616966580976864e-05, "loss": 0.6009, "step": 158 }, { "epoch": 0.040956950123965614, "grad_norm": 0.17194399767251453, "learning_rate": 4.0874035989717224e-05, "loss": 0.5983, "step": 159 }, { "epoch": 0.04121454100524841, "grad_norm": 0.1666284581443205, "learning_rate": 4.1131105398457584e-05, "loss": 0.5631, "step": 160 }, { "epoch": 0.04121454100524841, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8522727272727273, "eval_PRM F1 AUC": 0.5605028810895757, "eval_PRM F1 AUC (fixed)": 0.6228391828182295, "eval_PRM F1 Neg": 0.2777777777777778, "eval_PRM NPV": 0.38461538461538464, "eval_PRM Precision": 0.8064516129032258, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6287286877632141, "eval_runtime": 16.49, "eval_samples_per_second": 2.668, "eval_steps_per_second": 0.182, "step": 160 }, { "epoch": 0.04147213188653122, "grad_norm": 0.21052057136365077, "learning_rate": 4.138817480719794e-05, "loss": 0.5887, "step": 161 }, { "epoch": 0.04172972276781402, "grad_norm": 0.21938375593646936, "learning_rate": 4.16452442159383e-05, "loss": 0.5515, "step": 162 }, { "epoch": 0.04198731364909682, "grad_norm": 0.14346442996636397, "learning_rate": 4.190231362467866e-05, "loss": 0.5208, "step": 163 }, { "epoch": 0.04224490453037962, "grad_norm": 0.17280297410417816, "learning_rate": 4.215938303341902e-05, "loss": 0.5494, "step": 164 }, { "epoch": 0.04250249541166243, "grad_norm": 0.18553608850146194, "learning_rate": 4.241645244215938e-05, "loss": 0.5496, "step": 165 }, { "epoch": 0.04250249541166243, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8522727272727273, "eval_PRM F1 AUC": 0.5605028810895757, "eval_PRM F1 AUC (fixed)": 0.6401257202723938, "eval_PRM F1 Neg": 0.2777777777777778, "eval_PRM NPV": 0.38461538461538464, "eval_PRM Precision": 0.8064516129032258, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6214488744735718, "eval_runtime": 16.7717, "eval_samples_per_second": 2.623, "eval_steps_per_second": 0.179, "step": 165 }, { "epoch": 0.042760086292945226, "grad_norm": 0.22973312336297122, "learning_rate": 4.267352185089974e-05, "loss": 0.658, "step": 166 }, { "epoch": 0.04301767717422803, "grad_norm": 0.1572748222187082, "learning_rate": 4.293059125964011e-05, "loss": 0.5497, "step": 167 }, { "epoch": 0.04327526805551084, "grad_norm": 0.18099893100798864, "learning_rate": 4.318766066838046e-05, "loss": 0.5671, "step": 168 }, { "epoch": 0.043532858936793636, "grad_norm": 0.15191452042169454, "learning_rate": 4.344473007712083e-05, "loss": 0.6038, "step": 169 }, { "epoch": 0.04379044981807644, "grad_norm": 0.1595819560196266, "learning_rate": 4.370179948586118e-05, "loss": 0.5616, "step": 170 }, { "epoch": 0.04379044981807644, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8522727272727273, "eval_PRM F1 AUC": 0.5605028810895757, "eval_PRM F1 AUC (fixed)": 0.6521739130434784, "eval_PRM F1 Neg": 0.2777777777777778, "eval_PRM NPV": 0.38461538461538464, "eval_PRM Precision": 0.8064516129032258, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6329900622367859, "eval_runtime": 17.0935, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.176, "step": 170 }, { "epoch": 0.04404804069935924, "grad_norm": 0.2408434536317289, "learning_rate": 4.395886889460155e-05, "loss": 0.5432, "step": 171 }, { "epoch": 0.044305631580642046, "grad_norm": 0.20680214058942292, "learning_rate": 4.42159383033419e-05, "loss": 0.6017, "step": 172 }, { "epoch": 0.044563222461924845, "grad_norm": 0.25443080851012156, "learning_rate": 4.447300771208227e-05, "loss": 0.4998, "step": 173 }, { "epoch": 0.04482081334320765, "grad_norm": 0.17377601032094642, "learning_rate": 4.473007712082262e-05, "loss": 0.5089, "step": 174 }, { "epoch": 0.045078404224490456, "grad_norm": 0.2147853738228081, "learning_rate": 4.498714652956299e-05, "loss": 0.5058, "step": 175 }, { "epoch": 0.045078404224490456, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8522727272727273, "eval_PRM F1 AUC": 0.5605028810895757, "eval_PRM F1 AUC (fixed)": 0.6634363541121004, "eval_PRM F1 Neg": 0.2777777777777778, "eval_PRM NPV": 0.38461538461538464, "eval_PRM Precision": 0.8064516129032258, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6369850635528564, "eval_runtime": 16.863, "eval_samples_per_second": 2.609, "eval_steps_per_second": 0.178, "step": 175 }, { "epoch": 0.045335995105773255, "grad_norm": 0.13027365748855715, "learning_rate": 4.524421593830334e-05, "loss": 0.517, "step": 176 }, { "epoch": 0.04559358598705606, "grad_norm": 0.22194880042454274, "learning_rate": 4.5501285347043706e-05, "loss": 0.5184, "step": 177 }, { "epoch": 0.04585117686833886, "grad_norm": 0.1201654331374536, "learning_rate": 4.5758354755784066e-05, "loss": 0.4867, "step": 178 }, { "epoch": 0.046108767749621665, "grad_norm": 0.1419265185911942, "learning_rate": 4.6015424164524426e-05, "loss": 0.4879, "step": 179 }, { "epoch": 0.046366358630904464, "grad_norm": 0.19508743917911098, "learning_rate": 4.6272493573264786e-05, "loss": 0.5609, "step": 180 }, { "epoch": 0.046366358630904464, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8587570621468926, "eval_PRM F1 AUC": 0.5665269774751178, "eval_PRM F1 AUC (fixed)": 0.675746464117339, "eval_PRM F1 Neg": 0.2857142857142857, "eval_PRM NPV": 0.4166666666666667, "eval_PRM Precision": 0.8085106382978723, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6448863744735718, "eval_runtime": 17.663, "eval_samples_per_second": 2.491, "eval_steps_per_second": 0.17, "step": 180 }, { "epoch": 0.04662394951218727, "grad_norm": 0.12196010428542023, "learning_rate": 4.6529562982005145e-05, "loss": 0.471, "step": 181 }, { "epoch": 0.04688154039347007, "grad_norm": 0.33326680032877204, "learning_rate": 4.6786632390745505e-05, "loss": 0.581, "step": 182 }, { "epoch": 0.047139131274752874, "grad_norm": 0.25584323648190144, "learning_rate": 4.7043701799485865e-05, "loss": 0.5435, "step": 183 }, { "epoch": 0.04739672215603568, "grad_norm": 0.11011166578542346, "learning_rate": 4.7300771208226225e-05, "loss": 0.505, "step": 184 }, { "epoch": 0.04765431303731848, "grad_norm": 0.16707489898231329, "learning_rate": 4.7557840616966585e-05, "loss": 0.4837, "step": 185 }, { "epoch": 0.04765431303731848, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8457142857142858, "eval_PRM F1 AUC": 0.5544787847040336, "eval_PRM F1 AUC (fixed)": 0.6534834992142483, "eval_PRM F1 Neg": 0.2702702702702703, "eval_PRM NPV": 0.35714285714285715, "eval_PRM Precision": 0.8043478260869565, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.6431108117103577, "eval_runtime": 17.5114, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 185 }, { "epoch": 0.047911903918601284, "grad_norm": 0.17587624111548597, "learning_rate": 4.7814910025706944e-05, "loss": 0.5467, "step": 186 }, { "epoch": 0.04816949479988408, "grad_norm": 0.19117636640584607, "learning_rate": 4.80719794344473e-05, "loss": 0.6088, "step": 187 }, { "epoch": 0.04842708568116689, "grad_norm": 0.27902750971709495, "learning_rate": 4.8329048843187664e-05, "loss": 0.5144, "step": 188 }, { "epoch": 0.04868467656244969, "grad_norm": 0.27614020164141406, "learning_rate": 4.8586118251928024e-05, "loss": 0.5848, "step": 189 }, { "epoch": 0.04894226744373249, "grad_norm": 0.12391760470283836, "learning_rate": 4.8843187660668383e-05, "loss": 0.5527, "step": 190 }, { "epoch": 0.04894226744373249, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8439306358381503, "eval_PRM F1 AUC": 0.570193818753274, "eval_PRM F1 AUC (fixed)": 0.6705081194342588, "eval_PRM F1 Neg": 0.3076923076923077, "eval_PRM NPV": 0.375, "eval_PRM Precision": 0.8111111111111111, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.6265092492103577, "eval_runtime": 17.0122, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 190 }, { "epoch": 0.04919985832501529, "grad_norm": 0.18230305229504676, "learning_rate": 4.910025706940874e-05, "loss": 0.5101, "step": 191 }, { "epoch": 0.0494574492062981, "grad_norm": 0.14939867870353327, "learning_rate": 4.93573264781491e-05, "loss": 0.4885, "step": 192 }, { "epoch": 0.0497150400875809, "grad_norm": 0.15376505013710523, "learning_rate": 4.961439588688946e-05, "loss": 0.5303, "step": 193 }, { "epoch": 0.0499726309688637, "grad_norm": 0.216981670871264, "learning_rate": 4.987146529562982e-05, "loss": 0.6049, "step": 194 }, { "epoch": 0.05023022185014651, "grad_norm": 0.14011671701536713, "learning_rate": 5.0128534704370176e-05, "loss": 0.54, "step": 195 }, { "epoch": 0.05023022185014651, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.5822420115243583, "eval_PRM F1 AUC (fixed)": 0.7087480356207438, "eval_PRM F1 Neg": 0.32432432432432434, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8152173913043478, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.5909978747367859, "eval_runtime": 17.519, "eval_samples_per_second": 2.512, "eval_steps_per_second": 0.171, "step": 195 }, { "epoch": 0.050487812731429306, "grad_norm": 0.22826829120034348, "learning_rate": 5.038560411311054e-05, "loss": 0.5765, "step": 196 }, { "epoch": 0.05074540361271211, "grad_norm": 0.21625936802289172, "learning_rate": 5.06426735218509e-05, "loss": 0.5026, "step": 197 }, { "epoch": 0.05100299449399491, "grad_norm": 0.19028664549112714, "learning_rate": 5.089974293059127e-05, "loss": 0.5394, "step": 198 }, { "epoch": 0.051260585375277716, "grad_norm": 0.3262015631593359, "learning_rate": 5.1156812339331615e-05, "loss": 0.519, "step": 199 }, { "epoch": 0.051518176256560515, "grad_norm": 0.11477844217568366, "learning_rate": 5.141388174807198e-05, "loss": 0.4944, "step": 200 }, { "epoch": 0.051518176256560515, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.7331063383970665, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5600141882896423, "eval_runtime": 17.1617, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 200 }, { "epoch": 0.05177576713784332, "grad_norm": 0.3919582988603975, "learning_rate": 5.167095115681234e-05, "loss": 0.6725, "step": 201 }, { "epoch": 0.052033358019126126, "grad_norm": 0.20025984006238126, "learning_rate": 5.192802056555271e-05, "loss": 0.5165, "step": 202 }, { "epoch": 0.052290948900408925, "grad_norm": 0.15210250661984012, "learning_rate": 5.218508997429307e-05, "loss": 0.5468, "step": 203 }, { "epoch": 0.05254853978169173, "grad_norm": 0.27397062971036523, "learning_rate": 5.244215938303342e-05, "loss": 0.5573, "step": 204 }, { "epoch": 0.05280613066297453, "grad_norm": 0.18224360121284594, "learning_rate": 5.269922879177378e-05, "loss": 0.4792, "step": 205 }, { "epoch": 0.05280613066297453, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.7197485594552121, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.5475852489471436, "eval_runtime": 16.9112, "eval_samples_per_second": 2.602, "eval_steps_per_second": 0.177, "step": 205 }, { "epoch": 0.053063721544257335, "grad_norm": 0.20525005870193092, "learning_rate": 5.295629820051414e-05, "loss": 0.4962, "step": 206 }, { "epoch": 0.053321312425540134, "grad_norm": 0.17402891163467932, "learning_rate": 5.3213367609254506e-05, "loss": 0.5267, "step": 207 }, { "epoch": 0.05357890330682294, "grad_norm": 0.14500449921623598, "learning_rate": 5.347043701799486e-05, "loss": 0.5612, "step": 208 }, { "epoch": 0.05383649418810574, "grad_norm": 0.16198022248602326, "learning_rate": 5.372750642673522e-05, "loss": 0.5399, "step": 209 }, { "epoch": 0.054094085069388544, "grad_norm": 0.15496428916089364, "learning_rate": 5.398457583547558e-05, "loss": 0.5199, "step": 210 }, { "epoch": 0.054094085069388544, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8654970760233918, "eval_PRM F1 AUC": 0.6414353064431639, "eval_PRM F1 AUC (fixed)": 0.7215819800942902, "eval_PRM F1 Neg": 0.43902439024390244, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8409090909090909, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5378196239471436, "eval_runtime": 17.6253, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 210 }, { "epoch": 0.05435167595067135, "grad_norm": 0.436910825313582, "learning_rate": 5.4241645244215945e-05, "loss": 0.6318, "step": 211 }, { "epoch": 0.05460926683195415, "grad_norm": 0.2897191331840822, "learning_rate": 5.44987146529563e-05, "loss": 0.5377, "step": 212 }, { "epoch": 0.054866857713236954, "grad_norm": 0.3838210085323777, "learning_rate": 5.475578406169666e-05, "loss": 0.5229, "step": 213 }, { "epoch": 0.05512444859451975, "grad_norm": 0.4637490252762357, "learning_rate": 5.501285347043702e-05, "loss": 0.5073, "step": 214 }, { "epoch": 0.05538203947580256, "grad_norm": 0.15810671328944453, "learning_rate": 5.5269922879177384e-05, "loss": 0.4763, "step": 215 }, { "epoch": 0.05538203947580256, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8636363636363636, "eval_PRM F1 AUC": 0.5882661079099004, "eval_PRM F1 AUC (fixed)": 0.7239392352016762, "eval_PRM F1 Neg": 0.3333333333333333, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8172043010752689, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.5299183130264282, "eval_runtime": 17.0014, "eval_samples_per_second": 2.588, "eval_steps_per_second": 0.176, "step": 215 }, { "epoch": 0.05563963035708536, "grad_norm": 0.4476009281604352, "learning_rate": 5.5526992287917744e-05, "loss": 0.5594, "step": 216 }, { "epoch": 0.05589722123836816, "grad_norm": 0.2701973988481393, "learning_rate": 5.57840616966581e-05, "loss": 0.4743, "step": 217 }, { "epoch": 0.05615481211965096, "grad_norm": 0.1421632646461717, "learning_rate": 5.604113110539846e-05, "loss": 0.435, "step": 218 }, { "epoch": 0.05641240300093377, "grad_norm": 0.5948202730941377, "learning_rate": 5.6298200514138824e-05, "loss": 0.6366, "step": 219 }, { "epoch": 0.05666999388221657, "grad_norm": 0.12451088214003082, "learning_rate": 5.655526992287918e-05, "loss": 0.5212, "step": 220 }, { "epoch": 0.05666999388221657, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.6754845468831849, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.5504261255264282, "eval_runtime": 17.0565, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 220 }, { "epoch": 0.05692758476349937, "grad_norm": 0.1841339331757701, "learning_rate": 5.6812339331619536e-05, "loss": 0.5201, "step": 221 }, { "epoch": 0.05718517564478218, "grad_norm": 0.15766870880702374, "learning_rate": 5.7069408740359896e-05, "loss": 0.5535, "step": 222 }, { "epoch": 0.057442766526064976, "grad_norm": 0.34635960046526604, "learning_rate": 5.732647814910026e-05, "loss": 0.5202, "step": 223 }, { "epoch": 0.05770035740734778, "grad_norm": 0.15507165670686024, "learning_rate": 5.758354755784062e-05, "loss": 0.5782, "step": 224 }, { "epoch": 0.05795794828863058, "grad_norm": 0.43365069148784935, "learning_rate": 5.784061696658098e-05, "loss": 0.4763, "step": 225 }, { "epoch": 0.05795794828863058, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.6621267679413304, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.5637428760528564, "eval_runtime": 17.5764, "eval_samples_per_second": 2.503, "eval_steps_per_second": 0.171, "step": 225 }, { "epoch": 0.058215539169913386, "grad_norm": 0.2013790839200976, "learning_rate": 5.8097686375321335e-05, "loss": 0.5569, "step": 226 }, { "epoch": 0.058473130051196184, "grad_norm": 0.15673506859796787, "learning_rate": 5.83547557840617e-05, "loss": 0.5573, "step": 227 }, { "epoch": 0.05873072093247899, "grad_norm": 0.16446603185548572, "learning_rate": 5.861182519280206e-05, "loss": 0.4557, "step": 228 }, { "epoch": 0.058988311813761796, "grad_norm": 0.16674151902274725, "learning_rate": 5.886889460154242e-05, "loss": 0.5435, "step": 229 }, { "epoch": 0.059245902695044594, "grad_norm": 0.44763981190896424, "learning_rate": 5.9125964010282774e-05, "loss": 0.6425, "step": 230 }, { "epoch": 0.059245902695044594, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8651685393258427, "eval_PRM F1 AUC": 0.5725510738606601, "eval_PRM F1 AUC (fixed)": 0.6715557883708748, "eval_PRM F1 Neg": 0.29411764705882354, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8105263157894737, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.5692471861839294, "eval_runtime": 17.6565, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 230 }, { "epoch": 0.0595034935763274, "grad_norm": 0.3865276731777879, "learning_rate": 5.938303341902314e-05, "loss": 0.602, "step": 231 }, { "epoch": 0.0597610844576102, "grad_norm": 0.19317431407242922, "learning_rate": 5.96401028277635e-05, "loss": 0.5172, "step": 232 }, { "epoch": 0.060018675338893004, "grad_norm": 0.31992841830574215, "learning_rate": 5.989717223650386e-05, "loss": 0.5868, "step": 233 }, { "epoch": 0.0602762662201758, "grad_norm": 0.24461145860871872, "learning_rate": 6.015424164524421e-05, "loss": 0.5603, "step": 234 }, { "epoch": 0.06053385710145861, "grad_norm": 0.37559403960763693, "learning_rate": 6.041131105398457e-05, "loss": 0.5213, "step": 235 }, { "epoch": 0.06053385710145861, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.6485070717653222, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.5836292505264282, "eval_runtime": 16.7984, "eval_samples_per_second": 2.619, "eval_steps_per_second": 0.179, "step": 235 }, { "epoch": 0.06079144798274141, "grad_norm": 0.3548402709301409, "learning_rate": 6.066838046272494e-05, "loss": 0.5582, "step": 236 }, { "epoch": 0.06104903886402421, "grad_norm": 0.2700186776159584, "learning_rate": 6.09254498714653e-05, "loss": 0.561, "step": 237 }, { "epoch": 0.06130662974530702, "grad_norm": 0.3067782651988573, "learning_rate": 6.118251928020567e-05, "loss": 0.5305, "step": 238 }, { "epoch": 0.06156422062658982, "grad_norm": 0.14653523252095751, "learning_rate": 6.143958868894601e-05, "loss": 0.6073, "step": 239 }, { "epoch": 0.06182181150787262, "grad_norm": 0.13770574831638763, "learning_rate": 6.169665809768637e-05, "loss": 0.504, "step": 240 }, { "epoch": 0.06182181150787262, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8620689655172413, "eval_PRM F1 AUC": 0.603981141959141, "eval_PRM F1 AUC (fixed)": 0.6778418019905709, "eval_PRM F1 Neg": 0.3684210526315789, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.8241758241758241, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.5587713122367859, "eval_runtime": 17.1152, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 240 }, { "epoch": 0.06207940238915542, "grad_norm": 0.1283887217522403, "learning_rate": 6.195372750642675e-05, "loss": 0.4758, "step": 241 }, { "epoch": 0.06233699327043823, "grad_norm": 0.21609156979166783, "learning_rate": 6.22107969151671e-05, "loss": 0.5711, "step": 242 }, { "epoch": 0.06259458415172103, "grad_norm": 0.3386230953661476, "learning_rate": 6.246786632390745e-05, "loss": 0.5613, "step": 243 }, { "epoch": 0.06285217503300383, "grad_norm": 0.38505594758831063, "learning_rate": 6.272493573264781e-05, "loss": 0.5799, "step": 244 }, { "epoch": 0.06310976591428663, "grad_norm": 0.16759711903062344, "learning_rate": 6.298200514138818e-05, "loss": 0.5271, "step": 245 }, { "epoch": 0.06310976591428663, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8654970760233918, "eval_PRM F1 AUC": 0.6414353064431639, "eval_PRM F1 AUC (fixed)": 0.7008905185961236, "eval_PRM F1 Neg": 0.43902439024390244, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8409090909090909, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5464311242103577, "eval_runtime": 16.8753, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 245 }, { "epoch": 0.06336735679556944, "grad_norm": 0.12542045779339983, "learning_rate": 6.323907455012854e-05, "loss": 0.4813, "step": 246 }, { "epoch": 0.06362494767685224, "grad_norm": 0.16724161788396594, "learning_rate": 6.349614395886889e-05, "loss": 0.5576, "step": 247 }, { "epoch": 0.06388253855813504, "grad_norm": 0.3158126157988567, "learning_rate": 6.375321336760925e-05, "loss": 0.4747, "step": 248 }, { "epoch": 0.06414012943941784, "grad_norm": 0.1736000309785114, "learning_rate": 6.401028277634962e-05, "loss": 0.6067, "step": 249 }, { "epoch": 0.06439772032070065, "grad_norm": 0.21226162587716332, "learning_rate": 6.426735218508998e-05, "loss": 0.5219, "step": 250 }, { "epoch": 0.06439772032070065, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8588235294117647, "eval_PRM F1 AUC": 0.6354112100576217, "eval_PRM F1 AUC (fixed)": 0.7438449449973809, "eval_PRM F1 Neg": 0.42857142857142855, "eval_PRM NPV": 0.47368421052631576, "eval_PRM Precision": 0.8390804597701149, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5482954382896423, "eval_runtime": 16.9192, "eval_samples_per_second": 2.601, "eval_steps_per_second": 0.177, "step": 250 }, { "epoch": 0.06465531120198345, "grad_norm": 0.13892867414826318, "learning_rate": 6.452442159383034e-05, "loss": 0.5696, "step": 251 }, { "epoch": 0.06491290208326625, "grad_norm": 0.1640446225625932, "learning_rate": 6.478149100257069e-05, "loss": 0.4941, "step": 252 }, { "epoch": 0.06517049296454905, "grad_norm": 0.19644889538110213, "learning_rate": 6.503856041131106e-05, "loss": 0.4646, "step": 253 }, { "epoch": 0.06542808384583186, "grad_norm": 0.12623396704485648, "learning_rate": 6.529562982005142e-05, "loss": 0.4902, "step": 254 }, { "epoch": 0.06568567472711466, "grad_norm": 0.37328774995275477, "learning_rate": 6.555269922879178e-05, "loss": 0.5717, "step": 255 }, { "epoch": 0.06568567472711466, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 AUC (fixed)": 0.7477737035096909, "eval_PRM F1 Neg": 0.45, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.52734375, "eval_runtime": 16.8308, "eval_samples_per_second": 2.614, "eval_steps_per_second": 0.178, "step": 255 }, { "epoch": 0.06594326560839746, "grad_norm": 0.1780495633275393, "learning_rate": 6.580976863753213e-05, "loss": 0.4941, "step": 256 }, { "epoch": 0.06620085648968027, "grad_norm": 0.11709298160118624, "learning_rate": 6.606683804627249e-05, "loss": 0.446, "step": 257 }, { "epoch": 0.06645844737096307, "grad_norm": 0.22742384727948237, "learning_rate": 6.632390745501286e-05, "loss": 0.5343, "step": 258 }, { "epoch": 0.06671603825224587, "grad_norm": 0.3525115109134476, "learning_rate": 6.658097686375322e-05, "loss": 0.6246, "step": 259 }, { "epoch": 0.06697362913352867, "grad_norm": 0.13905305023867473, "learning_rate": 6.683804627249358e-05, "loss": 0.5392, "step": 260 }, { "epoch": 0.06697362913352867, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.7443687794656889, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.5169566869735718, "eval_runtime": 16.8887, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 260 }, { "epoch": 0.06723122001481148, "grad_norm": 0.2550994314086868, "learning_rate": 6.709511568123393e-05, "loss": 0.523, "step": 261 }, { "epoch": 0.06748881089609428, "grad_norm": 0.15146555618039753, "learning_rate": 6.73521850899743e-05, "loss": 0.5048, "step": 262 }, { "epoch": 0.06774640177737708, "grad_norm": 0.15253291749995698, "learning_rate": 6.760925449871466e-05, "loss": 0.4961, "step": 263 }, { "epoch": 0.06800399265865989, "grad_norm": 0.43476914849618326, "learning_rate": 6.786632390745502e-05, "loss": 0.5021, "step": 264 }, { "epoch": 0.06826158353994269, "grad_norm": 0.32124891429850383, "learning_rate": 6.812339331619537e-05, "loss": 0.5028, "step": 265 }, { "epoch": 0.06826158353994269, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8670520231213873, "eval_PRM F1 AUC": 0.6257202723939235, "eval_PRM F1 AUC (fixed)": 0.7446306966998428, "eval_PRM F1 Neg": 0.41025641025641024, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4966264069080353, "eval_runtime": 17.0258, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 265 }, { "epoch": 0.06851917442122549, "grad_norm": 0.162867154400914, "learning_rate": 6.838046272493574e-05, "loss": 0.4842, "step": 266 }, { "epoch": 0.06877676530250829, "grad_norm": 0.14918316038080082, "learning_rate": 6.86375321336761e-05, "loss": 0.4495, "step": 267 }, { "epoch": 0.0690343561837911, "grad_norm": 0.2300150703660838, "learning_rate": 6.889460154241646e-05, "loss": 0.4673, "step": 268 }, { "epoch": 0.0692919470650739, "grad_norm": 0.3563895827847831, "learning_rate": 6.91516709511568e-05, "loss": 0.5033, "step": 269 }, { "epoch": 0.0695495379463567, "grad_norm": 0.24816829885221428, "learning_rate": 6.940874035989718e-05, "loss": 0.4763, "step": 270 }, { "epoch": 0.0695495379463567, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8777777777777778, "eval_PRM F1 AUC": 0.5845992666317443, "eval_PRM F1 AUC (fixed)": 0.7312729177579885, "eval_PRM F1 Neg": 0.3125, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8144329896907216, "eval_PRM Recall": 0.9518072289156626, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.5363103747367859, "eval_runtime": 16.8444, "eval_samples_per_second": 2.612, "eval_steps_per_second": 0.178, "step": 270 }, { "epoch": 0.0698071288276395, "grad_norm": 0.20710898097106806, "learning_rate": 6.966580976863754e-05, "loss": 0.4287, "step": 271 }, { "epoch": 0.07006471970892231, "grad_norm": 0.16331721619805295, "learning_rate": 6.99228791773779e-05, "loss": 0.5094, "step": 272 }, { "epoch": 0.0703223105902051, "grad_norm": 0.21991072828461247, "learning_rate": 7.017994858611826e-05, "loss": 0.5333, "step": 273 }, { "epoch": 0.0705799014714879, "grad_norm": 0.24534823629429503, "learning_rate": 7.043701799485862e-05, "loss": 0.4432, "step": 274 }, { "epoch": 0.07083749235277072, "grad_norm": 0.21465182821802084, "learning_rate": 7.069408740359898e-05, "loss": 0.4929, "step": 275 }, { "epoch": 0.07083749235277072, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8670520231213873, "eval_PRM F1 AUC": 0.6257202723939235, "eval_PRM F1 AUC (fixed)": 0.6969617600838135, "eval_PRM F1 Neg": 0.41025641025641024, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.5442116260528564, "eval_runtime": 17.6229, "eval_samples_per_second": 2.497, "eval_steps_per_second": 0.17, "step": 275 }, { "epoch": 0.07109508323405352, "grad_norm": 0.1793598661907607, "learning_rate": 7.095115681233934e-05, "loss": 0.5492, "step": 276 }, { "epoch": 0.07135267411533631, "grad_norm": 0.17143285615075915, "learning_rate": 7.12082262210797e-05, "loss": 0.5534, "step": 277 }, { "epoch": 0.07161026499661911, "grad_norm": 0.2469125643196871, "learning_rate": 7.146529562982006e-05, "loss": 0.5975, "step": 278 }, { "epoch": 0.07186785587790193, "grad_norm": 0.14719122802287674, "learning_rate": 7.172236503856042e-05, "loss": 0.4844, "step": 279 }, { "epoch": 0.07212544675918472, "grad_norm": 0.1696968253057401, "learning_rate": 7.197943444730078e-05, "loss": 0.5158, "step": 280 }, { "epoch": 0.07212544675918472, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8620689655172413, "eval_PRM F1 AUC": 0.603981141959141, "eval_PRM F1 AUC (fixed)": 0.71896280775275, "eval_PRM F1 Neg": 0.3684210526315789, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.8241758241758241, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.5271661877632141, "eval_runtime": 16.8876, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 280 }, { "epoch": 0.07238303764046752, "grad_norm": 0.1706507869315982, "learning_rate": 7.223650385604114e-05, "loss": 0.4266, "step": 281 }, { "epoch": 0.07264062852175034, "grad_norm": 0.2100734027971624, "learning_rate": 7.24935732647815e-05, "loss": 0.4214, "step": 282 }, { "epoch": 0.07289821940303313, "grad_norm": 0.14440703342832992, "learning_rate": 7.275064267352186e-05, "loss": 0.4344, "step": 283 }, { "epoch": 0.07315581028431593, "grad_norm": 0.31252968871494025, "learning_rate": 7.300771208226222e-05, "loss": 0.4995, "step": 284 }, { "epoch": 0.07341340116559873, "grad_norm": 0.27899350152206936, "learning_rate": 7.326478149100258e-05, "loss": 0.4469, "step": 285 }, { "epoch": 0.07341340116559873, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8863636363636364, "eval_PRM F1 AUC": 0.6437925615505501, "eval_PRM F1 AUC (fixed)": 0.7226296490309063, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.8387096774193549, "eval_PRM Recall": 0.9397590361445783, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.5223721861839294, "eval_runtime": 17.2517, "eval_samples_per_second": 2.55, "eval_steps_per_second": 0.174, "step": 285 }, { "epoch": 0.07367099204688154, "grad_norm": 0.12494071200070458, "learning_rate": 7.352185089974293e-05, "loss": 0.4027, "step": 286 }, { "epoch": 0.07392858292816434, "grad_norm": 0.1112248386342243, "learning_rate": 7.37789203084833e-05, "loss": 0.3726, "step": 287 }, { "epoch": 0.07418617380944714, "grad_norm": 0.18876716539073077, "learning_rate": 7.403598971722365e-05, "loss": 0.5424, "step": 288 }, { "epoch": 0.07444376469072995, "grad_norm": 0.1920065960733905, "learning_rate": 7.429305912596401e-05, "loss": 0.5358, "step": 289 }, { "epoch": 0.07470135557201275, "grad_norm": 0.2045492546397632, "learning_rate": 7.455012853470437e-05, "loss": 0.442, "step": 290 }, { "epoch": 0.07470135557201275, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.6995809324253537, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.5240589380264282, "eval_runtime": 17.1062, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 290 }, { "epoch": 0.07495894645329555, "grad_norm": 0.16046214096233113, "learning_rate": 7.480719794344473e-05, "loss": 0.4934, "step": 291 }, { "epoch": 0.07521653733457835, "grad_norm": 0.6238046407673321, "learning_rate": 7.50642673521851e-05, "loss": 0.7382, "step": 292 }, { "epoch": 0.07547412821586116, "grad_norm": 0.17549546735039195, "learning_rate": 7.532133676092545e-05, "loss": 0.5593, "step": 293 }, { "epoch": 0.07573171909714396, "grad_norm": 0.1967124652316382, "learning_rate": 7.557840616966581e-05, "loss": 0.5642, "step": 294 }, { "epoch": 0.07598930997842676, "grad_norm": 0.16580167435656418, "learning_rate": 7.583547557840617e-05, "loss": 0.5569, "step": 295 }, { "epoch": 0.07598930997842676, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8588235294117647, "eval_PRM F1 AUC": 0.6354112100576217, "eval_PRM F1 AUC (fixed)": 0.713462545835516, "eval_PRM F1 Neg": 0.42857142857142855, "eval_PRM NPV": 0.47368421052631576, "eval_PRM Precision": 0.8390804597701149, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.49289771914482117, "eval_runtime": 17.1859, "eval_samples_per_second": 2.56, "eval_steps_per_second": 0.175, "step": 295 }, { "epoch": 0.07624690085970956, "grad_norm": 0.21994863274227455, "learning_rate": 7.609254498714653e-05, "loss": 0.5487, "step": 296 }, { "epoch": 0.07650449174099237, "grad_norm": 0.2156652299798949, "learning_rate": 7.634961439588689e-05, "loss": 0.5034, "step": 297 }, { "epoch": 0.07676208262227517, "grad_norm": 0.1764562023351226, "learning_rate": 7.660668380462725e-05, "loss": 0.4057, "step": 298 }, { "epoch": 0.07701967350355797, "grad_norm": 0.3638690402250176, "learning_rate": 7.686375321336761e-05, "loss": 0.488, "step": 299 }, { "epoch": 0.07727726438484078, "grad_norm": 0.21464580532287697, "learning_rate": 7.712082262210797e-05, "loss": 0.4911, "step": 300 }, { "epoch": 0.07727726438484078, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8837209302325582, "eval_PRM F1 AUC": 0.6752226296490309, "eval_PRM F1 AUC (fixed)": 0.7498690413829229, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5882352941176471, "eval_PRM Precision": 0.8539325842696629, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.48464134335517883, "eval_runtime": 16.9244, "eval_samples_per_second": 2.6, "eval_steps_per_second": 0.177, "step": 300 }, { "epoch": 0.07753485526612358, "grad_norm": 0.24989606645527593, "learning_rate": 7.737789203084833e-05, "loss": 0.491, "step": 301 }, { "epoch": 0.07779244614740638, "grad_norm": 0.17008015682999567, "learning_rate": 7.763496143958869e-05, "loss": 0.5051, "step": 302 }, { "epoch": 0.07805003702868918, "grad_norm": 0.23234257722694537, "learning_rate": 7.789203084832905e-05, "loss": 0.4387, "step": 303 }, { "epoch": 0.07830762790997199, "grad_norm": 0.4471915700529444, "learning_rate": 7.814910025706941e-05, "loss": 0.4895, "step": 304 }, { "epoch": 0.07856521879125479, "grad_norm": 0.1909539940652607, "learning_rate": 7.840616966580977e-05, "loss": 0.4711, "step": 305 }, { "epoch": 0.07856521879125479, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.754321634363541, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4754083752632141, "eval_runtime": 16.4783, "eval_samples_per_second": 2.67, "eval_steps_per_second": 0.182, "step": 305 }, { "epoch": 0.07882280967253759, "grad_norm": 0.1901414617608177, "learning_rate": 7.866323907455013e-05, "loss": 0.5136, "step": 306 }, { "epoch": 0.0790804005538204, "grad_norm": 0.15289744085473825, "learning_rate": 7.892030848329049e-05, "loss": 0.46, "step": 307 }, { "epoch": 0.0793379914351032, "grad_norm": 0.49183156079988954, "learning_rate": 7.917737789203086e-05, "loss": 0.5623, "step": 308 }, { "epoch": 0.079595582316386, "grad_norm": 0.19221892418033015, "learning_rate": 7.943444730077121e-05, "loss": 0.4282, "step": 309 }, { "epoch": 0.0798531731976688, "grad_norm": 0.1627104339138911, "learning_rate": 7.969151670951157e-05, "loss": 0.4469, "step": 310 }, { "epoch": 0.0798531731976688, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.7582503928758513, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4630681872367859, "eval_runtime": 16.9331, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 310 }, { "epoch": 0.08011076407895161, "grad_norm": 0.23101435386602684, "learning_rate": 7.994858611825193e-05, "loss": 0.5431, "step": 311 }, { "epoch": 0.08036835496023441, "grad_norm": 0.1644424970244475, "learning_rate": 8.02056555269923e-05, "loss": 0.5075, "step": 312 }, { "epoch": 0.08062594584151721, "grad_norm": 0.17393154987172232, "learning_rate": 8.046272493573265e-05, "loss": 0.5121, "step": 313 }, { "epoch": 0.0808835367228, "grad_norm": 0.26415833785058895, "learning_rate": 8.071979434447301e-05, "loss": 0.5219, "step": 314 }, { "epoch": 0.08114112760408282, "grad_norm": 0.2161597178077126, "learning_rate": 8.097686375321337e-05, "loss": 0.4409, "step": 315 }, { "epoch": 0.08114112760408282, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.7433211105290729, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.46475496888160706, "eval_runtime": 17.6161, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 315 }, { "epoch": 0.08139871848536562, "grad_norm": 0.17659314913801039, "learning_rate": 8.123393316195373e-05, "loss": 0.4659, "step": 316 }, { "epoch": 0.08165630936664842, "grad_norm": 0.17852452080635514, "learning_rate": 8.149100257069409e-05, "loss": 0.4608, "step": 317 }, { "epoch": 0.08191390024793123, "grad_norm": 0.4424697785485204, "learning_rate": 8.174807197943445e-05, "loss": 0.5871, "step": 318 }, { "epoch": 0.08217149112921403, "grad_norm": 0.304091441955501, "learning_rate": 8.200514138817481e-05, "loss": 0.5091, "step": 319 }, { "epoch": 0.08242908201049683, "grad_norm": 0.23297366816849394, "learning_rate": 8.226221079691517e-05, "loss": 0.5074, "step": 320 }, { "epoch": 0.08242908201049683, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 AUC (fixed)": 0.7357255107386066, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4779829680919647, "eval_runtime": 16.997, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 320 }, { "epoch": 0.08268667289177963, "grad_norm": 0.2547077789068634, "learning_rate": 8.251928020565554e-05, "loss": 0.5396, "step": 321 }, { "epoch": 0.08294426377306244, "grad_norm": 0.44000153984608, "learning_rate": 8.277634961439589e-05, "loss": 0.5224, "step": 322 }, { "epoch": 0.08320185465434524, "grad_norm": 0.5322367245105415, "learning_rate": 8.303341902313625e-05, "loss": 0.531, "step": 323 }, { "epoch": 0.08345944553562804, "grad_norm": 0.26523524639758594, "learning_rate": 8.32904884318766e-05, "loss": 0.5288, "step": 324 }, { "epoch": 0.08371703641691085, "grad_norm": 0.1570190072505766, "learning_rate": 8.354755784061698e-05, "loss": 0.4288, "step": 325 }, { "epoch": 0.08371703641691085, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8813559322033898, "eval_PRM F1 AUC": 0.6220534311157675, "eval_PRM F1 AUC (fixed)": 0.7585123101100052, "eval_PRM F1 Neg": 0.4, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8297872340425532, "eval_PRM Recall": 0.9397590361445783, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.4786931872367859, "eval_runtime": 17.1433, "eval_samples_per_second": 2.567, "eval_steps_per_second": 0.175, "step": 325 }, { "epoch": 0.08397462729819365, "grad_norm": 0.33618140885098385, "learning_rate": 8.380462724935733e-05, "loss": 0.5247, "step": 326 }, { "epoch": 0.08423221817947645, "grad_norm": 0.5150239771745091, "learning_rate": 8.406169665809769e-05, "loss": 0.4938, "step": 327 }, { "epoch": 0.08448980906075924, "grad_norm": 0.1479966986338898, "learning_rate": 8.431876606683805e-05, "loss": 0.4333, "step": 328 }, { "epoch": 0.08474739994204206, "grad_norm": 0.4529975613869295, "learning_rate": 8.457583547557842e-05, "loss": 0.6525, "step": 329 }, { "epoch": 0.08500499082332486, "grad_norm": 0.22779612054480836, "learning_rate": 8.483290488431876e-05, "loss": 0.4149, "step": 330 }, { "epoch": 0.08500499082332486, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 AUC (fixed)": 0.7063907805133578, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.5108309388160706, "eval_runtime": 17.6327, "eval_samples_per_second": 2.495, "eval_steps_per_second": 0.17, "step": 330 }, { "epoch": 0.08526258170460765, "grad_norm": 0.3183526216778193, "learning_rate": 8.508997429305912e-05, "loss": 0.5126, "step": 331 }, { "epoch": 0.08552017258589045, "grad_norm": 0.34937345076092335, "learning_rate": 8.534704370179948e-05, "loss": 0.5294, "step": 332 }, { "epoch": 0.08577776346717327, "grad_norm": 0.18557194020464804, "learning_rate": 8.560411311053986e-05, "loss": 0.5316, "step": 333 }, { "epoch": 0.08603535434845606, "grad_norm": 0.22308062600808679, "learning_rate": 8.586118251928022e-05, "loss": 0.4493, "step": 334 }, { "epoch": 0.08629294522973886, "grad_norm": 0.17128889769646718, "learning_rate": 8.611825192802056e-05, "loss": 0.5186, "step": 335 }, { "epoch": 0.08629294522973886, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 AUC (fixed)": 0.7349397590361446, "eval_PRM F1 Neg": 0.45, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4962713122367859, "eval_runtime": 17.0118, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 335 }, { "epoch": 0.08655053611102168, "grad_norm": 0.13729173767184766, "learning_rate": 8.637532133676092e-05, "loss": 0.4542, "step": 336 }, { "epoch": 0.08680812699230447, "grad_norm": 0.13338677993167217, "learning_rate": 8.66323907455013e-05, "loss": 0.432, "step": 337 }, { "epoch": 0.08706571787358727, "grad_norm": 0.341720440183182, "learning_rate": 8.688946015424166e-05, "loss": 0.5322, "step": 338 }, { "epoch": 0.08732330875487007, "grad_norm": 0.2607452444404972, "learning_rate": 8.7146529562982e-05, "loss": 0.4639, "step": 339 }, { "epoch": 0.08758089963615288, "grad_norm": 0.226253128974037, "learning_rate": 8.740359897172236e-05, "loss": 0.4884, "step": 340 }, { "epoch": 0.08758089963615288, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.7606076479832374, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.49129971861839294, "eval_runtime": 17.425, "eval_samples_per_second": 2.525, "eval_steps_per_second": 0.172, "step": 340 }, { "epoch": 0.08783849051743568, "grad_norm": 0.11704984262702216, "learning_rate": 8.766066838046274e-05, "loss": 0.4388, "step": 341 }, { "epoch": 0.08809608139871848, "grad_norm": 0.1414143560135518, "learning_rate": 8.79177377892031e-05, "loss": 0.4522, "step": 342 }, { "epoch": 0.0883536722800013, "grad_norm": 0.18373739576071454, "learning_rate": 8.817480719794346e-05, "loss": 0.4383, "step": 343 }, { "epoch": 0.08861126316128409, "grad_norm": 0.13632975243574016, "learning_rate": 8.84318766066838e-05, "loss": 0.4584, "step": 344 }, { "epoch": 0.08886885404256689, "grad_norm": 0.19694148522854918, "learning_rate": 8.868894601542416e-05, "loss": 0.4785, "step": 345 }, { "epoch": 0.08886885404256689, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.7797276060764798, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4827769994735718, "eval_runtime": 16.9478, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 345 }, { "epoch": 0.08912644492384969, "grad_norm": 0.19209807000617346, "learning_rate": 8.894601542416453e-05, "loss": 0.3847, "step": 346 }, { "epoch": 0.0893840358051325, "grad_norm": 0.191741684622581, "learning_rate": 8.92030848329049e-05, "loss": 0.5368, "step": 347 }, { "epoch": 0.0896416266864153, "grad_norm": 0.21778226831775863, "learning_rate": 8.946015424164524e-05, "loss": 0.4394, "step": 348 }, { "epoch": 0.0898992175676981, "grad_norm": 0.17174001135730832, "learning_rate": 8.97172236503856e-05, "loss": 0.4091, "step": 349 }, { "epoch": 0.09015680844898091, "grad_norm": 0.36807560276385753, "learning_rate": 8.997429305912597e-05, "loss": 0.5305, "step": 350 }, { "epoch": 0.09015680844898091, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8700564971751412, "eval_PRM F1 AUC": 0.5942902042954427, "eval_PRM F1 AUC (fixed)": 0.7786799371398637, "eval_PRM F1 Neg": 0.34285714285714286, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8191489361702128, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.5010653138160706, "eval_runtime": 17.5239, "eval_samples_per_second": 2.511, "eval_steps_per_second": 0.171, "step": 350 }, { "epoch": 0.09041439933026371, "grad_norm": 0.23321715386247485, "learning_rate": 9.023136246786633e-05, "loss": 0.4353, "step": 351 }, { "epoch": 0.09067199021154651, "grad_norm": 0.17565132745255643, "learning_rate": 9.048843187660668e-05, "loss": 0.4594, "step": 352 }, { "epoch": 0.09092958109282931, "grad_norm": 0.1620834651604973, "learning_rate": 9.074550128534704e-05, "loss": 0.4521, "step": 353 }, { "epoch": 0.09118717197411212, "grad_norm": 0.16717604267966277, "learning_rate": 9.100257069408741e-05, "loss": 0.482, "step": 354 }, { "epoch": 0.09144476285539492, "grad_norm": 0.19119680337404393, "learning_rate": 9.125964010282777e-05, "loss": 0.4133, "step": 355 }, { "epoch": 0.09144476285539492, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.7721320062860135, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4742542505264282, "eval_runtime": 17.0982, "eval_samples_per_second": 2.573, "eval_steps_per_second": 0.175, "step": 355 }, { "epoch": 0.09170235373667772, "grad_norm": 0.2030854166064513, "learning_rate": 9.151670951156813e-05, "loss": 0.5278, "step": 356 }, { "epoch": 0.09195994461796052, "grad_norm": 0.31775991598819336, "learning_rate": 9.177377892030848e-05, "loss": 0.5248, "step": 357 }, { "epoch": 0.09221753549924333, "grad_norm": 0.1465016530357859, "learning_rate": 9.203084832904885e-05, "loss": 0.4476, "step": 358 }, { "epoch": 0.09247512638052613, "grad_norm": 0.5093840700812764, "learning_rate": 9.228791773778921e-05, "loss": 0.531, "step": 359 }, { "epoch": 0.09273271726180893, "grad_norm": 0.1894256746900755, "learning_rate": 9.254498714652957e-05, "loss": 0.4719, "step": 360 }, { "epoch": 0.09273271726180893, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.7480356207438449, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4701704680919647, "eval_runtime": 17.525, "eval_samples_per_second": 2.511, "eval_steps_per_second": 0.171, "step": 360 }, { "epoch": 0.09299030814309174, "grad_norm": 0.24605670118769468, "learning_rate": 9.280205655526992e-05, "loss": 0.4204, "step": 361 }, { "epoch": 0.09324789902437454, "grad_norm": 0.2878956035280472, "learning_rate": 9.305912596401029e-05, "loss": 0.5175, "step": 362 }, { "epoch": 0.09350548990565734, "grad_norm": 0.22720435212003723, "learning_rate": 9.331619537275065e-05, "loss": 0.5016, "step": 363 }, { "epoch": 0.09376308078694014, "grad_norm": 0.1813212160080772, "learning_rate": 9.357326478149101e-05, "loss": 0.5415, "step": 364 }, { "epoch": 0.09402067166822295, "grad_norm": 0.2532118573498516, "learning_rate": 9.383033419023136e-05, "loss": 0.5332, "step": 365 }, { "epoch": 0.09402067166822295, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8363636363636363, "eval_PRM F1 AUC": 0.6330539549502358, "eval_PRM F1 AUC (fixed)": 0.6919853326348874, "eval_PRM F1 Neg": 0.425531914893617, "eval_PRM NPV": 0.4166666666666667, "eval_PRM Precision": 0.8414634146341463, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4978693127632141, "eval_runtime": 17.3826, "eval_samples_per_second": 2.531, "eval_steps_per_second": 0.173, "step": 365 }, { "epoch": 0.09427826254950575, "grad_norm": 0.32231507285137934, "learning_rate": 9.408740359897173e-05, "loss": 0.4908, "step": 366 }, { "epoch": 0.09453585343078855, "grad_norm": 0.2351720611467643, "learning_rate": 9.434447300771209e-05, "loss": 0.4, "step": 367 }, { "epoch": 0.09479344431207136, "grad_norm": 0.23792876503320465, "learning_rate": 9.460154241645245e-05, "loss": 0.5383, "step": 368 }, { "epoch": 0.09505103519335416, "grad_norm": 0.2643414916238337, "learning_rate": 9.485861182519281e-05, "loss": 0.5193, "step": 369 }, { "epoch": 0.09530862607463696, "grad_norm": 0.45021787781807343, "learning_rate": 9.511568123393317e-05, "loss": 0.5659, "step": 370 }, { "epoch": 0.09530862607463696, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8700564971751412, "eval_PRM F1 AUC": 0.5942902042954427, "eval_PRM F1 AUC (fixed)": 0.6699842849659509, "eval_PRM F1 Neg": 0.34285714285714286, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8191489361702128, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.5328480005264282, "eval_runtime": 16.928, "eval_samples_per_second": 2.599, "eval_steps_per_second": 0.177, "step": 370 }, { "epoch": 0.09556621695591976, "grad_norm": 0.28331637260953885, "learning_rate": 9.537275064267353e-05, "loss": 0.5267, "step": 371 }, { "epoch": 0.09582380783720257, "grad_norm": 0.23483924500354225, "learning_rate": 9.562982005141389e-05, "loss": 0.4323, "step": 372 }, { "epoch": 0.09608139871848537, "grad_norm": 0.1868499578082873, "learning_rate": 9.588688946015425e-05, "loss": 0.5583, "step": 373 }, { "epoch": 0.09633898959976817, "grad_norm": 0.5210569911837933, "learning_rate": 9.61439588688946e-05, "loss": 0.5014, "step": 374 }, { "epoch": 0.09659658048105096, "grad_norm": 0.36489153822322956, "learning_rate": 9.640102827763497e-05, "loss": 0.4962, "step": 375 }, { "epoch": 0.09659658048105096, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8372093023255814, "eval_PRM F1 AUC": 0.5641697223677318, "eval_PRM F1 AUC (fixed)": 0.674698795180723, "eval_PRM F1 Neg": 0.3, "eval_PRM NPV": 0.35294117647058826, "eval_PRM Precision": 0.8089887640449438, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.2608695652173913, "eval_loss": 0.5310724377632141, "eval_runtime": 16.9748, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 375 }, { "epoch": 0.09685417136233378, "grad_norm": 0.19650205672480411, "learning_rate": 9.665809768637533e-05, "loss": 0.4657, "step": 376 }, { "epoch": 0.09711176224361658, "grad_norm": 0.1443011298030704, "learning_rate": 9.691516709511569e-05, "loss": 0.4263, "step": 377 }, { "epoch": 0.09736935312489937, "grad_norm": 0.4113935707165464, "learning_rate": 9.717223650385605e-05, "loss": 0.5134, "step": 378 }, { "epoch": 0.09762694400618219, "grad_norm": 0.558434329883644, "learning_rate": 9.742930591259641e-05, "loss": 0.5736, "step": 379 }, { "epoch": 0.09788453488746499, "grad_norm": 0.14033000522240638, "learning_rate": 9.768637532133677e-05, "loss": 0.4273, "step": 380 }, { "epoch": 0.09788453488746499, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8520710059171598, "eval_PRM F1 AUC": 0.6293871136720797, "eval_PRM F1 AUC (fixed)": 0.7103195390256679, "eval_PRM F1 Neg": 0.4186046511627907, "eval_PRM NPV": 0.45, "eval_PRM Precision": 0.8372093023255814, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5047940611839294, "eval_runtime": 17.2773, "eval_samples_per_second": 2.547, "eval_steps_per_second": 0.174, "step": 380 }, { "epoch": 0.09814212576874778, "grad_norm": 0.15648558150008013, "learning_rate": 9.794344473007713e-05, "loss": 0.4694, "step": 381 }, { "epoch": 0.09839971665003058, "grad_norm": 0.16298054935347225, "learning_rate": 9.820051413881749e-05, "loss": 0.4632, "step": 382 }, { "epoch": 0.0986573075313134, "grad_norm": 0.17347682099313294, "learning_rate": 9.845758354755785e-05, "loss": 0.5555, "step": 383 }, { "epoch": 0.0989148984125962, "grad_norm": 0.47836981451492505, "learning_rate": 9.87146529562982e-05, "loss": 0.5396, "step": 384 }, { "epoch": 0.099172489293879, "grad_norm": 0.1608116292739438, "learning_rate": 9.897172236503857e-05, "loss": 0.4519, "step": 385 }, { "epoch": 0.099172489293879, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.7234154007333682, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4946732819080353, "eval_runtime": 17.4695, "eval_samples_per_second": 2.519, "eval_steps_per_second": 0.172, "step": 385 }, { "epoch": 0.0994300801751618, "grad_norm": 0.17141770911297552, "learning_rate": 9.922879177377893e-05, "loss": 0.5854, "step": 386 }, { "epoch": 0.0996876710564446, "grad_norm": 0.18967728544420465, "learning_rate": 9.948586118251929e-05, "loss": 0.4909, "step": 387 }, { "epoch": 0.0999452619377274, "grad_norm": 0.15732777538667073, "learning_rate": 9.974293059125965e-05, "loss": 0.4709, "step": 388 }, { "epoch": 0.1002028528190102, "grad_norm": 0.15094116449690462, "learning_rate": 0.0001, "loss": 0.464, "step": 389 }, { "epoch": 0.10046044370029301, "grad_norm": 0.15955778560412917, "learning_rate": 9.999997977714101e-05, "loss": 0.4657, "step": 390 }, { "epoch": 0.10046044370029301, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8620689655172413, "eval_PRM F1 AUC": 0.603981141959141, "eval_PRM F1 AUC (fixed)": 0.7341540073336825, "eval_PRM F1 Neg": 0.3684210526315789, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.8241758241758241, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.5114524364471436, "eval_runtime": 16.9846, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 390 }, { "epoch": 0.10071803458157581, "grad_norm": 0.1559179576330506, "learning_rate": 9.999991910858042e-05, "loss": 0.4867, "step": 391 }, { "epoch": 0.10097562546285861, "grad_norm": 0.20213418829756755, "learning_rate": 9.999981799436729e-05, "loss": 0.395, "step": 392 }, { "epoch": 0.10123321634414141, "grad_norm": 0.21351071105005232, "learning_rate": 9.999967643458341e-05, "loss": 0.4189, "step": 393 }, { "epoch": 0.10149080722542422, "grad_norm": 0.16842415689789078, "learning_rate": 9.999949442934331e-05, "loss": 0.4204, "step": 394 }, { "epoch": 0.10174839810670702, "grad_norm": 0.15578484355656985, "learning_rate": 9.99992719787942e-05, "loss": 0.4604, "step": 395 }, { "epoch": 0.10174839810670702, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8538011695906432, "eval_PRM F1 AUC": 0.6136720796228392, "eval_PRM F1 AUC (fixed)": 0.7221058145625983, "eval_PRM F1 Neg": 0.3902439024390244, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8295454545454546, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4976917505264282, "eval_runtime": 16.8242, "eval_samples_per_second": 2.615, "eval_steps_per_second": 0.178, "step": 395 }, { "epoch": 0.10200598898798982, "grad_norm": 0.16597472874867428, "learning_rate": 9.999900908311602e-05, "loss": 0.4295, "step": 396 }, { "epoch": 0.10226357986927263, "grad_norm": 0.17607516670412807, "learning_rate": 9.999870574252143e-05, "loss": 0.4687, "step": 397 }, { "epoch": 0.10252117075055543, "grad_norm": 0.2094674841469055, "learning_rate": 9.999836195725582e-05, "loss": 0.4805, "step": 398 }, { "epoch": 0.10277876163183823, "grad_norm": 0.2261268979682064, "learning_rate": 9.999797772759729e-05, "loss": 0.4885, "step": 399 }, { "epoch": 0.10303635251312103, "grad_norm": 0.15858470980159364, "learning_rate": 9.999755305385663e-05, "loss": 0.458, "step": 400 }, { "epoch": 0.10303635251312103, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8538011695906432, "eval_PRM F1 AUC": 0.6136720796228392, "eval_PRM F1 AUC (fixed)": 0.7291775798847565, "eval_PRM F1 Neg": 0.3902439024390244, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8295454545454546, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.5031072497367859, "eval_runtime": 16.9642, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 400 }, { "epoch": 0.10329394339440384, "grad_norm": 0.15572759659857444, "learning_rate": 9.999708793637736e-05, "loss": 0.4792, "step": 401 }, { "epoch": 0.10355153427568664, "grad_norm": 0.1953860715496762, "learning_rate": 9.999658237553574e-05, "loss": 0.4669, "step": 402 }, { "epoch": 0.10380912515696944, "grad_norm": 0.21379356816183082, "learning_rate": 9.999603637174071e-05, "loss": 0.4282, "step": 403 }, { "epoch": 0.10406671603825225, "grad_norm": 0.24861255212920058, "learning_rate": 9.999544992543395e-05, "loss": 0.4617, "step": 404 }, { "epoch": 0.10432430691953505, "grad_norm": 0.1603464704080714, "learning_rate": 9.999482303708985e-05, "loss": 0.4448, "step": 405 }, { "epoch": 0.10432430691953505, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8390804597701149, "eval_PRM F1 AUC": 0.5484546883184913, "eval_PRM F1 AUC (fixed)": 0.7239392352016764, "eval_PRM F1 Neg": 0.2631578947368421, "eval_PRM NPV": 0.3333333333333333, "eval_PRM Precision": 0.8021978021978022, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.5149147510528564, "eval_runtime": 17.3849, "eval_samples_per_second": 2.531, "eval_steps_per_second": 0.173, "step": 405 }, { "epoch": 0.10458189780081785, "grad_norm": 0.16544463999602066, "learning_rate": 9.999415570721549e-05, "loss": 0.4365, "step": 406 }, { "epoch": 0.10483948868210065, "grad_norm": 0.2854230612503904, "learning_rate": 9.999344793635068e-05, "loss": 0.5049, "step": 407 }, { "epoch": 0.10509707956338346, "grad_norm": 0.25741146107216933, "learning_rate": 9.999269972506797e-05, "loss": 0.4587, "step": 408 }, { "epoch": 0.10535467044466626, "grad_norm": 0.17499395517678254, "learning_rate": 9.999191107397258e-05, "loss": 0.4283, "step": 409 }, { "epoch": 0.10561226132594906, "grad_norm": 0.2089889252840499, "learning_rate": 9.999108198370249e-05, "loss": 0.4571, "step": 410 }, { "epoch": 0.10561226132594906, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.7328444211629125, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4838423430919647, "eval_runtime": 17.7126, "eval_samples_per_second": 2.484, "eval_steps_per_second": 0.169, "step": 410 }, { "epoch": 0.10586985220723186, "grad_norm": 0.18161399043270976, "learning_rate": 9.999021245492832e-05, "loss": 0.4238, "step": 411 }, { "epoch": 0.10612744308851467, "grad_norm": 0.14000774768905813, "learning_rate": 9.998930248835348e-05, "loss": 0.4118, "step": 412 }, { "epoch": 0.10638503396979747, "grad_norm": 0.20132202608236363, "learning_rate": 9.998835208471404e-05, "loss": 0.5118, "step": 413 }, { "epoch": 0.10664262485108027, "grad_norm": 0.29637805177344245, "learning_rate": 9.998736124477879e-05, "loss": 0.5781, "step": 414 }, { "epoch": 0.10690021573236308, "grad_norm": 0.18134702533907654, "learning_rate": 9.998632996934925e-05, "loss": 0.4832, "step": 415 }, { "epoch": 0.10690021573236308, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.7294394971189104, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4801136255264282, "eval_runtime": 17.3301, "eval_samples_per_second": 2.539, "eval_steps_per_second": 0.173, "step": 415 }, { "epoch": 0.10715780661364588, "grad_norm": 0.253229647609327, "learning_rate": 9.998525825925961e-05, "loss": 0.5234, "step": 416 }, { "epoch": 0.10741539749492868, "grad_norm": 0.3321065579408871, "learning_rate": 9.998414611537681e-05, "loss": 0.4654, "step": 417 }, { "epoch": 0.10767298837621148, "grad_norm": 0.15612392409311915, "learning_rate": 9.998299353860048e-05, "loss": 0.4434, "step": 418 }, { "epoch": 0.10793057925749429, "grad_norm": 0.19621395056064136, "learning_rate": 9.998180052986294e-05, "loss": 0.4868, "step": 419 }, { "epoch": 0.10818817013877709, "grad_norm": 0.35415224476374046, "learning_rate": 9.998056709012927e-05, "loss": 0.5612, "step": 420 }, { "epoch": 0.10818817013877709, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8390804597701149, "eval_PRM F1 AUC": 0.5484546883184913, "eval_PRM F1 AUC (fixed)": 0.7215819800942903, "eval_PRM F1 Neg": 0.2631578947368421, "eval_PRM NPV": 0.3333333333333333, "eval_PRM Precision": 0.8021978021978022, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.5131391882896423, "eval_runtime": 17.5344, "eval_samples_per_second": 2.509, "eval_steps_per_second": 0.171, "step": 420 }, { "epoch": 0.10844576102005989, "grad_norm": 0.4068922414515879, "learning_rate": 9.997929322039717e-05, "loss": 0.5337, "step": 421 }, { "epoch": 0.1087033519013427, "grad_norm": 0.34422426148894386, "learning_rate": 9.99779789216971e-05, "loss": 0.372, "step": 422 }, { "epoch": 0.1089609427826255, "grad_norm": 0.24720166484716657, "learning_rate": 9.997662419509224e-05, "loss": 0.4539, "step": 423 }, { "epoch": 0.1092185336639083, "grad_norm": 0.1857752522364961, "learning_rate": 9.997522904167844e-05, "loss": 0.5204, "step": 424 }, { "epoch": 0.1094761245451911, "grad_norm": 0.1529748396919358, "learning_rate": 9.997379346258424e-05, "loss": 0.4264, "step": 425 }, { "epoch": 0.1094761245451911, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8390804597701149, "eval_PRM F1 AUC": 0.5484546883184913, "eval_PRM F1 AUC (fixed)": 0.6925091671031954, "eval_PRM F1 Neg": 0.2631578947368421, "eval_PRM NPV": 0.3333333333333333, "eval_PRM Precision": 0.8021978021978022, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.21739130434782608, "eval_loss": 0.5328480005264282, "eval_runtime": 17.3638, "eval_samples_per_second": 2.534, "eval_steps_per_second": 0.173, "step": 425 }, { "epoch": 0.10973371542647391, "grad_norm": 0.20456549613825648, "learning_rate": 9.997231745897093e-05, "loss": 0.4628, "step": 426 }, { "epoch": 0.1099913063077567, "grad_norm": 0.29545033484076455, "learning_rate": 9.997080103203245e-05, "loss": 0.4632, "step": 427 }, { "epoch": 0.1102488971890395, "grad_norm": 0.29427391377059076, "learning_rate": 9.996924418299546e-05, "loss": 0.4489, "step": 428 }, { "epoch": 0.11050648807032232, "grad_norm": 0.2133142414876546, "learning_rate": 9.996764691311933e-05, "loss": 0.467, "step": 429 }, { "epoch": 0.11076407895160512, "grad_norm": 0.1792954183091056, "learning_rate": 9.99660092236961e-05, "loss": 0.441, "step": 430 }, { "epoch": 0.11076407895160512, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8421052631578947, "eval_PRM F1 AUC": 0.5859088528025145, "eval_PRM F1 AUC (fixed)": 0.7372970141435307, "eval_PRM F1 Neg": 0.34146341463414637, "eval_PRM NPV": 0.3888888888888889, "eval_PRM Precision": 0.8181818181818182, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.49147728085517883, "eval_runtime": 17.0876, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 430 }, { "epoch": 0.11102166983288791, "grad_norm": 0.15464138038121494, "learning_rate": 9.996433111605052e-05, "loss": 0.3917, "step": 431 }, { "epoch": 0.11127926071417071, "grad_norm": 0.3063809759370399, "learning_rate": 9.996261259154005e-05, "loss": 0.5573, "step": 432 }, { "epoch": 0.11153685159545353, "grad_norm": 0.24387152098356815, "learning_rate": 9.996085365155482e-05, "loss": 0.4427, "step": 433 }, { "epoch": 0.11179444247673632, "grad_norm": 0.1479317668426719, "learning_rate": 9.995905429751769e-05, "loss": 0.4525, "step": 434 }, { "epoch": 0.11205203335801912, "grad_norm": 0.2999367338551839, "learning_rate": 9.995721453088412e-05, "loss": 0.3997, "step": 435 }, { "epoch": 0.11205203335801912, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 AUC (fixed)": 0.7600838135149292, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.45143821835517883, "eval_runtime": 16.9173, "eval_samples_per_second": 2.601, "eval_steps_per_second": 0.177, "step": 435 }, { "epoch": 0.11230962423930192, "grad_norm": 0.2907942023534451, "learning_rate": 9.995533435314237e-05, "loss": 0.3766, "step": 436 }, { "epoch": 0.11256721512058473, "grad_norm": 0.17800174577133607, "learning_rate": 9.995341376581336e-05, "loss": 0.4478, "step": 437 }, { "epoch": 0.11282480600186753, "grad_norm": 0.15908663006398277, "learning_rate": 9.995145277045061e-05, "loss": 0.4207, "step": 438 }, { "epoch": 0.11308239688315033, "grad_norm": 0.1482303459601316, "learning_rate": 9.994945136864046e-05, "loss": 0.4181, "step": 439 }, { "epoch": 0.11333998776443314, "grad_norm": 0.1814566515082046, "learning_rate": 9.994740956200186e-05, "loss": 0.4548, "step": 440 }, { "epoch": 0.11333998776443314, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 AUC (fixed)": 0.751440544787847, "eval_PRM F1 Neg": 0.45, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4646661877632141, "eval_runtime": 16.9266, "eval_samples_per_second": 2.599, "eval_steps_per_second": 0.177, "step": 440 }, { "epoch": 0.11359757864571594, "grad_norm": 0.1858776933699486, "learning_rate": 9.994532735218646e-05, "loss": 0.4098, "step": 441 }, { "epoch": 0.11385516952699874, "grad_norm": 0.3522725312854075, "learning_rate": 9.994320474087858e-05, "loss": 0.4841, "step": 442 }, { "epoch": 0.11411276040828154, "grad_norm": 0.19311937353844774, "learning_rate": 9.994104172979522e-05, "loss": 0.4019, "step": 443 }, { "epoch": 0.11437035128956435, "grad_norm": 0.18798207183678353, "learning_rate": 9.993883832068607e-05, "loss": 0.5132, "step": 444 }, { "epoch": 0.11462794217084715, "grad_norm": 0.19688675449288384, "learning_rate": 9.993659451533353e-05, "loss": 0.3989, "step": 445 }, { "epoch": 0.11462794217084715, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 AUC (fixed)": 0.7194866422210581, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.49911221861839294, "eval_runtime": 17.4796, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 445 }, { "epoch": 0.11488553305212995, "grad_norm": 0.363217425309566, "learning_rate": 9.99343103155526e-05, "loss": 0.3946, "step": 446 }, { "epoch": 0.11514312393341276, "grad_norm": 0.17516787099905137, "learning_rate": 9.993198572319106e-05, "loss": 0.4768, "step": 447 }, { "epoch": 0.11540071481469556, "grad_norm": 0.2283411476567932, "learning_rate": 9.992962074012926e-05, "loss": 0.4892, "step": 448 }, { "epoch": 0.11565830569597836, "grad_norm": 0.29854758113505353, "learning_rate": 9.992721536828029e-05, "loss": 0.3802, "step": 449 }, { "epoch": 0.11591589657726116, "grad_norm": 0.17134261585968869, "learning_rate": 9.992476960958987e-05, "loss": 0.4498, "step": 450 }, { "epoch": 0.11591589657726116, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8491620111731844, "eval_PRM F1 AUC": 0.5230487166055526, "eval_PRM F1 AUC (fixed)": 0.6990570979570455, "eval_PRM F1 Neg": 0.18181818181818182, "eval_PRM NPV": 0.3, "eval_PRM Precision": 0.7916666666666666, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.13043478260869565, "eval_loss": 0.5714666247367859, "eval_runtime": 16.6687, "eval_samples_per_second": 2.64, "eval_steps_per_second": 0.18, "step": 450 }, { "epoch": 0.11617348745854397, "grad_norm": 0.5179158338082497, "learning_rate": 9.992228346603645e-05, "loss": 0.5694, "step": 451 }, { "epoch": 0.11643107833982677, "grad_norm": 0.14435030696402013, "learning_rate": 9.991975693963107e-05, "loss": 0.348, "step": 452 }, { "epoch": 0.11668866922110957, "grad_norm": 0.3095028223705166, "learning_rate": 9.991719003241747e-05, "loss": 0.5441, "step": 453 }, { "epoch": 0.11694626010239237, "grad_norm": 0.18501112554057614, "learning_rate": 9.991458274647208e-05, "loss": 0.4509, "step": 454 }, { "epoch": 0.11720385098367518, "grad_norm": 0.3488794160216645, "learning_rate": 9.991193508390397e-05, "loss": 0.4628, "step": 455 }, { "epoch": 0.11720385098367518, "eval_PRM Accuracy": 0.7075471698113207, "eval_PRM F1": 0.8098159509202454, "eval_PRM F1 AUC": 0.5932425353588267, "eval_PRM F1 AUC (fixed)": 0.6982713462545835, "eval_PRM F1 Neg": 0.3673469387755102, "eval_PRM NPV": 0.34615384615384615, "eval_PRM Precision": 0.825, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5284090638160706, "eval_runtime": 16.9875, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 455 }, { "epoch": 0.11746144186495798, "grad_norm": 0.19188328551639264, "learning_rate": 9.990924704685486e-05, "loss": 0.4861, "step": 456 }, { "epoch": 0.11771903274624078, "grad_norm": 0.16743112572800217, "learning_rate": 9.990651863749915e-05, "loss": 0.4494, "step": 457 }, { "epoch": 0.11797662362752359, "grad_norm": 0.16990822788508342, "learning_rate": 9.990374985804389e-05, "loss": 0.4836, "step": 458 }, { "epoch": 0.11823421450880639, "grad_norm": 0.17530360052546765, "learning_rate": 9.990094071072877e-05, "loss": 0.519, "step": 459 }, { "epoch": 0.11849180539008919, "grad_norm": 0.23016022682514356, "learning_rate": 9.989809119782617e-05, "loss": 0.4656, "step": 460 }, { "epoch": 0.11849180539008919, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.7095337873232059, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.5185546875, "eval_runtime": 16.4348, "eval_samples_per_second": 2.677, "eval_steps_per_second": 0.183, "step": 460 }, { "epoch": 0.11874939627137199, "grad_norm": 0.16776038480661404, "learning_rate": 9.98952013216411e-05, "loss": 0.4884, "step": 461 }, { "epoch": 0.1190069871526548, "grad_norm": 0.30116613735561465, "learning_rate": 9.98922710845112e-05, "loss": 0.4944, "step": 462 }, { "epoch": 0.1192645780339376, "grad_norm": 0.16277221121895444, "learning_rate": 9.98893004888068e-05, "loss": 0.4619, "step": 463 }, { "epoch": 0.1195221689152204, "grad_norm": 0.2884572782143645, "learning_rate": 9.988628953693086e-05, "loss": 0.5342, "step": 464 }, { "epoch": 0.11977975979650321, "grad_norm": 0.23336050166838512, "learning_rate": 9.988323823131898e-05, "loss": 0.3791, "step": 465 }, { "epoch": 0.11977975979650321, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8313253012048193, "eval_PRM F1 AUC": 0.6113148245154532, "eval_PRM F1 AUC (fixed)": 0.6990570979570455, "eval_PRM F1 Neg": 0.391304347826087, "eval_PRM NPV": 0.391304347826087, "eval_PRM Precision": 0.8313253012048193, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5411931872367859, "eval_runtime": 17.247, "eval_samples_per_second": 2.551, "eval_steps_per_second": 0.174, "step": 465 }, { "epoch": 0.12003735067778601, "grad_norm": 0.22876765461599868, "learning_rate": 9.988014657443941e-05, "loss": 0.4939, "step": 466 }, { "epoch": 0.12029494155906881, "grad_norm": 0.18211896106958544, "learning_rate": 9.987701456879301e-05, "loss": 0.46, "step": 467 }, { "epoch": 0.1205525324403516, "grad_norm": 0.20986812857185289, "learning_rate": 9.987384221691331e-05, "loss": 0.4288, "step": 468 }, { "epoch": 0.12081012332163442, "grad_norm": 0.1716281564000407, "learning_rate": 9.98706295213665e-05, "loss": 0.4804, "step": 469 }, { "epoch": 0.12106771420291722, "grad_norm": 0.1914473583057819, "learning_rate": 9.986737648475136e-05, "loss": 0.4898, "step": 470 }, { "epoch": 0.12106771420291722, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8352941176470589, "eval_PRM F1 AUC": 0.5798847564169722, "eval_PRM F1 AUC (fixed)": 0.6909376636982714, "eval_PRM F1 Neg": 0.3333333333333333, "eval_PRM NPV": 0.3684210526315789, "eval_PRM Precision": 0.8160919540229885, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.5569957494735718, "eval_runtime": 17.1178, "eval_samples_per_second": 2.57, "eval_steps_per_second": 0.175, "step": 470 }, { "epoch": 0.12132530508420002, "grad_norm": 0.18975921320947228, "learning_rate": 9.986408310969933e-05, "loss": 0.4624, "step": 471 }, { "epoch": 0.12158289596548282, "grad_norm": 0.2313278593118049, "learning_rate": 9.986074939887443e-05, "loss": 0.4887, "step": 472 }, { "epoch": 0.12184048684676563, "grad_norm": 0.22364032858385213, "learning_rate": 9.985737535497337e-05, "loss": 0.5237, "step": 473 }, { "epoch": 0.12209807772804843, "grad_norm": 0.22944534912111908, "learning_rate": 9.985396098072548e-05, "loss": 0.539, "step": 474 }, { "epoch": 0.12235566860933123, "grad_norm": 0.22495178012957986, "learning_rate": 9.985050627889267e-05, "loss": 0.4471, "step": 475 }, { "epoch": 0.12235566860933123, "eval_PRM Accuracy": 0.6981132075471698, "eval_PRM F1": 0.7974683544303798, "eval_PRM F1 AUC": 0.6186485070717653, "eval_PRM F1 AUC (fixed)": 0.7074384494499738, "eval_PRM F1 Neg": 0.4074074074074074, "eval_PRM NPV": 0.3548387096774194, "eval_PRM Precision": 0.84, "eval_PRM Recall": 0.7590361445783133, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.5404829382896423, "eval_runtime": 17.3753, "eval_samples_per_second": 2.532, "eval_steps_per_second": 0.173, "step": 475 }, { "epoch": 0.12261325949061404, "grad_norm": 0.3876207521571214, "learning_rate": 9.984701125226951e-05, "loss": 0.4311, "step": 476 }, { "epoch": 0.12287085037189684, "grad_norm": 0.3426845161190092, "learning_rate": 9.984347590368317e-05, "loss": 0.4346, "step": 477 }, { "epoch": 0.12312844125317964, "grad_norm": 0.15189458060441555, "learning_rate": 9.983990023599346e-05, "loss": 0.4772, "step": 478 }, { "epoch": 0.12338603213446243, "grad_norm": 0.17658901434875726, "learning_rate": 9.983628425209277e-05, "loss": 0.456, "step": 479 }, { "epoch": 0.12364362301574525, "grad_norm": 0.33436832155207574, "learning_rate": 9.983262795490613e-05, "loss": 0.5246, "step": 480 }, { "epoch": 0.12364362301574525, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8685714285714285, "eval_PRM F1 AUC": 0.610005238344683, "eval_PRM F1 AUC (fixed)": 0.7433211105290728, "eval_PRM F1 Neg": 0.3783783783783784, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8260869565217391, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.525390625, "eval_runtime": 17.6488, "eval_samples_per_second": 2.493, "eval_steps_per_second": 0.17, "step": 480 }, { "epoch": 0.12390121389702805, "grad_norm": 0.19496835575163987, "learning_rate": 9.982893134739117e-05, "loss": 0.4505, "step": 481 }, { "epoch": 0.12415880477831084, "grad_norm": 0.39693619983320255, "learning_rate": 9.982519443253814e-05, "loss": 0.558, "step": 482 }, { "epoch": 0.12441639565959366, "grad_norm": 0.17315084168741193, "learning_rate": 9.982141721336986e-05, "loss": 0.4958, "step": 483 }, { "epoch": 0.12467398654087646, "grad_norm": 0.18915620776655914, "learning_rate": 9.98175996929418e-05, "loss": 0.506, "step": 484 }, { "epoch": 0.12493157742215925, "grad_norm": 0.4033255260753271, "learning_rate": 9.9813741874342e-05, "loss": 0.4501, "step": 485 }, { "epoch": 0.12493157742215925, "eval_PRM Accuracy": 0.6981132075471698, "eval_PRM F1": 0.7837837837837838, "eval_PRM F1 AUC": 0.6972236773179675, "eval_PRM F1 AUC (fixed)": 0.7336301728653746, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.3902439024390244, "eval_PRM Precision": 0.8923076923076924, "eval_PRM Recall": 0.6987951807228916, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.5287641882896423, "eval_runtime": 16.3762, "eval_samples_per_second": 2.687, "eval_steps_per_second": 0.183, "step": 485 }, { "epoch": 0.12518916830344207, "grad_norm": 0.541164411061555, "learning_rate": 9.98098437606911e-05, "loss": 0.5239, "step": 486 }, { "epoch": 0.12544675918472487, "grad_norm": 0.19254161502867567, "learning_rate": 9.980590535514233e-05, "loss": 0.4735, "step": 487 }, { "epoch": 0.12570435006600766, "grad_norm": 0.1538111819435099, "learning_rate": 9.980192666088155e-05, "loss": 0.4907, "step": 488 }, { "epoch": 0.12596194094729046, "grad_norm": 0.3066978782803548, "learning_rate": 9.979790768112718e-05, "loss": 0.4783, "step": 489 }, { "epoch": 0.12621953182857326, "grad_norm": 0.1411733561568654, "learning_rate": 9.97938484191302e-05, "loss": 0.4237, "step": 490 }, { "epoch": 0.12621953182857326, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8604651162790697, "eval_PRM F1 AUC": 0.6196961760083813, "eval_PRM F1 AUC (fixed)": 0.7608695652173914, "eval_PRM F1 Neg": 0.4, "eval_PRM NPV": 0.47058823529411764, "eval_PRM Precision": 0.8314606741573034, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.5184659361839294, "eval_runtime": 16.8495, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 490 }, { "epoch": 0.12647712270985606, "grad_norm": 0.23043606595833918, "learning_rate": 9.978974887817422e-05, "loss": 0.4733, "step": 491 }, { "epoch": 0.1267347135911389, "grad_norm": 0.4102961064014028, "learning_rate": 9.978560906157543e-05, "loss": 0.5903, "step": 492 }, { "epoch": 0.12699230447242169, "grad_norm": 0.22264561941506675, "learning_rate": 9.978142897268258e-05, "loss": 0.3833, "step": 493 }, { "epoch": 0.12724989535370448, "grad_norm": 0.16955909867564428, "learning_rate": 9.9777208614877e-05, "loss": 0.4098, "step": 494 }, { "epoch": 0.12750748623498728, "grad_norm": 0.18022022135101873, "learning_rate": 9.977294799157259e-05, "loss": 0.4367, "step": 495 }, { "epoch": 0.12750748623498728, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8383233532934131, "eval_PRM F1 AUC": 0.6173389209009953, "eval_PRM F1 AUC (fixed)": 0.7823467784180199, "eval_PRM F1 Neg": 0.4, "eval_PRM NPV": 0.4090909090909091, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.48135653138160706, "eval_runtime": 16.983, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 495 }, { "epoch": 0.12776507711627008, "grad_norm": 0.1666190087756971, "learning_rate": 9.976864710621587e-05, "loss": 0.4697, "step": 496 }, { "epoch": 0.12802266799755288, "grad_norm": 0.18848552450234565, "learning_rate": 9.976430596228584e-05, "loss": 0.3757, "step": 497 }, { "epoch": 0.12828025887883568, "grad_norm": 0.4272381150332115, "learning_rate": 9.975992456329412e-05, "loss": 0.5456, "step": 498 }, { "epoch": 0.1285378497601185, "grad_norm": 0.1735851448416884, "learning_rate": 9.975550291278493e-05, "loss": 0.4972, "step": 499 }, { "epoch": 0.1287954406414013, "grad_norm": 0.3372198854693474, "learning_rate": 9.975104101433494e-05, "loss": 0.3926, "step": 500 }, { "epoch": 0.1287954406414013, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.7951807228915663, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4642223119735718, "eval_runtime": 16.2875, "eval_samples_per_second": 2.701, "eval_steps_per_second": 0.184, "step": 500 }, { "epoch": 0.1290530315226841, "grad_norm": 0.23243013203416885, "learning_rate": 9.97465388715535e-05, "loss": 0.4365, "step": 501 }, { "epoch": 0.1293106224039669, "grad_norm": 0.18134733182489435, "learning_rate": 9.974199648808242e-05, "loss": 0.44, "step": 502 }, { "epoch": 0.1295682132852497, "grad_norm": 0.2079239247334588, "learning_rate": 9.973741386759614e-05, "loss": 0.4678, "step": 503 }, { "epoch": 0.1298258041665325, "grad_norm": 0.15677292629538625, "learning_rate": 9.973279101380158e-05, "loss": 0.4219, "step": 504 }, { "epoch": 0.1300833950478153, "grad_norm": 0.14797415216563284, "learning_rate": 9.972812793043822e-05, "loss": 0.344, "step": 505 }, { "epoch": 0.1300833950478153, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8520710059171598, "eval_PRM F1 AUC": 0.6293871136720797, "eval_PRM F1 AUC (fixed)": 0.819015191199581, "eval_PRM F1 Neg": 0.4186046511627907, "eval_PRM NPV": 0.45, "eval_PRM Precision": 0.8372093023255814, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4420276880264282, "eval_runtime": 16.6527, "eval_samples_per_second": 2.642, "eval_steps_per_second": 0.18, "step": 505 }, { "epoch": 0.1303409859290981, "grad_norm": 0.2156201044253168, "learning_rate": 9.97234246212781e-05, "loss": 0.3819, "step": 506 }, { "epoch": 0.13059857681038092, "grad_norm": 0.15209645182404072, "learning_rate": 9.971868109012584e-05, "loss": 0.3684, "step": 507 }, { "epoch": 0.13085616769166372, "grad_norm": 0.14796710634213806, "learning_rate": 9.971389734081848e-05, "loss": 0.403, "step": 508 }, { "epoch": 0.13111375857294652, "grad_norm": 0.18733175562992538, "learning_rate": 9.970907337722573e-05, "loss": 0.4461, "step": 509 }, { "epoch": 0.13137134945422932, "grad_norm": 0.19539929424521896, "learning_rate": 9.970420920324973e-05, "loss": 0.3827, "step": 510 }, { "epoch": 0.13137134945422932, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.8253012048192772, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4430042505264282, "eval_runtime": 16.9975, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.176, "step": 510 }, { "epoch": 0.13162894033551212, "grad_norm": 0.13720232796296922, "learning_rate": 9.969930482282517e-05, "loss": 0.3627, "step": 511 }, { "epoch": 0.13188653121679492, "grad_norm": 0.1931117883189801, "learning_rate": 9.96943602399193e-05, "loss": 0.4324, "step": 512 }, { "epoch": 0.13214412209807772, "grad_norm": 0.2464304212601258, "learning_rate": 9.968937545853183e-05, "loss": 0.401, "step": 513 }, { "epoch": 0.13240171297936054, "grad_norm": 0.2286895783952905, "learning_rate": 9.968435048269506e-05, "loss": 0.4901, "step": 514 }, { "epoch": 0.13265930386064334, "grad_norm": 0.28191949398014665, "learning_rate": 9.967928531647374e-05, "loss": 0.3807, "step": 515 }, { "epoch": 0.13265930386064334, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8538011695906432, "eval_PRM F1 AUC": 0.6136720796228392, "eval_PRM F1 AUC (fixed)": 0.8014667365112624, "eval_PRM F1 Neg": 0.3902439024390244, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8295454545454546, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.45419034361839294, "eval_runtime": 16.4526, "eval_samples_per_second": 2.674, "eval_steps_per_second": 0.182, "step": 515 }, { "epoch": 0.13291689474192614, "grad_norm": 0.30036386163077716, "learning_rate": 9.967417996396515e-05, "loss": 0.5147, "step": 516 }, { "epoch": 0.13317448562320894, "grad_norm": 0.2381165463587887, "learning_rate": 9.966903442929912e-05, "loss": 0.4514, "step": 517 }, { "epoch": 0.13343207650449174, "grad_norm": 0.2553809821857254, "learning_rate": 9.966384871663791e-05, "loss": 0.5682, "step": 518 }, { "epoch": 0.13368966738577454, "grad_norm": 0.14562660210177747, "learning_rate": 9.965862283017634e-05, "loss": 0.3927, "step": 519 }, { "epoch": 0.13394725826705733, "grad_norm": 0.19130425296371797, "learning_rate": 9.965335677414169e-05, "loss": 0.5246, "step": 520 }, { "epoch": 0.13394725826705733, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 AUC (fixed)": 0.7668936616029334, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.48055753111839294, "eval_runtime": 16.4423, "eval_samples_per_second": 2.676, "eval_steps_per_second": 0.182, "step": 520 }, { "epoch": 0.13420484914834016, "grad_norm": 0.19635568998878608, "learning_rate": 9.964805055279375e-05, "loss": 0.4501, "step": 521 }, { "epoch": 0.13446244002962296, "grad_norm": 0.19298995301566033, "learning_rate": 9.96427041704248e-05, "loss": 0.458, "step": 522 }, { "epoch": 0.13472003091090576, "grad_norm": 0.17217381619733002, "learning_rate": 9.963731763135962e-05, "loss": 0.4226, "step": 523 }, { "epoch": 0.13497762179218856, "grad_norm": 0.15567023610076314, "learning_rate": 9.963189093995543e-05, "loss": 0.4658, "step": 524 }, { "epoch": 0.13523521267347136, "grad_norm": 0.20454779429172162, "learning_rate": 9.962642410060199e-05, "loss": 0.4434, "step": 525 }, { "epoch": 0.13523521267347136, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8670520231213873, "eval_PRM F1 AUC": 0.6257202723939235, "eval_PRM F1 AUC (fixed)": 0.7666317443687796, "eval_PRM F1 Neg": 0.41025641025641024, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4827769994735718, "eval_runtime": 17.0237, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 525 }, { "epoch": 0.13549280355475415, "grad_norm": 0.18673112417563809, "learning_rate": 9.962091711772149e-05, "loss": 0.4381, "step": 526 }, { "epoch": 0.13575039443603695, "grad_norm": 0.17857466313927792, "learning_rate": 9.961536999576858e-05, "loss": 0.446, "step": 527 }, { "epoch": 0.13600798531731978, "grad_norm": 0.1430458337040357, "learning_rate": 9.960978273923045e-05, "loss": 0.383, "step": 528 }, { "epoch": 0.13626557619860258, "grad_norm": 0.21712102874818842, "learning_rate": 9.960415535262671e-05, "loss": 0.4592, "step": 529 }, { "epoch": 0.13652316707988538, "grad_norm": 0.16887131482346196, "learning_rate": 9.959848784050941e-05, "loss": 0.3989, "step": 530 }, { "epoch": 0.13652316707988538, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.7765845992666317, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4584517180919647, "eval_runtime": 16.9731, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 530 }, { "epoch": 0.13678075796116818, "grad_norm": 0.1644342267077243, "learning_rate": 9.959278020746308e-05, "loss": 0.4431, "step": 531 }, { "epoch": 0.13703834884245097, "grad_norm": 0.21428398361967044, "learning_rate": 9.958703245810472e-05, "loss": 0.3902, "step": 532 }, { "epoch": 0.13729593972373377, "grad_norm": 0.21520986079808266, "learning_rate": 9.958124459708378e-05, "loss": 0.4852, "step": 533 }, { "epoch": 0.13755353060501657, "grad_norm": 0.18083797967486132, "learning_rate": 9.957541662908211e-05, "loss": 0.4208, "step": 534 }, { "epoch": 0.1378111214862994, "grad_norm": 0.13634423713941946, "learning_rate": 9.956954855881409e-05, "loss": 0.4408, "step": 535 }, { "epoch": 0.1378111214862994, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 AUC (fixed)": 0.7781561026715557, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4533025622367859, "eval_runtime": 17.1738, "eval_samples_per_second": 2.562, "eval_steps_per_second": 0.175, "step": 535 }, { "epoch": 0.1380687123675822, "grad_norm": 0.14534073818815002, "learning_rate": 9.956364039102642e-05, "loss": 0.4851, "step": 536 }, { "epoch": 0.138326303248865, "grad_norm": 0.23394278593735526, "learning_rate": 9.955769213049834e-05, "loss": 0.4349, "step": 537 }, { "epoch": 0.1385838941301478, "grad_norm": 0.16137021473735455, "learning_rate": 9.955170378204148e-05, "loss": 0.4472, "step": 538 }, { "epoch": 0.1388414850114306, "grad_norm": 0.15990281414868324, "learning_rate": 9.95456753504999e-05, "loss": 0.48, "step": 539 }, { "epoch": 0.1390990758927134, "grad_norm": 0.1380368399427166, "learning_rate": 9.953960684075008e-05, "loss": 0.3557, "step": 540 }, { "epoch": 0.1390990758927134, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8538011695906432, "eval_PRM F1 AUC": 0.6136720796228392, "eval_PRM F1 AUC (fixed)": 0.782608695652174, "eval_PRM F1 Neg": 0.3902439024390244, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8295454545454546, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4630681872367859, "eval_runtime": 16.3394, "eval_samples_per_second": 2.693, "eval_steps_per_second": 0.184, "step": 540 }, { "epoch": 0.1393566667739962, "grad_norm": 0.12860872444305896, "learning_rate": 9.953349825770092e-05, "loss": 0.3588, "step": 541 }, { "epoch": 0.139614257655279, "grad_norm": 0.3595882169037072, "learning_rate": 9.952734960629377e-05, "loss": 0.5299, "step": 542 }, { "epoch": 0.13987184853656182, "grad_norm": 0.13181945672957565, "learning_rate": 9.952116089150232e-05, "loss": 0.3421, "step": 543 }, { "epoch": 0.14012943941784461, "grad_norm": 0.30647108715130694, "learning_rate": 9.951493211833274e-05, "loss": 0.4841, "step": 544 }, { "epoch": 0.1403870302991274, "grad_norm": 0.14305039438230568, "learning_rate": 9.950866329182356e-05, "loss": 0.3758, "step": 545 }, { "epoch": 0.1403870302991274, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8343558282208589, "eval_PRM F1 AUC": 0.6487689889994761, "eval_PRM F1 AUC (fixed)": 0.7718700890518596, "eval_PRM F1 Neg": 0.4489795918367347, "eval_PRM NPV": 0.4230769230769231, "eval_PRM Precision": 0.85, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4650213122367859, "eval_runtime": 16.5497, "eval_samples_per_second": 2.659, "eval_steps_per_second": 0.181, "step": 545 }, { "epoch": 0.1406446211804102, "grad_norm": 0.20571048343383005, "learning_rate": 9.950235441704574e-05, "loss": 0.3588, "step": 546 }, { "epoch": 0.140902212061693, "grad_norm": 0.14773983628595605, "learning_rate": 9.94960054991026e-05, "loss": 0.4495, "step": 547 }, { "epoch": 0.1411598029429758, "grad_norm": 0.20537275966087623, "learning_rate": 9.948961654312987e-05, "loss": 0.3736, "step": 548 }, { "epoch": 0.1414173938242586, "grad_norm": 0.1561976741038428, "learning_rate": 9.948318755429569e-05, "loss": 0.3903, "step": 549 }, { "epoch": 0.14167498470554143, "grad_norm": 0.19033190051807455, "learning_rate": 9.947671853780054e-05, "loss": 0.4475, "step": 550 }, { "epoch": 0.14167498470554143, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8414634146341463, "eval_PRM F1 AUC": 0.6547930853850183, "eval_PRM F1 AUC (fixed)": 0.7723939235201676, "eval_PRM F1 Neg": 0.4583333333333333, "eval_PRM NPV": 0.44, "eval_PRM Precision": 0.8518518518518519, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.47682884335517883, "eval_runtime": 17.3925, "eval_samples_per_second": 2.53, "eval_steps_per_second": 0.172, "step": 550 }, { "epoch": 0.14193257558682423, "grad_norm": 0.24424439496753372, "learning_rate": 9.947020949887732e-05, "loss": 0.4133, "step": 551 }, { "epoch": 0.14219016646810703, "grad_norm": 0.15774239195977913, "learning_rate": 9.946366044279127e-05, "loss": 0.4132, "step": 552 }, { "epoch": 0.14244775734938983, "grad_norm": 0.15828250510157615, "learning_rate": 9.945707137484002e-05, "loss": 0.3469, "step": 553 }, { "epoch": 0.14270534823067263, "grad_norm": 0.3625889067067729, "learning_rate": 9.945044230035356e-05, "loss": 0.5171, "step": 554 }, { "epoch": 0.14296293911195543, "grad_norm": 0.24737500122935935, "learning_rate": 9.944377322469425e-05, "loss": 0.3971, "step": 555 }, { "epoch": 0.14296293911195543, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.787847040335254, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4770951569080353, "eval_runtime": 17.1821, "eval_samples_per_second": 2.561, "eval_steps_per_second": 0.175, "step": 555 }, { "epoch": 0.14322052999323823, "grad_norm": 0.2036589367656424, "learning_rate": 9.943706415325678e-05, "loss": 0.4076, "step": 556 }, { "epoch": 0.14347812087452105, "grad_norm": 0.16148951825642974, "learning_rate": 9.943031509146825e-05, "loss": 0.4358, "step": 557 }, { "epoch": 0.14373571175580385, "grad_norm": 0.1550701405332846, "learning_rate": 9.942352604478804e-05, "loss": 0.4499, "step": 558 }, { "epoch": 0.14399330263708665, "grad_norm": 0.23723687725191614, "learning_rate": 9.941669701870791e-05, "loss": 0.5176, "step": 559 }, { "epoch": 0.14425089351836945, "grad_norm": 0.4408293427341948, "learning_rate": 9.940982801875198e-05, "loss": 0.4098, "step": 560 }, { "epoch": 0.14425089351836945, "eval_PRM Accuracy": 0.7264150943396226, "eval_PRM F1": 0.8176100628930818, "eval_PRM F1 AUC": 0.6524358302776323, "eval_PRM F1 AUC (fixed)": 0.7624410686223154, "eval_PRM F1 Neg": 0.4528301886792453, "eval_PRM NPV": 0.4, "eval_PRM Precision": 0.8552631578947368, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4998224377632141, "eval_runtime": 17.5111, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 560 }, { "epoch": 0.14450848439965225, "grad_norm": 0.1636596109094242, "learning_rate": 9.940291905047667e-05, "loss": 0.4615, "step": 561 }, { "epoch": 0.14476607528093505, "grad_norm": 0.3288203026034336, "learning_rate": 9.939597011947075e-05, "loss": 0.4137, "step": 562 }, { "epoch": 0.14502366616221785, "grad_norm": 0.1727766161378202, "learning_rate": 9.93889812313553e-05, "loss": 0.4257, "step": 563 }, { "epoch": 0.14528125704350067, "grad_norm": 0.22133306534740338, "learning_rate": 9.938195239178374e-05, "loss": 0.3642, "step": 564 }, { "epoch": 0.14553884792478347, "grad_norm": 0.23564996506576932, "learning_rate": 9.937488360644179e-05, "loss": 0.4865, "step": 565 }, { "epoch": 0.14553884792478347, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8685714285714285, "eval_PRM F1 AUC": 0.610005238344683, "eval_PRM F1 AUC (fixed)": 0.7537977998952331, "eval_PRM F1 Neg": 0.3783783783783784, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8260869565217391, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.5230823755264282, "eval_runtime": 17.63, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 565 }, { "epoch": 0.14579643880606627, "grad_norm": 0.2508803371340414, "learning_rate": 9.936777488104751e-05, "loss": 0.4145, "step": 566 }, { "epoch": 0.14605402968734907, "grad_norm": 0.23956297596171264, "learning_rate": 9.936062622135122e-05, "loss": 0.3944, "step": 567 }, { "epoch": 0.14631162056863187, "grad_norm": 0.21289659087940283, "learning_rate": 9.935343763313559e-05, "loss": 0.4617, "step": 568 }, { "epoch": 0.14656921144991467, "grad_norm": 0.14778690605865993, "learning_rate": 9.934620912221558e-05, "loss": 0.4379, "step": 569 }, { "epoch": 0.14682680233119746, "grad_norm": 0.44236419877530125, "learning_rate": 9.933894069443843e-05, "loss": 0.4767, "step": 570 }, { "epoch": 0.14682680233119746, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8470588235294118, "eval_PRM F1 AUC": 0.607647983237297, "eval_PRM F1 AUC (fixed)": 0.7697747511786275, "eval_PRM F1 Neg": 0.38095238095238093, "eval_PRM NPV": 0.42105263157894735, "eval_PRM Precision": 0.8275862068965517, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4584517180919647, "eval_runtime": 16.7879, "eval_samples_per_second": 2.621, "eval_steps_per_second": 0.179, "step": 570 }, { "epoch": 0.1470843932124803, "grad_norm": 0.14575814167022766, "learning_rate": 9.933163235568367e-05, "loss": 0.4122, "step": 571 }, { "epoch": 0.1473419840937631, "grad_norm": 0.24990219221165175, "learning_rate": 9.932428411186315e-05, "loss": 0.4993, "step": 572 }, { "epoch": 0.1475995749750459, "grad_norm": 0.16879855136788025, "learning_rate": 9.93168959689209e-05, "loss": 0.3773, "step": 573 }, { "epoch": 0.1478571658563287, "grad_norm": 0.13860080291382879, "learning_rate": 9.930946793283337e-05, "loss": 0.4355, "step": 574 }, { "epoch": 0.14811475673761149, "grad_norm": 0.26517256347990664, "learning_rate": 9.930200000960918e-05, "loss": 0.4739, "step": 575 }, { "epoch": 0.14811475673761149, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.6160293347302253, "eval_PRM F1 AUC (fixed)": 0.785751702462022, "eval_PRM F1 Neg": 0.3888888888888889, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8279569892473119, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.30434782608695654, "eval_loss": 0.5024858117103577, "eval_runtime": 17.4454, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 575 }, { "epoch": 0.14837234761889428, "grad_norm": 0.3003378646329778, "learning_rate": 9.929449220528921e-05, "loss": 0.4226, "step": 576 }, { "epoch": 0.14862993850017708, "grad_norm": 0.17494421357782064, "learning_rate": 9.928694452594668e-05, "loss": 0.4519, "step": 577 }, { "epoch": 0.1488875293814599, "grad_norm": 0.22765598168556703, "learning_rate": 9.927935697768698e-05, "loss": 0.4153, "step": 578 }, { "epoch": 0.1491451202627427, "grad_norm": 0.1344097185209204, "learning_rate": 9.927172956664781e-05, "loss": 0.4616, "step": 579 }, { "epoch": 0.1494027111440255, "grad_norm": 0.16415731918738993, "learning_rate": 9.926406229899907e-05, "loss": 0.5363, "step": 580 }, { "epoch": 0.1494027111440255, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8271604938271605, "eval_PRM F1 AUC": 0.6427448926139341, "eval_PRM F1 AUC (fixed)": 0.7708224201152436, "eval_PRM F1 Neg": 0.44, "eval_PRM NPV": 0.4074074074074074, "eval_PRM Precision": 0.8481012658227848, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4730113744735718, "eval_runtime": 17.0191, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 580 }, { "epoch": 0.1496603020253083, "grad_norm": 0.2707654312129822, "learning_rate": 9.925635518094294e-05, "loss": 0.4373, "step": 581 }, { "epoch": 0.1499178929065911, "grad_norm": 0.29728737295247704, "learning_rate": 9.92486082187138e-05, "loss": 0.4487, "step": 582 }, { "epoch": 0.1501754837878739, "grad_norm": 0.27014933637943056, "learning_rate": 9.924082141857832e-05, "loss": 0.4214, "step": 583 }, { "epoch": 0.1504330746691567, "grad_norm": 0.17698864479805085, "learning_rate": 9.923299478683529e-05, "loss": 0.437, "step": 584 }, { "epoch": 0.1506906655504395, "grad_norm": 0.22061789218307817, "learning_rate": 9.922512832981584e-05, "loss": 0.4341, "step": 585 }, { "epoch": 0.1506906655504395, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8654970760233918, "eval_PRM F1 AUC": 0.6414353064431639, "eval_PRM F1 AUC (fixed)": 0.7723939235201677, "eval_PRM F1 Neg": 0.43902439024390244, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8409090909090909, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.48464134335517883, "eval_runtime": 17.1406, "eval_samples_per_second": 2.567, "eval_steps_per_second": 0.175, "step": 585 }, { "epoch": 0.15094825643172233, "grad_norm": 0.12518709115500176, "learning_rate": 9.921722205388324e-05, "loss": 0.4047, "step": 586 }, { "epoch": 0.15120584731300513, "grad_norm": 0.12534518949469658, "learning_rate": 9.920927596543299e-05, "loss": 0.3973, "step": 587 }, { "epoch": 0.15146343819428792, "grad_norm": 0.27077397791264957, "learning_rate": 9.920129007089279e-05, "loss": 0.4163, "step": 588 }, { "epoch": 0.15172102907557072, "grad_norm": 0.3836375221713533, "learning_rate": 9.919326437672256e-05, "loss": 0.5781, "step": 589 }, { "epoch": 0.15197861995685352, "grad_norm": 0.12441513482581146, "learning_rate": 9.91851988894144e-05, "loss": 0.4091, "step": 590 }, { "epoch": 0.15197861995685352, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.7632268203247774, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.48153409361839294, "eval_runtime": 16.8994, "eval_samples_per_second": 2.604, "eval_steps_per_second": 0.178, "step": 590 }, { "epoch": 0.15223621083813632, "grad_norm": 0.21179237222878922, "learning_rate": 9.917709361549257e-05, "loss": 0.367, "step": 591 }, { "epoch": 0.15249380171941912, "grad_norm": 0.17304497033591962, "learning_rate": 9.916894856151357e-05, "loss": 0.3508, "step": 592 }, { "epoch": 0.15275139260070195, "grad_norm": 0.2454166685449653, "learning_rate": 9.916076373406604e-05, "loss": 0.3496, "step": 593 }, { "epoch": 0.15300898348198474, "grad_norm": 0.15787014111337078, "learning_rate": 9.915253913977081e-05, "loss": 0.47, "step": 594 }, { "epoch": 0.15326657436326754, "grad_norm": 0.1557034906946904, "learning_rate": 9.914427478528086e-05, "loss": 0.3704, "step": 595 }, { "epoch": 0.15326657436326754, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8402366863905325, "eval_PRM F1 AUC": 0.6016238868517548, "eval_PRM F1 AUC (fixed)": 0.7739654269250916, "eval_PRM F1 Neg": 0.37209302325581395, "eval_PRM NPV": 0.4, "eval_PRM Precision": 0.8255813953488372, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4736328125, "eval_runtime": 17.6317, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 595 }, { "epoch": 0.15352416524455034, "grad_norm": 0.16299805013993665, "learning_rate": 9.913597067728136e-05, "loss": 0.366, "step": 596 }, { "epoch": 0.15378175612583314, "grad_norm": 0.2558748098135429, "learning_rate": 9.912762682248961e-05, "loss": 0.4376, "step": 597 }, { "epoch": 0.15403934700711594, "grad_norm": 0.15880230898681458, "learning_rate": 9.91192432276551e-05, "loss": 0.4012, "step": 598 }, { "epoch": 0.15429693788839874, "grad_norm": 0.342622293511161, "learning_rate": 9.91108198995594e-05, "loss": 0.5031, "step": 599 }, { "epoch": 0.15455452876968157, "grad_norm": 0.27763131896966214, "learning_rate": 9.910235684501628e-05, "loss": 0.4109, "step": 600 }, { "epoch": 0.15455452876968157, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8414634146341463, "eval_PRM F1 AUC": 0.6547930853850183, "eval_PRM F1 AUC (fixed)": 0.7765845992666317, "eval_PRM F1 Neg": 0.4583333333333333, "eval_PRM NPV": 0.44, "eval_PRM Precision": 0.8518518518518519, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46084871888160706, "eval_runtime": 17.2635, "eval_samples_per_second": 2.549, "eval_steps_per_second": 0.174, "step": 600 }, { "epoch": 0.15481211965096436, "grad_norm": 0.19495500755986214, "learning_rate": 9.909385407087164e-05, "loss": 0.4823, "step": 601 }, { "epoch": 0.15506971053224716, "grad_norm": 0.1662738231837952, "learning_rate": 9.908531158400348e-05, "loss": 0.4359, "step": 602 }, { "epoch": 0.15532730141352996, "grad_norm": 0.24425168108186104, "learning_rate": 9.907672939132194e-05, "loss": 0.4882, "step": 603 }, { "epoch": 0.15558489229481276, "grad_norm": 0.34371667637053854, "learning_rate": 9.90681074997693e-05, "loss": 0.4093, "step": 604 }, { "epoch": 0.15584248317609556, "grad_norm": 0.21489885476226608, "learning_rate": 9.905944591631989e-05, "loss": 0.4114, "step": 605 }, { "epoch": 0.15584248317609556, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.78365636458879, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4428267180919647, "eval_runtime": 17.6587, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 605 }, { "epoch": 0.15610007405737836, "grad_norm": 0.19266685254832466, "learning_rate": 9.905074464798024e-05, "loss": 0.4228, "step": 606 }, { "epoch": 0.15635766493866118, "grad_norm": 0.2251564834529174, "learning_rate": 9.90420037017889e-05, "loss": 0.467, "step": 607 }, { "epoch": 0.15661525581994398, "grad_norm": 0.45729581506743594, "learning_rate": 9.903322308481653e-05, "loss": 0.5991, "step": 608 }, { "epoch": 0.15687284670122678, "grad_norm": 0.2339539113090074, "learning_rate": 9.902440280416594e-05, "loss": 0.4402, "step": 609 }, { "epoch": 0.15713043758250958, "grad_norm": 0.18198996585166632, "learning_rate": 9.901554286697194e-05, "loss": 0.4522, "step": 610 }, { "epoch": 0.15713043758250958, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.7949188056574122, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.43448153138160706, "eval_runtime": 16.8939, "eval_samples_per_second": 2.604, "eval_steps_per_second": 0.178, "step": 610 }, { "epoch": 0.15738802846379238, "grad_norm": 0.1639411644773044, "learning_rate": 9.90066432804015e-05, "loss": 0.4075, "step": 611 }, { "epoch": 0.15764561934507518, "grad_norm": 0.15815955150830535, "learning_rate": 9.899770405165361e-05, "loss": 0.4248, "step": 612 }, { "epoch": 0.15790321022635798, "grad_norm": 0.14162794618236046, "learning_rate": 9.898872518795932e-05, "loss": 0.4081, "step": 613 }, { "epoch": 0.1581608011076408, "grad_norm": 0.1732530807850286, "learning_rate": 9.897970669658179e-05, "loss": 0.5186, "step": 614 }, { "epoch": 0.1584183919889236, "grad_norm": 0.1591015472447936, "learning_rate": 9.897064858481617e-05, "loss": 0.5341, "step": 615 }, { "epoch": 0.1584183919889236, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8082765845992665, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4280894994735718, "eval_runtime": 17.1846, "eval_samples_per_second": 2.56, "eval_steps_per_second": 0.175, "step": 615 }, { "epoch": 0.1586759828702064, "grad_norm": 0.12295791241989529, "learning_rate": 9.896155085998975e-05, "loss": 0.3893, "step": 616 }, { "epoch": 0.1589335737514892, "grad_norm": 0.21121958874624774, "learning_rate": 9.895241352946177e-05, "loss": 0.4044, "step": 617 }, { "epoch": 0.159191164632772, "grad_norm": 0.16536974448875036, "learning_rate": 9.894323660062355e-05, "loss": 0.3859, "step": 618 }, { "epoch": 0.1594487555140548, "grad_norm": 0.1282038086427594, "learning_rate": 9.893402008089846e-05, "loss": 0.3675, "step": 619 }, { "epoch": 0.1597063463953376, "grad_norm": 0.13244793629971566, "learning_rate": 9.892476397774186e-05, "loss": 0.4034, "step": 620 }, { "epoch": 0.1597063463953376, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.816919853326349, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4388316869735718, "eval_runtime": 16.9877, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 620 }, { "epoch": 0.15996393727662042, "grad_norm": 0.12452336620676328, "learning_rate": 9.891546829864115e-05, "loss": 0.3525, "step": 621 }, { "epoch": 0.16022152815790322, "grad_norm": 0.1293755399419532, "learning_rate": 9.890613305111573e-05, "loss": 0.3772, "step": 622 }, { "epoch": 0.16047911903918602, "grad_norm": 0.1472043938786218, "learning_rate": 9.889675824271702e-05, "loss": 0.3906, "step": 623 }, { "epoch": 0.16073670992046882, "grad_norm": 0.1937422838204494, "learning_rate": 9.888734388102846e-05, "loss": 0.4236, "step": 624 }, { "epoch": 0.16099430080175162, "grad_norm": 0.23154168480630893, "learning_rate": 9.887788997366542e-05, "loss": 0.3951, "step": 625 }, { "epoch": 0.16099430080175162, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.8061812467260345, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4663529694080353, "eval_runtime": 16.9729, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 625 }, { "epoch": 0.16125189168303442, "grad_norm": 0.1623940427136026, "learning_rate": 9.886839652827535e-05, "loss": 0.3886, "step": 626 }, { "epoch": 0.1615094825643172, "grad_norm": 0.17304434957011025, "learning_rate": 9.885886355253758e-05, "loss": 0.4262, "step": 627 }, { "epoch": 0.1617670734456, "grad_norm": 0.21701077444991348, "learning_rate": 9.884929105416352e-05, "loss": 0.3799, "step": 628 }, { "epoch": 0.16202466432688284, "grad_norm": 0.18532237415497269, "learning_rate": 9.883967904089646e-05, "loss": 0.354, "step": 629 }, { "epoch": 0.16228225520816564, "grad_norm": 0.3017205197744428, "learning_rate": 9.883002752051172e-05, "loss": 0.4886, "step": 630 }, { "epoch": 0.16228225520816564, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.84472049689441, "eval_PRM F1 AUC": 0.6922472498690415, "eval_PRM F1 AUC (fixed)": 0.7812991094814038, "eval_PRM F1 Neg": 0.5098039215686274, "eval_PRM NPV": 0.4642857142857143, "eval_PRM Precision": 0.8717948717948718, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.48837003111839294, "eval_runtime": 17.0394, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 630 }, { "epoch": 0.16253984608944844, "grad_norm": 0.19832066024351758, "learning_rate": 9.882033650081656e-05, "loss": 0.4964, "step": 631 }, { "epoch": 0.16279743697073124, "grad_norm": 0.25106766964391797, "learning_rate": 9.881060598965017e-05, "loss": 0.4588, "step": 632 }, { "epoch": 0.16305502785201403, "grad_norm": 0.16820083455872828, "learning_rate": 9.88008359948837e-05, "loss": 0.4158, "step": 633 }, { "epoch": 0.16331261873329683, "grad_norm": 0.13897970781754732, "learning_rate": 9.879102652442024e-05, "loss": 0.3465, "step": 634 }, { "epoch": 0.16357020961457963, "grad_norm": 0.21733232579412023, "learning_rate": 9.878117758619483e-05, "loss": 0.4867, "step": 635 }, { "epoch": 0.16357020961457963, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.7888947092718699, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4793146252632141, "eval_runtime": 16.8841, "eval_samples_per_second": 2.606, "eval_steps_per_second": 0.178, "step": 635 }, { "epoch": 0.16382780049586246, "grad_norm": 0.24553401011337908, "learning_rate": 9.877128918817438e-05, "loss": 0.5677, "step": 636 }, { "epoch": 0.16408539137714526, "grad_norm": 0.19633898799616223, "learning_rate": 9.876136133835779e-05, "loss": 0.4463, "step": 637 }, { "epoch": 0.16434298225842806, "grad_norm": 0.21283256236770995, "learning_rate": 9.875139404477583e-05, "loss": 0.4492, "step": 638 }, { "epoch": 0.16460057313971085, "grad_norm": 0.20776709367960883, "learning_rate": 9.874138731549118e-05, "loss": 0.3329, "step": 639 }, { "epoch": 0.16485816402099365, "grad_norm": 0.1459764071074001, "learning_rate": 9.873134115859846e-05, "loss": 0.4164, "step": 640 }, { "epoch": 0.16485816402099365, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8301886792452831, "eval_PRM F1 AUC": 0.6801990570979571, "eval_PRM F1 AUC (fixed)": 0.7700366684127815, "eval_PRM F1 Neg": 0.49056603773584906, "eval_PRM NPV": 0.43333333333333335, "eval_PRM Precision": 0.868421052631579, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4796697497367859, "eval_runtime": 17.0848, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 640 }, { "epoch": 0.16511575490227645, "grad_norm": 0.14339358364490282, "learning_rate": 9.872125558222409e-05, "loss": 0.3873, "step": 641 }, { "epoch": 0.16537334578355925, "grad_norm": 0.13491590441467222, "learning_rate": 9.87111305945265e-05, "loss": 0.405, "step": 642 }, { "epoch": 0.16563093666484208, "grad_norm": 0.17369455599043898, "learning_rate": 9.870096620369588e-05, "loss": 0.4617, "step": 643 }, { "epoch": 0.16588852754612488, "grad_norm": 0.17412662325525785, "learning_rate": 9.86907624179544e-05, "loss": 0.4395, "step": 644 }, { "epoch": 0.16614611842740767, "grad_norm": 0.15648856160595107, "learning_rate": 9.868051924555604e-05, "loss": 0.4099, "step": 645 }, { "epoch": 0.16614611842740767, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.7658459926663175, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4887251555919647, "eval_runtime": 17.4777, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 645 }, { "epoch": 0.16640370930869047, "grad_norm": 0.13481567407746478, "learning_rate": 9.867023669478663e-05, "loss": 0.3853, "step": 646 }, { "epoch": 0.16666130018997327, "grad_norm": 0.16480165211419467, "learning_rate": 9.865991477396389e-05, "loss": 0.4374, "step": 647 }, { "epoch": 0.16691889107125607, "grad_norm": 0.18018135544254535, "learning_rate": 9.864955349143734e-05, "loss": 0.3137, "step": 648 }, { "epoch": 0.16717648195253887, "grad_norm": 0.24524899870695566, "learning_rate": 9.863915285558842e-05, "loss": 0.4701, "step": 649 }, { "epoch": 0.1674340728338217, "grad_norm": 0.17646733473636492, "learning_rate": 9.862871287483031e-05, "loss": 0.4509, "step": 650 }, { "epoch": 0.1674340728338217, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.7640125720272394, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.5013316869735718, "eval_runtime": 17.2256, "eval_samples_per_second": 2.554, "eval_steps_per_second": 0.174, "step": 650 }, { "epoch": 0.1676916637151045, "grad_norm": 0.15937218329200434, "learning_rate": 9.861823355760806e-05, "loss": 0.3599, "step": 651 }, { "epoch": 0.1679492545963873, "grad_norm": 0.3289575061927892, "learning_rate": 9.860771491239858e-05, "loss": 0.6103, "step": 652 }, { "epoch": 0.1682068454776701, "grad_norm": 0.17863045278628034, "learning_rate": 9.859715694771053e-05, "loss": 0.38, "step": 653 }, { "epoch": 0.1684644363589529, "grad_norm": 0.1585090949938342, "learning_rate": 9.858655967208439e-05, "loss": 0.4371, "step": 654 }, { "epoch": 0.1687220272402357, "grad_norm": 0.19057423234458407, "learning_rate": 9.857592309409247e-05, "loss": 0.3568, "step": 655 }, { "epoch": 0.1687220272402357, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.7551073860660031, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.5083451867103577, "eval_runtime": 16.3698, "eval_samples_per_second": 2.688, "eval_steps_per_second": 0.183, "step": 655 }, { "epoch": 0.1689796181215185, "grad_norm": 0.18323061816255004, "learning_rate": 9.856524722233884e-05, "loss": 0.438, "step": 656 }, { "epoch": 0.16923720900280131, "grad_norm": 0.16272978610400557, "learning_rate": 9.855453206545935e-05, "loss": 0.4271, "step": 657 }, { "epoch": 0.1694947998840841, "grad_norm": 0.23468911850628899, "learning_rate": 9.854377763212165e-05, "loss": 0.3553, "step": 658 }, { "epoch": 0.1697523907653669, "grad_norm": 0.18744583407611537, "learning_rate": 9.85329839310252e-05, "loss": 0.4781, "step": 659 }, { "epoch": 0.1700099816466497, "grad_norm": 0.27561193725327016, "learning_rate": 9.852215097090111e-05, "loss": 0.5132, "step": 660 }, { "epoch": 0.1700099816466497, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.7773703509690938, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4916548430919647, "eval_runtime": 17.1452, "eval_samples_per_second": 2.566, "eval_steps_per_second": 0.175, "step": 660 }, { "epoch": 0.1702675725279325, "grad_norm": 0.15231121801516695, "learning_rate": 9.851127876051236e-05, "loss": 0.4001, "step": 661 }, { "epoch": 0.1705251634092153, "grad_norm": 0.18241783473583673, "learning_rate": 9.850036730865364e-05, "loss": 0.3844, "step": 662 }, { "epoch": 0.1707827542904981, "grad_norm": 0.15668351745371425, "learning_rate": 9.848941662415134e-05, "loss": 0.4022, "step": 663 }, { "epoch": 0.1710403451717809, "grad_norm": 0.20632946751665437, "learning_rate": 9.847842671586368e-05, "loss": 0.474, "step": 664 }, { "epoch": 0.17129793605306373, "grad_norm": 0.2153198389229454, "learning_rate": 9.846739759268052e-05, "loss": 0.3973, "step": 665 }, { "epoch": 0.17129793605306373, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8333333333333334, "eval_PRM F1 AUC": 0.7176532215819801, "eval_PRM F1 AUC (fixed)": 0.7925615505500262, "eval_PRM F1 Neg": 0.5357142857142857, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8904109589041096, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.4423828125, "eval_runtime": 17.0767, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 665 }, { "epoch": 0.17155552693434653, "grad_norm": 0.24999244006409765, "learning_rate": 9.845632926352348e-05, "loss": 0.4994, "step": 666 }, { "epoch": 0.17181311781562933, "grad_norm": 0.2967977515854507, "learning_rate": 9.844522173734592e-05, "loss": 0.3771, "step": 667 }, { "epoch": 0.17207070869691213, "grad_norm": 0.26746297579695144, "learning_rate": 9.843407502313282e-05, "loss": 0.4001, "step": 668 }, { "epoch": 0.17232829957819493, "grad_norm": 0.17058731150960188, "learning_rate": 9.842288912990096e-05, "loss": 0.3965, "step": 669 }, { "epoch": 0.17258589045947773, "grad_norm": 0.1778065780640039, "learning_rate": 9.841166406669877e-05, "loss": 0.4523, "step": 670 }, { "epoch": 0.17258589045947773, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8103719224724988, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.41184303164482117, "eval_runtime": 16.9731, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 670 }, { "epoch": 0.17284348134076052, "grad_norm": 0.31129934399896336, "learning_rate": 9.840039984260634e-05, "loss": 0.4905, "step": 671 }, { "epoch": 0.17310107222204335, "grad_norm": 0.1258029131348985, "learning_rate": 9.838909646673549e-05, "loss": 0.333, "step": 672 }, { "epoch": 0.17335866310332615, "grad_norm": 0.16695596415017197, "learning_rate": 9.837775394822965e-05, "loss": 0.3892, "step": 673 }, { "epoch": 0.17361625398460895, "grad_norm": 0.3017701623634423, "learning_rate": 9.8366372296264e-05, "loss": 0.3822, "step": 674 }, { "epoch": 0.17387384486589175, "grad_norm": 0.19166938021469296, "learning_rate": 9.835495152004525e-05, "loss": 0.4365, "step": 675 }, { "epoch": 0.17387384486589175, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.795180722891566, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.42356178164482117, "eval_runtime": 16.9552, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 675 }, { "epoch": 0.17413143574717455, "grad_norm": 0.23536978986739074, "learning_rate": 9.83434916288119e-05, "loss": 0.4063, "step": 676 }, { "epoch": 0.17438902662845734, "grad_norm": 0.18774279660642884, "learning_rate": 9.833199263183397e-05, "loss": 0.3721, "step": 677 }, { "epoch": 0.17464661750974014, "grad_norm": 0.17259884970457762, "learning_rate": 9.832045453841318e-05, "loss": 0.3639, "step": 678 }, { "epoch": 0.17490420839102297, "grad_norm": 0.14308034016674614, "learning_rate": 9.830887735788287e-05, "loss": 0.3857, "step": 679 }, { "epoch": 0.17516179927230577, "grad_norm": 0.17253077784863272, "learning_rate": 9.829726109960797e-05, "loss": 0.4504, "step": 680 }, { "epoch": 0.17516179927230577, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.785227867993714, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4419389069080353, "eval_runtime": 17.177, "eval_samples_per_second": 2.562, "eval_steps_per_second": 0.175, "step": 680 }, { "epoch": 0.17541939015358857, "grad_norm": 0.16508665536775802, "learning_rate": 9.828560577298506e-05, "loss": 0.3882, "step": 681 }, { "epoch": 0.17567698103487137, "grad_norm": 0.23190791244069672, "learning_rate": 9.827391138744228e-05, "loss": 0.4693, "step": 682 }, { "epoch": 0.17593457191615416, "grad_norm": 0.15595323621705906, "learning_rate": 9.82621779524394e-05, "loss": 0.3928, "step": 683 }, { "epoch": 0.17619216279743696, "grad_norm": 0.16183023013035544, "learning_rate": 9.825040547746775e-05, "loss": 0.3593, "step": 684 }, { "epoch": 0.17644975367871976, "grad_norm": 0.19154156099368147, "learning_rate": 9.823859397205026e-05, "loss": 0.4246, "step": 685 }, { "epoch": 0.17644975367871976, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.7920377160817181, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4419389069080353, "eval_runtime": 16.9346, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 685 }, { "epoch": 0.1767073445600026, "grad_norm": 0.1618543609679037, "learning_rate": 9.822674344574144e-05, "loss": 0.3815, "step": 686 }, { "epoch": 0.1769649354412854, "grad_norm": 0.3216490040480785, "learning_rate": 9.821485390812733e-05, "loss": 0.5033, "step": 687 }, { "epoch": 0.17722252632256819, "grad_norm": 0.16829711684006338, "learning_rate": 9.820292536882556e-05, "loss": 0.4262, "step": 688 }, { "epoch": 0.17748011720385098, "grad_norm": 0.15787994725503365, "learning_rate": 9.81909578374853e-05, "loss": 0.505, "step": 689 }, { "epoch": 0.17773770808513378, "grad_norm": 0.19522280952391355, "learning_rate": 9.817895132378725e-05, "loss": 0.4339, "step": 690 }, { "epoch": 0.17773770808513378, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8354430379746836, "eval_PRM F1 AUC": 0.7019381875327397, "eval_PRM F1 AUC (fixed)": 0.7917757988475642, "eval_PRM F1 Neg": 0.5185185185185185, "eval_PRM NPV": 0.45161290322580644, "eval_PRM Precision": 0.88, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.45614346861839294, "eval_runtime": 17.1136, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 690 }, { "epoch": 0.17799529896641658, "grad_norm": 0.28504389079299514, "learning_rate": 9.816690583744365e-05, "loss": 0.426, "step": 691 }, { "epoch": 0.17825288984769938, "grad_norm": 0.143898851373031, "learning_rate": 9.815482138819828e-05, "loss": 0.4758, "step": 692 }, { "epoch": 0.1785104807289822, "grad_norm": 0.24346195842723017, "learning_rate": 9.81426979858264e-05, "loss": 0.3278, "step": 693 }, { "epoch": 0.178768071610265, "grad_norm": 0.11310363925185545, "learning_rate": 9.813053564013484e-05, "loss": 0.3266, "step": 694 }, { "epoch": 0.1790256624915478, "grad_norm": 0.24451936762572263, "learning_rate": 9.811833436096186e-05, "loss": 0.394, "step": 695 }, { "epoch": 0.1790256624915478, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.8069669984284966, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.44699928164482117, "eval_runtime": 16.9839, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 695 }, { "epoch": 0.1792832533728306, "grad_norm": 0.176740775173657, "learning_rate": 9.810609415817727e-05, "loss": 0.3819, "step": 696 }, { "epoch": 0.1795408442541134, "grad_norm": 0.16027318002171667, "learning_rate": 9.809381504168234e-05, "loss": 0.4551, "step": 697 }, { "epoch": 0.1797984351353962, "grad_norm": 0.11939734809378039, "learning_rate": 9.808149702140983e-05, "loss": 0.3272, "step": 698 }, { "epoch": 0.180056026016679, "grad_norm": 0.15004215332483806, "learning_rate": 9.806914010732395e-05, "loss": 0.4346, "step": 699 }, { "epoch": 0.18031361689796183, "grad_norm": 0.1189821211202139, "learning_rate": 9.805674430942038e-05, "loss": 0.381, "step": 700 }, { "epoch": 0.18031361689796183, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.7985856469355683, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4493963122367859, "eval_runtime": 17.6285, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 700 }, { "epoch": 0.18057120777924462, "grad_norm": 0.14680025815997552, "learning_rate": 9.80443096377263e-05, "loss": 0.4104, "step": 701 }, { "epoch": 0.18082879866052742, "grad_norm": 0.13239596703644493, "learning_rate": 9.803183610230024e-05, "loss": 0.4173, "step": 702 }, { "epoch": 0.18108638954181022, "grad_norm": 0.21879212415674984, "learning_rate": 9.801932371323228e-05, "loss": 0.3054, "step": 703 }, { "epoch": 0.18134398042309302, "grad_norm": 0.19389884767672666, "learning_rate": 9.800677248064382e-05, "loss": 0.4646, "step": 704 }, { "epoch": 0.18160157130437582, "grad_norm": 0.1441583153096296, "learning_rate": 9.799418241468775e-05, "loss": 0.3857, "step": 705 }, { "epoch": 0.18160157130437582, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8343558282208589, "eval_PRM F1 AUC": 0.6487689889994761, "eval_PRM F1 AUC (fixed)": 0.7922996333158722, "eval_PRM F1 Neg": 0.4489795918367347, "eval_PRM NPV": 0.4230769230769231, "eval_PRM Precision": 0.85, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4591619372367859, "eval_runtime": 17.1547, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 705 }, { "epoch": 0.18185916218565862, "grad_norm": 0.17259266561515865, "learning_rate": 9.798155352554836e-05, "loss": 0.4183, "step": 706 }, { "epoch": 0.18211675306694142, "grad_norm": 0.24418359176201268, "learning_rate": 9.796888582344135e-05, "loss": 0.4182, "step": 707 }, { "epoch": 0.18237434394822424, "grad_norm": 0.17618402257807567, "learning_rate": 9.795617931861379e-05, "loss": 0.4445, "step": 708 }, { "epoch": 0.18263193482950704, "grad_norm": 0.1407033934250589, "learning_rate": 9.794343402134414e-05, "loss": 0.3682, "step": 709 }, { "epoch": 0.18288952571078984, "grad_norm": 0.12444465439617118, "learning_rate": 9.793064994194227e-05, "loss": 0.3716, "step": 710 }, { "epoch": 0.18288952571078984, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.7778941854374017, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.48366478085517883, "eval_runtime": 17.4779, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 710 }, { "epoch": 0.18314711659207264, "grad_norm": 0.1885154528557264, "learning_rate": 9.791782709074944e-05, "loss": 0.4482, "step": 711 }, { "epoch": 0.18340470747335544, "grad_norm": 0.2084121178583777, "learning_rate": 9.790496547813818e-05, "loss": 0.397, "step": 712 }, { "epoch": 0.18366229835463824, "grad_norm": 0.18995844826892994, "learning_rate": 9.789206511451246e-05, "loss": 0.431, "step": 713 }, { "epoch": 0.18391988923592104, "grad_norm": 0.1672234048350745, "learning_rate": 9.787912601030758e-05, "loss": 0.3347, "step": 714 }, { "epoch": 0.18417748011720386, "grad_norm": 0.23976725387657785, "learning_rate": 9.786614817599014e-05, "loss": 0.3865, "step": 715 }, { "epoch": 0.18417748011720386, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.7655840754321633, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.5034623742103577, "eval_runtime": 17.0738, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 715 }, { "epoch": 0.18443507099848666, "grad_norm": 0.19241961064016783, "learning_rate": 9.785313162205811e-05, "loss": 0.4392, "step": 716 }, { "epoch": 0.18469266187976946, "grad_norm": 0.17170470742937655, "learning_rate": 9.784007635904078e-05, "loss": 0.4119, "step": 717 }, { "epoch": 0.18495025276105226, "grad_norm": 0.3564333460795497, "learning_rate": 9.782698239749873e-05, "loss": 0.5353, "step": 718 }, { "epoch": 0.18520784364233506, "grad_norm": 0.19042268984096947, "learning_rate": 9.781384974802384e-05, "loss": 0.3812, "step": 719 }, { "epoch": 0.18546543452361786, "grad_norm": 0.1841518362260629, "learning_rate": 9.780067842123932e-05, "loss": 0.3837, "step": 720 }, { "epoch": 0.18546543452361786, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8414634146341463, "eval_PRM F1 AUC": 0.6547930853850183, "eval_PRM F1 AUC (fixed)": 0.7747511786275537, "eval_PRM F1 Neg": 0.4583333333333333, "eval_PRM NPV": 0.44, "eval_PRM Precision": 0.8518518518518519, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4703480005264282, "eval_runtime": 17.027, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 720 }, { "epoch": 0.18572302540490065, "grad_norm": 0.14523048812798553, "learning_rate": 9.778746842779962e-05, "loss": 0.3908, "step": 721 }, { "epoch": 0.18598061628618348, "grad_norm": 0.2404417369064902, "learning_rate": 9.777421977839053e-05, "loss": 0.4869, "step": 722 }, { "epoch": 0.18623820716746628, "grad_norm": 0.24401582523659818, "learning_rate": 9.776093248372904e-05, "loss": 0.3266, "step": 723 }, { "epoch": 0.18649579804874908, "grad_norm": 0.14511178744116965, "learning_rate": 9.774760655456345e-05, "loss": 0.3733, "step": 724 }, { "epoch": 0.18675338893003188, "grad_norm": 0.1669798992396188, "learning_rate": 9.77342420016733e-05, "loss": 0.4016, "step": 725 }, { "epoch": 0.18675338893003188, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.7797276060764797, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.43758878111839294, "eval_runtime": 16.9726, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 725 }, { "epoch": 0.18701097981131468, "grad_norm": 0.2225144894529699, "learning_rate": 9.772083883586936e-05, "loss": 0.4693, "step": 726 }, { "epoch": 0.18726857069259747, "grad_norm": 0.21140379196640652, "learning_rate": 9.770739706799363e-05, "loss": 0.4119, "step": 727 }, { "epoch": 0.18752616157388027, "grad_norm": 0.14808478866451108, "learning_rate": 9.769391670891936e-05, "loss": 0.4312, "step": 728 }, { "epoch": 0.1877837524551631, "grad_norm": 0.16545059820296004, "learning_rate": 9.768039776955102e-05, "loss": 0.3698, "step": 729 }, { "epoch": 0.1880413433364459, "grad_norm": 0.19797455075357506, "learning_rate": 9.766684026082427e-05, "loss": 0.4312, "step": 730 }, { "epoch": 0.1880413433364459, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.78889470927187, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4273792505264282, "eval_runtime": 17.6199, "eval_samples_per_second": 2.497, "eval_steps_per_second": 0.17, "step": 730 }, { "epoch": 0.1882989342177287, "grad_norm": 0.170939002594386, "learning_rate": 9.765324419370595e-05, "loss": 0.4068, "step": 731 }, { "epoch": 0.1885565250990115, "grad_norm": 0.17609581400732574, "learning_rate": 9.763960957919413e-05, "loss": 0.4073, "step": 732 }, { "epoch": 0.1888141159802943, "grad_norm": 0.23961640293275535, "learning_rate": 9.762593642831805e-05, "loss": 0.4086, "step": 733 }, { "epoch": 0.1890717068615771, "grad_norm": 0.25101595087816564, "learning_rate": 9.761222475213811e-05, "loss": 0.424, "step": 734 }, { "epoch": 0.1893292977428599, "grad_norm": 0.37737375725226296, "learning_rate": 9.75984745617459e-05, "loss": 0.5042, "step": 735 }, { "epoch": 0.1893292977428599, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.7875851231011001, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4454900622367859, "eval_runtime": 16.443, "eval_samples_per_second": 2.676, "eval_steps_per_second": 0.182, "step": 735 }, { "epoch": 0.18958688862414272, "grad_norm": 0.152758559386544, "learning_rate": 9.758468586826413e-05, "loss": 0.3539, "step": 736 }, { "epoch": 0.18984447950542552, "grad_norm": 0.17933481161507048, "learning_rate": 9.757085868284666e-05, "loss": 0.3642, "step": 737 }, { "epoch": 0.19010207038670832, "grad_norm": 0.3803071586187389, "learning_rate": 9.755699301667851e-05, "loss": 0.4196, "step": 738 }, { "epoch": 0.19035966126799111, "grad_norm": 0.17381527089661578, "learning_rate": 9.754308888097583e-05, "loss": 0.348, "step": 739 }, { "epoch": 0.1906172521492739, "grad_norm": 0.1755864297637989, "learning_rate": 9.752914628698586e-05, "loss": 0.4574, "step": 740 }, { "epoch": 0.1906172521492739, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8333333333333334, "eval_PRM F1 AUC": 0.7176532215819801, "eval_PRM F1 AUC (fixed)": 0.7729177579884755, "eval_PRM F1 Neg": 0.5357142857142857, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8904109589041096, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.46981534361839294, "eval_runtime": 16.851, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 740 }, { "epoch": 0.1908748430305567, "grad_norm": 0.21612637159514025, "learning_rate": 9.751516524598696e-05, "loss": 0.4121, "step": 741 }, { "epoch": 0.1911324339118395, "grad_norm": 0.3550694559997702, "learning_rate": 9.750114576928862e-05, "loss": 0.5301, "step": 742 }, { "epoch": 0.1913900247931223, "grad_norm": 0.24408273606929198, "learning_rate": 9.748708786823138e-05, "loss": 0.3451, "step": 743 }, { "epoch": 0.19164761567440514, "grad_norm": 0.19514048935188616, "learning_rate": 9.747299155418685e-05, "loss": 0.4174, "step": 744 }, { "epoch": 0.19190520655568793, "grad_norm": 0.23026704504127513, "learning_rate": 9.74588568385578e-05, "loss": 0.4779, "step": 745 }, { "epoch": 0.19190520655568793, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8837209302325582, "eval_PRM F1 AUC": 0.6752226296490309, "eval_PRM F1 AUC (fixed)": 0.7823467784180198, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5882352941176471, "eval_PRM Precision": 0.8539325842696629, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.47256746888160706, "eval_runtime": 17.5688, "eval_samples_per_second": 2.504, "eval_steps_per_second": 0.171, "step": 745 }, { "epoch": 0.19216279743697073, "grad_norm": 0.19241262553746935, "learning_rate": 9.744468373277797e-05, "loss": 0.3714, "step": 746 }, { "epoch": 0.19242038831825353, "grad_norm": 0.24726756595075375, "learning_rate": 9.743047224831217e-05, "loss": 0.5159, "step": 747 }, { "epoch": 0.19267797919953633, "grad_norm": 0.29366301569104414, "learning_rate": 9.741622239665631e-05, "loss": 0.4148, "step": 748 }, { "epoch": 0.19293557008081913, "grad_norm": 0.1950838719158936, "learning_rate": 9.740193418933728e-05, "loss": 0.3973, "step": 749 }, { "epoch": 0.19319316096210193, "grad_norm": 0.20510230996291545, "learning_rate": 9.738760763791303e-05, "loss": 0.3554, "step": 750 }, { "epoch": 0.19319316096210193, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.7776322682032477, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4508167505264282, "eval_runtime": 17.5177, "eval_samples_per_second": 2.512, "eval_steps_per_second": 0.171, "step": 750 }, { "epoch": 0.19345075184338476, "grad_norm": 0.19898803672075183, "learning_rate": 9.73732427539725e-05, "loss": 0.363, "step": 751 }, { "epoch": 0.19370834272466755, "grad_norm": 0.1432817107182984, "learning_rate": 9.735883954913565e-05, "loss": 0.3756, "step": 752 }, { "epoch": 0.19396593360595035, "grad_norm": 0.1881536741065255, "learning_rate": 9.734439803505345e-05, "loss": 0.3625, "step": 753 }, { "epoch": 0.19422352448723315, "grad_norm": 0.12158895906899068, "learning_rate": 9.732991822340785e-05, "loss": 0.3648, "step": 754 }, { "epoch": 0.19448111536851595, "grad_norm": 0.17723149507279376, "learning_rate": 9.731540012591176e-05, "loss": 0.4379, "step": 755 }, { "epoch": 0.19448111536851595, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.7692509167103195, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4884588122367859, "eval_runtime": 17.1302, "eval_samples_per_second": 2.569, "eval_steps_per_second": 0.175, "step": 755 }, { "epoch": 0.19473870624979875, "grad_norm": 0.1692840674810335, "learning_rate": 9.730084375430908e-05, "loss": 0.3276, "step": 756 }, { "epoch": 0.19499629713108155, "grad_norm": 0.1871394545447885, "learning_rate": 9.728624912037468e-05, "loss": 0.343, "step": 757 }, { "epoch": 0.19525388801236437, "grad_norm": 0.17511018151942143, "learning_rate": 9.727161623591437e-05, "loss": 0.3519, "step": 758 }, { "epoch": 0.19551147889364717, "grad_norm": 0.22041489318437088, "learning_rate": 9.72569451127649e-05, "loss": 0.5358, "step": 759 }, { "epoch": 0.19576906977492997, "grad_norm": 0.21720558104730403, "learning_rate": 9.724223576279395e-05, "loss": 0.3526, "step": 760 }, { "epoch": 0.19576906977492997, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.7689889994761655, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.48606178164482117, "eval_runtime": 17.3554, "eval_samples_per_second": 2.535, "eval_steps_per_second": 0.173, "step": 760 }, { "epoch": 0.19602666065621277, "grad_norm": 0.17551041408187082, "learning_rate": 9.722748819790011e-05, "loss": 0.3745, "step": 761 }, { "epoch": 0.19628425153749557, "grad_norm": 0.1898005383137732, "learning_rate": 9.721270243001291e-05, "loss": 0.3917, "step": 762 }, { "epoch": 0.19654184241877837, "grad_norm": 0.1561591738808733, "learning_rate": 9.719787847109277e-05, "loss": 0.4333, "step": 763 }, { "epoch": 0.19679943330006117, "grad_norm": 0.15861873391394862, "learning_rate": 9.7183016333131e-05, "loss": 0.4221, "step": 764 }, { "epoch": 0.197057024181344, "grad_norm": 0.16657975948790257, "learning_rate": 9.716811602814979e-05, "loss": 0.4818, "step": 765 }, { "epoch": 0.197057024181344, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.7763226820324777, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.47958096861839294, "eval_runtime": 17.0454, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 765 }, { "epoch": 0.1973146150626268, "grad_norm": 0.14504239882322556, "learning_rate": 9.715317756820223e-05, "loss": 0.4516, "step": 766 }, { "epoch": 0.1975722059439096, "grad_norm": 0.14639368262114139, "learning_rate": 9.713820096537225e-05, "loss": 0.4258, "step": 767 }, { "epoch": 0.1978297968251924, "grad_norm": 0.19299648566477917, "learning_rate": 9.712318623177462e-05, "loss": 0.3764, "step": 768 }, { "epoch": 0.1980873877064752, "grad_norm": 0.23503011870891174, "learning_rate": 9.7108133379555e-05, "loss": 0.4836, "step": 769 }, { "epoch": 0.198344978587758, "grad_norm": 0.17907646710776773, "learning_rate": 9.709304242088984e-05, "loss": 0.4597, "step": 770 }, { "epoch": 0.198344978587758, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8395061728395061, "eval_PRM F1 AUC": 0.6705081194342588, "eval_PRM F1 AUC (fixed)": 0.7962283918281823, "eval_PRM F1 Neg": 0.48, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8607594936708861, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4485973119735718, "eval_runtime": 17.5214, "eval_samples_per_second": 2.511, "eval_steps_per_second": 0.171, "step": 770 }, { "epoch": 0.19860256946904079, "grad_norm": 0.17476764075194923, "learning_rate": 9.707791336798643e-05, "loss": 0.3892, "step": 771 }, { "epoch": 0.1988601603503236, "grad_norm": 0.12482609899561933, "learning_rate": 9.70627462330829e-05, "loss": 0.3539, "step": 772 }, { "epoch": 0.1991177512316064, "grad_norm": 0.16405790688900532, "learning_rate": 9.704754102844812e-05, "loss": 0.4053, "step": 773 }, { "epoch": 0.1993753421128892, "grad_norm": 0.1798409265106501, "learning_rate": 9.703229776638185e-05, "loss": 0.4475, "step": 774 }, { "epoch": 0.199632932994172, "grad_norm": 0.23051915163837344, "learning_rate": 9.701701645921458e-05, "loss": 0.4611, "step": 775 }, { "epoch": 0.199632932994172, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 AUC (fixed)": 0.8192771084337349, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4166370630264282, "eval_runtime": 17.7586, "eval_samples_per_second": 2.478, "eval_steps_per_second": 0.169, "step": 775 }, { "epoch": 0.1998905238754548, "grad_norm": 0.26064744376320587, "learning_rate": 9.700169711930753e-05, "loss": 0.4869, "step": 776 }, { "epoch": 0.2001481147567376, "grad_norm": 0.1999796986883691, "learning_rate": 9.698633975905278e-05, "loss": 0.5008, "step": 777 }, { "epoch": 0.2004057056380204, "grad_norm": 0.14601894484791306, "learning_rate": 9.69709443908731e-05, "loss": 0.3229, "step": 778 }, { "epoch": 0.20066329651930323, "grad_norm": 0.14849870124150014, "learning_rate": 9.695551102722203e-05, "loss": 0.4005, "step": 779 }, { "epoch": 0.20092088740058603, "grad_norm": 0.1488717627910205, "learning_rate": 9.694003968058383e-05, "loss": 0.4319, "step": 780 }, { "epoch": 0.20092088740058603, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8407643312101911, "eval_PRM F1 AUC": 0.7236773179675223, "eval_PRM F1 AUC (fixed)": 0.8101100052383448, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.46875, "eval_PRM Precision": 0.8918918918918919, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.4207208752632141, "eval_runtime": 16.8594, "eval_samples_per_second": 2.61, "eval_steps_per_second": 0.178, "step": 780 }, { "epoch": 0.20117847828186883, "grad_norm": 0.3037648366334819, "learning_rate": 9.692453036347351e-05, "loss": 0.3818, "step": 781 }, { "epoch": 0.20143606916315163, "grad_norm": 0.15315428578747717, "learning_rate": 9.690898308843676e-05, "loss": 0.4629, "step": 782 }, { "epoch": 0.20169366004443443, "grad_norm": 0.11302922927189676, "learning_rate": 9.689339786805001e-05, "loss": 0.3261, "step": 783 }, { "epoch": 0.20195125092571722, "grad_norm": 0.32958898362051664, "learning_rate": 9.687777471492036e-05, "loss": 0.451, "step": 784 }, { "epoch": 0.20220884180700002, "grad_norm": 0.14601671670226055, "learning_rate": 9.686211364168563e-05, "loss": 0.4574, "step": 785 }, { "epoch": 0.20220884180700002, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.8033001571503404, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42453834414482117, "eval_runtime": 16.5518, "eval_samples_per_second": 2.658, "eval_steps_per_second": 0.181, "step": 785 }, { "epoch": 0.20246643268828282, "grad_norm": 0.17151940551861491, "learning_rate": 9.684641466101423e-05, "loss": 0.4361, "step": 786 }, { "epoch": 0.20272402356956565, "grad_norm": 0.3369782781660549, "learning_rate": 9.683067778560536e-05, "loss": 0.4478, "step": 787 }, { "epoch": 0.20298161445084845, "grad_norm": 0.192975450863202, "learning_rate": 9.681490302818874e-05, "loss": 0.3957, "step": 788 }, { "epoch": 0.20323920533213125, "grad_norm": 0.14886576232650187, "learning_rate": 9.679909040152484e-05, "loss": 0.4205, "step": 789 }, { "epoch": 0.20349679621341404, "grad_norm": 0.13937466642036642, "learning_rate": 9.67832399184047e-05, "loss": 0.3992, "step": 790 }, { "epoch": 0.20349679621341404, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.7996333158721843, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4310191869735718, "eval_runtime": 16.4895, "eval_samples_per_second": 2.668, "eval_steps_per_second": 0.182, "step": 790 }, { "epoch": 0.20375438709469684, "grad_norm": 0.19031279307769508, "learning_rate": 9.676735159165002e-05, "loss": 0.4396, "step": 791 }, { "epoch": 0.20401197797597964, "grad_norm": 0.2020213473917749, "learning_rate": 9.675142543411308e-05, "loss": 0.4226, "step": 792 }, { "epoch": 0.20426956885726244, "grad_norm": 0.15671936741014697, "learning_rate": 9.673546145867677e-05, "loss": 0.3852, "step": 793 }, { "epoch": 0.20452715973854527, "grad_norm": 0.1481990620321785, "learning_rate": 9.671945967825461e-05, "loss": 0.3121, "step": 794 }, { "epoch": 0.20478475061982807, "grad_norm": 0.15171912703311316, "learning_rate": 9.670342010579065e-05, "loss": 0.3816, "step": 795 }, { "epoch": 0.20478475061982807, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.8072289156626504, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4208984375, "eval_runtime": 17.0559, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 795 }, { "epoch": 0.20504234150111086, "grad_norm": 0.15307562258543508, "learning_rate": 9.668734275425955e-05, "loss": 0.4493, "step": 796 }, { "epoch": 0.20529993238239366, "grad_norm": 0.15101795775140697, "learning_rate": 9.667122763666647e-05, "loss": 0.3499, "step": 797 }, { "epoch": 0.20555752326367646, "grad_norm": 0.16283688865421317, "learning_rate": 9.665507476604721e-05, "loss": 0.4525, "step": 798 }, { "epoch": 0.20581511414495926, "grad_norm": 0.16698738414824957, "learning_rate": 9.6638884155468e-05, "loss": 0.3571, "step": 799 }, { "epoch": 0.20607270502624206, "grad_norm": 0.19989730282652068, "learning_rate": 9.662265581802571e-05, "loss": 0.3698, "step": 800 }, { "epoch": 0.20607270502624206, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8169198533263489, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4137073755264282, "eval_runtime": 17.4114, "eval_samples_per_second": 2.527, "eval_steps_per_second": 0.172, "step": 800 }, { "epoch": 0.20633029590752489, "grad_norm": 0.13446897065785993, "learning_rate": 9.660638976684767e-05, "loss": 0.3707, "step": 801 }, { "epoch": 0.20658788678880768, "grad_norm": 0.19362781709647103, "learning_rate": 9.659008601509168e-05, "loss": 0.4089, "step": 802 }, { "epoch": 0.20684547767009048, "grad_norm": 0.2122106215855278, "learning_rate": 9.657374457594612e-05, "loss": 0.468, "step": 803 }, { "epoch": 0.20710306855137328, "grad_norm": 0.11315965378853726, "learning_rate": 9.65573654626298e-05, "loss": 0.3292, "step": 804 }, { "epoch": 0.20736065943265608, "grad_norm": 0.1620234431000773, "learning_rate": 9.654094868839201e-05, "loss": 0.4112, "step": 805 }, { "epoch": 0.20736065943265608, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8111576741749607, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.40749290585517883, "eval_runtime": 17.5029, "eval_samples_per_second": 2.514, "eval_steps_per_second": 0.171, "step": 805 }, { "epoch": 0.20761825031393888, "grad_norm": 0.22409526882756822, "learning_rate": 9.652449426651254e-05, "loss": 0.3767, "step": 806 }, { "epoch": 0.20787584119522168, "grad_norm": 0.18783384945052448, "learning_rate": 9.650800221030158e-05, "loss": 0.4147, "step": 807 }, { "epoch": 0.2081334320765045, "grad_norm": 0.17442232052951923, "learning_rate": 9.649147253309983e-05, "loss": 0.4048, "step": 808 }, { "epoch": 0.2083910229577873, "grad_norm": 0.16769633718288773, "learning_rate": 9.647490524827834e-05, "loss": 0.3623, "step": 809 }, { "epoch": 0.2086486138390701, "grad_norm": 0.21383071232057696, "learning_rate": 9.645830036923865e-05, "loss": 0.3873, "step": 810 }, { "epoch": 0.2086486138390701, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.7993713986380304, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4146839380264282, "eval_runtime": 16.94, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 810 }, { "epoch": 0.2089062047203529, "grad_norm": 0.14123803753295183, "learning_rate": 9.644165790941268e-05, "loss": 0.4005, "step": 811 }, { "epoch": 0.2091637956016357, "grad_norm": 0.24189428392173476, "learning_rate": 9.642497788226275e-05, "loss": 0.4661, "step": 812 }, { "epoch": 0.2094213864829185, "grad_norm": 0.14479028233303481, "learning_rate": 9.640826030128159e-05, "loss": 0.4395, "step": 813 }, { "epoch": 0.2096789773642013, "grad_norm": 0.1604142770726198, "learning_rate": 9.639150517999225e-05, "loss": 0.3342, "step": 814 }, { "epoch": 0.20993656824548412, "grad_norm": 0.23317907375675592, "learning_rate": 9.637471253194823e-05, "loss": 0.4612, "step": 815 }, { "epoch": 0.20993656824548412, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8850574712643678, "eval_PRM F1 AUC": 0.6595075955997904, "eval_PRM F1 AUC (fixed)": 0.788108957569408, "eval_PRM F1 Neg": 0.47368421052631576, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.8461538461538461, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4583629369735718, "eval_runtime": 17.1879, "eval_samples_per_second": 2.56, "eval_steps_per_second": 0.175, "step": 815 }, { "epoch": 0.21019415912676692, "grad_norm": 0.15262141042584548, "learning_rate": 9.635788237073334e-05, "loss": 0.3574, "step": 816 }, { "epoch": 0.21045175000804972, "grad_norm": 0.17132596391131955, "learning_rate": 9.63410147099617e-05, "loss": 0.4807, "step": 817 }, { "epoch": 0.21070934088933252, "grad_norm": 0.14325025622334514, "learning_rate": 9.632410956327786e-05, "loss": 0.3313, "step": 818 }, { "epoch": 0.21096693177061532, "grad_norm": 0.11746916940347794, "learning_rate": 9.63071669443566e-05, "loss": 0.3267, "step": 819 }, { "epoch": 0.21122452265189812, "grad_norm": 0.14624718675117127, "learning_rate": 9.629018686690306e-05, "loss": 0.3998, "step": 820 }, { "epoch": 0.21122452265189812, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.7666317443687795, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.46706321835517883, "eval_runtime": 17.0486, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 820 }, { "epoch": 0.21148211353318092, "grad_norm": 0.17452696072716195, "learning_rate": 9.627316934465264e-05, "loss": 0.4397, "step": 821 }, { "epoch": 0.21173970441446371, "grad_norm": 0.250352300400204, "learning_rate": 9.625611439137113e-05, "loss": 0.3709, "step": 822 }, { "epoch": 0.21199729529574654, "grad_norm": 0.13325918031436973, "learning_rate": 9.623902202085444e-05, "loss": 0.3643, "step": 823 }, { "epoch": 0.21225488617702934, "grad_norm": 0.1376574849374028, "learning_rate": 9.622189224692887e-05, "loss": 0.3484, "step": 824 }, { "epoch": 0.21251247705831214, "grad_norm": 0.18013047197269513, "learning_rate": 9.620472508345097e-05, "loss": 0.3847, "step": 825 }, { "epoch": 0.21251247705831214, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8863636363636364, "eval_PRM F1 AUC": 0.6437925615505501, "eval_PRM F1 AUC (fixed)": 0.7781561026715559, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.6153846153846154, "eval_PRM Precision": 0.8387096774193549, "eval_PRM Recall": 0.9397590361445783, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4634232819080353, "eval_runtime": 17.0545, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 825 }, { "epoch": 0.21277006793959494, "grad_norm": 0.31481506650138047, "learning_rate": 9.618752054430747e-05, "loss": 0.4774, "step": 826 }, { "epoch": 0.21302765882087774, "grad_norm": 0.21549229291270694, "learning_rate": 9.617027864341537e-05, "loss": 0.3868, "step": 827 }, { "epoch": 0.21328524970216053, "grad_norm": 0.15842482711381703, "learning_rate": 9.615299939472188e-05, "loss": 0.3959, "step": 828 }, { "epoch": 0.21354284058344333, "grad_norm": 0.2159293707864858, "learning_rate": 9.613568281220448e-05, "loss": 0.3981, "step": 829 }, { "epoch": 0.21380043146472616, "grad_norm": 0.21434011506461947, "learning_rate": 9.611832890987076e-05, "loss": 0.3735, "step": 830 }, { "epoch": 0.21380043146472616, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8033001571503405, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4027876555919647, "eval_runtime": 17.1564, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 830 }, { "epoch": 0.21405802234600896, "grad_norm": 0.19850586686388644, "learning_rate": 9.610093770175856e-05, "loss": 0.4578, "step": 831 }, { "epoch": 0.21431561322729176, "grad_norm": 0.1403665244468571, "learning_rate": 9.608350920193587e-05, "loss": 0.3801, "step": 832 }, { "epoch": 0.21457320410857456, "grad_norm": 0.15098022992995108, "learning_rate": 9.606604342450085e-05, "loss": 0.3486, "step": 833 }, { "epoch": 0.21483079498985735, "grad_norm": 0.17415927435539957, "learning_rate": 9.604854038358183e-05, "loss": 0.46, "step": 834 }, { "epoch": 0.21508838587114015, "grad_norm": 0.29094141315279337, "learning_rate": 9.603100009333726e-05, "loss": 0.4823, "step": 835 }, { "epoch": 0.21508838587114015, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8129910948140388, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4161931872367859, "eval_runtime": 16.9223, "eval_samples_per_second": 2.6, "eval_steps_per_second": 0.177, "step": 835 }, { "epoch": 0.21534597675242295, "grad_norm": 0.12714327598998507, "learning_rate": 9.601342256795574e-05, "loss": 0.3482, "step": 836 }, { "epoch": 0.21560356763370578, "grad_norm": 0.1699018978398677, "learning_rate": 9.599580782165598e-05, "loss": 0.5118, "step": 837 }, { "epoch": 0.21586115851498858, "grad_norm": 0.14798460776395087, "learning_rate": 9.59781558686868e-05, "loss": 0.3537, "step": 838 }, { "epoch": 0.21611874939627138, "grad_norm": 0.2451212892024897, "learning_rate": 9.596046672332711e-05, "loss": 0.4351, "step": 839 }, { "epoch": 0.21637634027755417, "grad_norm": 0.15004232276867055, "learning_rate": 9.594274039988593e-05, "loss": 0.4771, "step": 840 }, { "epoch": 0.21637634027755417, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8145625982189628, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.40793678164482117, "eval_runtime": 16.5548, "eval_samples_per_second": 2.658, "eval_steps_per_second": 0.181, "step": 840 }, { "epoch": 0.21663393115883697, "grad_norm": 0.255883186053489, "learning_rate": 9.592497691270233e-05, "loss": 0.4136, "step": 841 }, { "epoch": 0.21689152204011977, "grad_norm": 0.1369788834956702, "learning_rate": 9.590717627614546e-05, "loss": 0.3685, "step": 842 }, { "epoch": 0.21714911292140257, "grad_norm": 0.13098749300255105, "learning_rate": 9.588933850461449e-05, "loss": 0.4034, "step": 843 }, { "epoch": 0.2174067038026854, "grad_norm": 0.11385104349796996, "learning_rate": 9.587146361253868e-05, "loss": 0.3198, "step": 844 }, { "epoch": 0.2176642946839682, "grad_norm": 0.18974213666735434, "learning_rate": 9.585355161437724e-05, "loss": 0.4077, "step": 845 }, { "epoch": 0.2176642946839682, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8735632183908046, "eval_PRM F1 AUC": 0.6317443687794656, "eval_PRM F1 AUC (fixed)": 0.8158721843897327, "eval_PRM F1 Neg": 0.42105263157894735, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.8351648351648352, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.44522371888160706, "eval_runtime": 17.5219, "eval_samples_per_second": 2.511, "eval_steps_per_second": 0.171, "step": 845 }, { "epoch": 0.217921885565251, "grad_norm": 0.11312026576338297, "learning_rate": 9.583560252461948e-05, "loss": 0.3097, "step": 846 }, { "epoch": 0.2181794764465338, "grad_norm": 0.1387086966813091, "learning_rate": 9.581761635778467e-05, "loss": 0.3891, "step": 847 }, { "epoch": 0.2184370673278166, "grad_norm": 0.16540974340110773, "learning_rate": 9.579959312842206e-05, "loss": 0.4268, "step": 848 }, { "epoch": 0.2186946582090994, "grad_norm": 0.1690801786245441, "learning_rate": 9.578153285111093e-05, "loss": 0.4515, "step": 849 }, { "epoch": 0.2189522490903822, "grad_norm": 0.16246155063394263, "learning_rate": 9.576343554046048e-05, "loss": 0.4245, "step": 850 }, { "epoch": 0.2189522490903822, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.819800942902043, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.43137428164482117, "eval_runtime": 16.9923, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 850 }, { "epoch": 0.21920983997166502, "grad_norm": 0.2251105993186927, "learning_rate": 9.57453012111099e-05, "loss": 0.3838, "step": 851 }, { "epoch": 0.21946743085294781, "grad_norm": 0.1396316925705257, "learning_rate": 9.572712987772827e-05, "loss": 0.4357, "step": 852 }, { "epoch": 0.2197250217342306, "grad_norm": 0.2051254490266408, "learning_rate": 9.570892155501467e-05, "loss": 0.5482, "step": 853 }, { "epoch": 0.2199826126155134, "grad_norm": 0.164591578477754, "learning_rate": 9.569067625769809e-05, "loss": 0.4432, "step": 854 }, { "epoch": 0.2202402034967962, "grad_norm": 0.15359633500587797, "learning_rate": 9.567239400053738e-05, "loss": 0.4244, "step": 855 }, { "epoch": 0.2202402034967962, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.816919853326349, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.43856534361839294, "eval_runtime": 16.9004, "eval_samples_per_second": 2.603, "eval_steps_per_second": 0.178, "step": 855 }, { "epoch": 0.220497794378079, "grad_norm": 0.12554692671195433, "learning_rate": 9.565407479832133e-05, "loss": 0.3899, "step": 856 }, { "epoch": 0.2207553852593618, "grad_norm": 0.12730086090169687, "learning_rate": 9.563571866586862e-05, "loss": 0.3758, "step": 857 }, { "epoch": 0.22101297614064463, "grad_norm": 0.13699372075558489, "learning_rate": 9.561732561802778e-05, "loss": 0.3901, "step": 858 }, { "epoch": 0.22127056702192743, "grad_norm": 0.12170352940977552, "learning_rate": 9.559889566967721e-05, "loss": 0.359, "step": 859 }, { "epoch": 0.22152815790321023, "grad_norm": 0.12857140264063513, "learning_rate": 9.558042883572515e-05, "loss": 0.3368, "step": 860 }, { "epoch": 0.22152815790321023, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8224201152435829, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4373224377632141, "eval_runtime": 17.5393, "eval_samples_per_second": 2.509, "eval_steps_per_second": 0.171, "step": 860 }, { "epoch": 0.22178574878449303, "grad_norm": 0.143945456486762, "learning_rate": 9.556192513110973e-05, "loss": 0.3765, "step": 861 }, { "epoch": 0.22204333966577583, "grad_norm": 0.1717137987094751, "learning_rate": 9.554338457079879e-05, "loss": 0.3239, "step": 862 }, { "epoch": 0.22230093054705863, "grad_norm": 0.18909983282166132, "learning_rate": 9.552480716979012e-05, "loss": 0.3319, "step": 863 }, { "epoch": 0.22255852142834143, "grad_norm": 0.2966835879822856, "learning_rate": 9.550619294311121e-05, "loss": 0.4235, "step": 864 }, { "epoch": 0.22281611230962423, "grad_norm": 0.17407346186283396, "learning_rate": 9.548754190581939e-05, "loss": 0.292, "step": 865 }, { "epoch": 0.22281611230962423, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.8234677841801991, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4254261255264282, "eval_runtime": 17.5424, "eval_samples_per_second": 2.508, "eval_steps_per_second": 0.171, "step": 865 }, { "epoch": 0.22307370319090705, "grad_norm": 0.169671280802814, "learning_rate": 9.546885407300176e-05, "loss": 0.3925, "step": 866 }, { "epoch": 0.22333129407218985, "grad_norm": 0.16485537784189574, "learning_rate": 9.545012945977515e-05, "loss": 0.4292, "step": 867 }, { "epoch": 0.22358888495347265, "grad_norm": 0.19768390498945893, "learning_rate": 9.543136808128618e-05, "loss": 0.4197, "step": 868 }, { "epoch": 0.22384647583475545, "grad_norm": 0.22647004514664276, "learning_rate": 9.541256995271122e-05, "loss": 0.4155, "step": 869 }, { "epoch": 0.22410406671603825, "grad_norm": 0.21311239927558964, "learning_rate": 9.539373508925632e-05, "loss": 0.342, "step": 870 }, { "epoch": 0.22410406671603825, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.822943949711891, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4334161877632141, "eval_runtime": 16.5787, "eval_samples_per_second": 2.654, "eval_steps_per_second": 0.181, "step": 870 }, { "epoch": 0.22436165759732105, "grad_norm": 0.24569395654982099, "learning_rate": 9.537486350615727e-05, "loss": 0.4597, "step": 871 }, { "epoch": 0.22461924847860384, "grad_norm": 0.15527931242487145, "learning_rate": 9.53559552186796e-05, "loss": 0.3082, "step": 872 }, { "epoch": 0.22487683935988667, "grad_norm": 0.21946551945820547, "learning_rate": 9.533701024211845e-05, "loss": 0.4091, "step": 873 }, { "epoch": 0.22513443024116947, "grad_norm": 0.11264153813024441, "learning_rate": 9.53180285917987e-05, "loss": 0.3023, "step": 874 }, { "epoch": 0.22539202112245227, "grad_norm": 0.2451578442942059, "learning_rate": 9.529901028307488e-05, "loss": 0.4661, "step": 875 }, { "epoch": 0.22539202112245227, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8654970760233918, "eval_PRM F1 AUC": 0.6414353064431639, "eval_PRM F1 AUC (fixed)": 0.829229963331587, "eval_PRM F1 Neg": 0.43902439024390244, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8409090909090909, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4075816869735718, "eval_runtime": 17.543, "eval_samples_per_second": 2.508, "eval_steps_per_second": 0.171, "step": 875 }, { "epoch": 0.22564961200373507, "grad_norm": 0.1625927951987115, "learning_rate": 9.527995533133118e-05, "loss": 0.3937, "step": 876 }, { "epoch": 0.22590720288501787, "grad_norm": 0.21395674527079286, "learning_rate": 9.526086375198143e-05, "loss": 0.3233, "step": 877 }, { "epoch": 0.22616479376630066, "grad_norm": 0.2455296017354688, "learning_rate": 9.524173556046907e-05, "loss": 0.4285, "step": 878 }, { "epoch": 0.22642238464758346, "grad_norm": 0.189837739355848, "learning_rate": 9.522257077226717e-05, "loss": 0.3221, "step": 879 }, { "epoch": 0.2266799755288663, "grad_norm": 0.1935407868054634, "learning_rate": 9.520336940287839e-05, "loss": 0.3578, "step": 880 }, { "epoch": 0.2266799755288663, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8334206390780513, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.3994140625, "eval_runtime": 17.1926, "eval_samples_per_second": 2.559, "eval_steps_per_second": 0.174, "step": 880 }, { "epoch": 0.2269375664101491, "grad_norm": 0.24698027744013595, "learning_rate": 9.518413146783502e-05, "loss": 0.4388, "step": 881 }, { "epoch": 0.2271951572914319, "grad_norm": 0.17139552946991912, "learning_rate": 9.516485698269889e-05, "loss": 0.3637, "step": 882 }, { "epoch": 0.22745274817271469, "grad_norm": 0.1606745092503172, "learning_rate": 9.51455459630614e-05, "loss": 0.3869, "step": 883 }, { "epoch": 0.22771033905399748, "grad_norm": 0.1397191393946997, "learning_rate": 9.512619842454352e-05, "loss": 0.3552, "step": 884 }, { "epoch": 0.22796792993528028, "grad_norm": 0.14490255830626222, "learning_rate": 9.510681438279574e-05, "loss": 0.4143, "step": 885 }, { "epoch": 0.22796792993528028, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8850574712643678, "eval_PRM F1 AUC": 0.6595075955997904, "eval_PRM F1 AUC (fixed)": 0.8491356731272919, "eval_PRM F1 Neg": 0.47368421052631576, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.8461538461538461, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4111328125, "eval_runtime": 16.9082, "eval_samples_per_second": 2.602, "eval_steps_per_second": 0.177, "step": 885 }, { "epoch": 0.22822552081656308, "grad_norm": 0.11820532309422944, "learning_rate": 9.508739385349812e-05, "loss": 0.336, "step": 886 }, { "epoch": 0.2284831116978459, "grad_norm": 0.1318247173658625, "learning_rate": 9.506793685236018e-05, "loss": 0.3308, "step": 887 }, { "epoch": 0.2287407025791287, "grad_norm": 0.2824055496224138, "learning_rate": 9.504844339512095e-05, "loss": 0.4404, "step": 888 }, { "epoch": 0.2289982934604115, "grad_norm": 0.2394051935135196, "learning_rate": 9.5028913497549e-05, "loss": 0.4252, "step": 889 }, { "epoch": 0.2292558843416943, "grad_norm": 0.14323716490546728, "learning_rate": 9.500934717544235e-05, "loss": 0.3904, "step": 890 }, { "epoch": 0.2292558843416943, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8446830801466736, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3892045319080353, "eval_runtime": 16.4151, "eval_samples_per_second": 2.68, "eval_steps_per_second": 0.183, "step": 890 }, { "epoch": 0.2295134752229771, "grad_norm": 0.16829762372870483, "learning_rate": 9.498974444462845e-05, "loss": 0.3552, "step": 891 }, { "epoch": 0.2297710661042599, "grad_norm": 0.18322336447852924, "learning_rate": 9.497010532096425e-05, "loss": 0.4769, "step": 892 }, { "epoch": 0.2300286569855427, "grad_norm": 0.23586845435952258, "learning_rate": 9.49504298203361e-05, "loss": 0.3448, "step": 893 }, { "epoch": 0.23028624786682553, "grad_norm": 0.12876558401772226, "learning_rate": 9.493071795865982e-05, "loss": 0.367, "step": 894 }, { "epoch": 0.23054383874810833, "grad_norm": 0.14829063639667459, "learning_rate": 9.49109697518806e-05, "loss": 0.4471, "step": 895 }, { "epoch": 0.23054383874810833, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 AUC (fixed)": 0.8407543216343636, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.39151278138160706, "eval_runtime": 16.9332, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 895 }, { "epoch": 0.23080142962939112, "grad_norm": 0.1626905173293953, "learning_rate": 9.489118521597306e-05, "loss": 0.4158, "step": 896 }, { "epoch": 0.23105902051067392, "grad_norm": 0.17383287946697712, "learning_rate": 9.487136436694117e-05, "loss": 0.4791, "step": 897 }, { "epoch": 0.23131661139195672, "grad_norm": 0.20773918045671103, "learning_rate": 9.485150722081834e-05, "loss": 0.404, "step": 898 }, { "epoch": 0.23157420227323952, "grad_norm": 0.17792771207325503, "learning_rate": 9.483161379366726e-05, "loss": 0.4027, "step": 899 }, { "epoch": 0.23183179315452232, "grad_norm": 0.19377175951533993, "learning_rate": 9.481168410158003e-05, "loss": 0.412, "step": 900 }, { "epoch": 0.23183179315452232, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8397066526977475, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4158380627632141, "eval_runtime": 17.0948, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 900 }, { "epoch": 0.23208938403580515, "grad_norm": 0.18030512872838098, "learning_rate": 9.479171816067808e-05, "loss": 0.4122, "step": 901 }, { "epoch": 0.23234697491708795, "grad_norm": 0.3095765006071036, "learning_rate": 9.47717159871121e-05, "loss": 0.45, "step": 902 }, { "epoch": 0.23260456579837074, "grad_norm": 0.12280104764281838, "learning_rate": 9.475167759706219e-05, "loss": 0.3338, "step": 903 }, { "epoch": 0.23286215667965354, "grad_norm": 0.27572084329849705, "learning_rate": 9.473160300673764e-05, "loss": 0.4631, "step": 904 }, { "epoch": 0.23311974756093634, "grad_norm": 0.2907471101623543, "learning_rate": 9.471149223237711e-05, "loss": 0.5238, "step": 905 }, { "epoch": 0.23311974756093634, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8516129032258064, "eval_PRM F1 AUC": 0.7671555788370874, "eval_PRM F1 AUC (fixed)": 0.8383970665269774, "eval_PRM F1 Neg": 0.5964912280701754, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.9166666666666666, "eval_PRM Recall": 0.7951807228915663, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.4096235930919647, "eval_runtime": 17.0311, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 905 }, { "epoch": 0.23337733844221914, "grad_norm": 0.18952926158184763, "learning_rate": 9.46913452902485e-05, "loss": 0.4212, "step": 906 }, { "epoch": 0.23363492932350194, "grad_norm": 0.28504685772556815, "learning_rate": 9.467116219664894e-05, "loss": 0.4743, "step": 907 }, { "epoch": 0.23389252020478474, "grad_norm": 0.21196042252015154, "learning_rate": 9.465094296790479e-05, "loss": 0.4351, "step": 908 }, { "epoch": 0.23415011108606756, "grad_norm": 0.20720899057536477, "learning_rate": 9.463068762037175e-05, "loss": 0.4369, "step": 909 }, { "epoch": 0.23440770196735036, "grad_norm": 0.2221626129843554, "learning_rate": 9.461039617043461e-05, "loss": 0.3761, "step": 910 }, { "epoch": 0.23440770196735036, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.8391828182294394, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.41042259335517883, "eval_runtime": 16.7036, "eval_samples_per_second": 2.634, "eval_steps_per_second": 0.18, "step": 910 }, { "epoch": 0.23466529284863316, "grad_norm": 0.14525347000128516, "learning_rate": 9.459006863450745e-05, "loss": 0.3742, "step": 911 }, { "epoch": 0.23492288372991596, "grad_norm": 0.1469248523372294, "learning_rate": 9.456970502903347e-05, "loss": 0.39, "step": 912 }, { "epoch": 0.23518047461119876, "grad_norm": 0.12611252030989256, "learning_rate": 9.454930537048509e-05, "loss": 0.3686, "step": 913 }, { "epoch": 0.23543806549248156, "grad_norm": 0.21237171555846002, "learning_rate": 9.45288696753639e-05, "loss": 0.4215, "step": 914 }, { "epoch": 0.23569565637376436, "grad_norm": 0.19752147714699278, "learning_rate": 9.450839796020062e-05, "loss": 0.4671, "step": 915 }, { "epoch": 0.23569565637376436, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8438973284442116, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.44442471861839294, "eval_runtime": 16.4035, "eval_samples_per_second": 2.682, "eval_steps_per_second": 0.183, "step": 915 }, { "epoch": 0.23595324725504718, "grad_norm": 0.14782360329829114, "learning_rate": 9.448789024155512e-05, "loss": 0.3182, "step": 916 }, { "epoch": 0.23621083813632998, "grad_norm": 0.19752535682343816, "learning_rate": 9.446734653601638e-05, "loss": 0.374, "step": 917 }, { "epoch": 0.23646842901761278, "grad_norm": 0.12313740946942986, "learning_rate": 9.44467668602025e-05, "loss": 0.352, "step": 918 }, { "epoch": 0.23672601989889558, "grad_norm": 0.1272196895295518, "learning_rate": 9.442615123076071e-05, "loss": 0.361, "step": 919 }, { "epoch": 0.23698361078017838, "grad_norm": 0.1790741759047021, "learning_rate": 9.440549966436723e-05, "loss": 0.4352, "step": 920 }, { "epoch": 0.23698361078017838, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.8365636458878994, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.41787996888160706, "eval_runtime": 17.7177, "eval_samples_per_second": 2.483, "eval_steps_per_second": 0.169, "step": 920 }, { "epoch": 0.23724120166146118, "grad_norm": 0.17468148532061714, "learning_rate": 9.438481217772744e-05, "loss": 0.4196, "step": 921 }, { "epoch": 0.23749879254274397, "grad_norm": 0.20932563574883836, "learning_rate": 9.436408878757573e-05, "loss": 0.5019, "step": 922 }, { "epoch": 0.2377563834240268, "grad_norm": 0.1690322430372637, "learning_rate": 9.434332951067556e-05, "loss": 0.3852, "step": 923 }, { "epoch": 0.2380139743053096, "grad_norm": 0.19683614597147409, "learning_rate": 9.432253436381941e-05, "loss": 0.405, "step": 924 }, { "epoch": 0.2382715651865924, "grad_norm": 0.23040544364504154, "learning_rate": 9.430170336382877e-05, "loss": 0.4063, "step": 925 }, { "epoch": 0.2382715651865924, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8441558441558441, "eval_PRM F1 AUC": 0.7611314824515453, "eval_PRM F1 AUC (fixed)": 0.8281822943949712, "eval_PRM F1 Neg": 0.5862068965517241, "eval_PRM NPV": 0.4857142857142857, "eval_PRM Precision": 0.9154929577464789, "eval_PRM Recall": 0.7831325301204819, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.4153941869735718, "eval_runtime": 16.9625, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 925 }, { "epoch": 0.2385291560678752, "grad_norm": 0.26755480903948853, "learning_rate": 9.428083652755413e-05, "loss": 0.3961, "step": 926 }, { "epoch": 0.238786746949158, "grad_norm": 0.15315689632772056, "learning_rate": 9.425993387187498e-05, "loss": 0.3509, "step": 927 }, { "epoch": 0.2390443378304408, "grad_norm": 0.1948264077316225, "learning_rate": 9.423899541369978e-05, "loss": 0.4091, "step": 928 }, { "epoch": 0.2393019287117236, "grad_norm": 0.16756323110853735, "learning_rate": 9.421802116996594e-05, "loss": 0.3959, "step": 929 }, { "epoch": 0.23955951959300642, "grad_norm": 0.1490428268438959, "learning_rate": 9.419701115763984e-05, "loss": 0.355, "step": 930 }, { "epoch": 0.23955951959300642, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8480880041906756, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4066939055919647, "eval_runtime": 17.0963, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 930 }, { "epoch": 0.23981711047428922, "grad_norm": 0.22527675436530697, "learning_rate": 9.417596539371676e-05, "loss": 0.4164, "step": 931 }, { "epoch": 0.24007470135557202, "grad_norm": 0.15295735099602972, "learning_rate": 9.415488389522094e-05, "loss": 0.4011, "step": 932 }, { "epoch": 0.24033229223685482, "grad_norm": 0.15842198585707942, "learning_rate": 9.413376667920549e-05, "loss": 0.3678, "step": 933 }, { "epoch": 0.24058988311813762, "grad_norm": 0.15904855690305927, "learning_rate": 9.411261376275245e-05, "loss": 0.43, "step": 934 }, { "epoch": 0.24084747399942041, "grad_norm": 0.17554700531767695, "learning_rate": 9.409142516297269e-05, "loss": 0.4352, "step": 935 }, { "epoch": 0.24084747399942041, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.8441592456783656, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3881392180919647, "eval_runtime": 17.0028, "eval_samples_per_second": 2.588, "eval_steps_per_second": 0.176, "step": 935 }, { "epoch": 0.2411050648807032, "grad_norm": 0.1713854725195325, "learning_rate": 9.4070200897006e-05, "loss": 0.4305, "step": 936 }, { "epoch": 0.24136265576198604, "grad_norm": 0.15626671018190155, "learning_rate": 9.4048940982021e-05, "loss": 0.3977, "step": 937 }, { "epoch": 0.24162024664326884, "grad_norm": 0.21859089159563583, "learning_rate": 9.40276454352151e-05, "loss": 0.4578, "step": 938 }, { "epoch": 0.24187783752455164, "grad_norm": 0.1294788942706536, "learning_rate": 9.400631427381461e-05, "loss": 0.3135, "step": 939 }, { "epoch": 0.24213542840583444, "grad_norm": 0.1369184685070066, "learning_rate": 9.398494751507458e-05, "loss": 0.379, "step": 940 }, { "epoch": 0.24213542840583444, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8717948717948718, "eval_PRM F1 AUC": 0.8009429020429545, "eval_PRM F1 AUC (fixed)": 0.8226820324777371, "eval_PRM F1 Neg": 0.6428571428571429, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.9315068493150684, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.782608695652174, "eval_loss": 0.4037642180919647, "eval_runtime": 16.4439, "eval_samples_per_second": 2.676, "eval_steps_per_second": 0.182, "step": 940 }, { "epoch": 0.24239301928711723, "grad_norm": 0.2180367622905385, "learning_rate": 9.396354517627894e-05, "loss": 0.4684, "step": 941 }, { "epoch": 0.24265061016840003, "grad_norm": 0.17297061180500137, "learning_rate": 9.394210727474028e-05, "loss": 0.4199, "step": 942 }, { "epoch": 0.24290820104968283, "grad_norm": 0.15365515927755224, "learning_rate": 9.39206338278001e-05, "loss": 0.4338, "step": 943 }, { "epoch": 0.24316579193096563, "grad_norm": 0.14812603615734782, "learning_rate": 9.389912485282852e-05, "loss": 0.4139, "step": 944 }, { "epoch": 0.24342338281224846, "grad_norm": 0.134690643724279, "learning_rate": 9.387758036722449e-05, "loss": 0.4019, "step": 945 }, { "epoch": 0.24342338281224846, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8336825563122052, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.3979048430919647, "eval_runtime": 17.2865, "eval_samples_per_second": 2.545, "eval_steps_per_second": 0.174, "step": 945 }, { "epoch": 0.24368097369353126, "grad_norm": 0.11990899731140318, "learning_rate": 9.385600038841565e-05, "loss": 0.3805, "step": 946 }, { "epoch": 0.24393856457481405, "grad_norm": 0.14269153218454197, "learning_rate": 9.383438493385833e-05, "loss": 0.4108, "step": 947 }, { "epoch": 0.24419615545609685, "grad_norm": 0.1568414779967645, "learning_rate": 9.381273402103761e-05, "loss": 0.4309, "step": 948 }, { "epoch": 0.24445374633737965, "grad_norm": 0.2639791353112172, "learning_rate": 9.379104766746722e-05, "loss": 0.4595, "step": 949 }, { "epoch": 0.24471133721866245, "grad_norm": 0.15967077217953962, "learning_rate": 9.376932589068956e-05, "loss": 0.3983, "step": 950 }, { "epoch": 0.24471133721866245, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.8378732320586694, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.39621803164482117, "eval_runtime": 16.4937, "eval_samples_per_second": 2.668, "eval_steps_per_second": 0.182, "step": 950 }, { "epoch": 0.24496892809994525, "grad_norm": 0.14648351009860774, "learning_rate": 9.37475687082757e-05, "loss": 0.3631, "step": 951 }, { "epoch": 0.24522651898122808, "grad_norm": 0.1708614665782863, "learning_rate": 9.37257761378253e-05, "loss": 0.4959, "step": 952 }, { "epoch": 0.24548410986251087, "grad_norm": 0.14645710050507305, "learning_rate": 9.370394819696672e-05, "loss": 0.4341, "step": 953 }, { "epoch": 0.24574170074379367, "grad_norm": 0.13774689007290275, "learning_rate": 9.368208490335688e-05, "loss": 0.4097, "step": 954 }, { "epoch": 0.24599929162507647, "grad_norm": 0.19038858106009274, "learning_rate": 9.366018627468132e-05, "loss": 0.4468, "step": 955 }, { "epoch": 0.24599929162507647, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 AUC (fixed)": 0.8310633839706653, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.4013671875, "eval_runtime": 17.7219, "eval_samples_per_second": 2.483, "eval_steps_per_second": 0.169, "step": 955 }, { "epoch": 0.24625688250635927, "grad_norm": 0.16842942889240387, "learning_rate": 9.363825232865413e-05, "loss": 0.4024, "step": 956 }, { "epoch": 0.24651447338764207, "grad_norm": 0.18857457825609594, "learning_rate": 9.361628308301802e-05, "loss": 0.4498, "step": 957 }, { "epoch": 0.24677206426892487, "grad_norm": 0.136330963308826, "learning_rate": 9.359427855554422e-05, "loss": 0.3852, "step": 958 }, { "epoch": 0.2470296551502077, "grad_norm": 0.11744396040766063, "learning_rate": 9.357223876403252e-05, "loss": 0.3422, "step": 959 }, { "epoch": 0.2472872460314905, "grad_norm": 0.1449604845198016, "learning_rate": 9.355016372631119e-05, "loss": 0.361, "step": 960 }, { "epoch": 0.2472872460314905, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8588235294117647, "eval_PRM F1 AUC": 0.6354112100576217, "eval_PRM F1 AUC (fixed)": 0.8247773703509691, "eval_PRM F1 Neg": 0.42857142857142855, "eval_PRM NPV": 0.47368421052631576, "eval_PRM Precision": 0.8390804597701149, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4242720305919647, "eval_runtime": 16.955, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 960 }, { "epoch": 0.2475448369127733, "grad_norm": 0.20695516034130174, "learning_rate": 9.352805346023708e-05, "loss": 0.4325, "step": 961 }, { "epoch": 0.2478024277940561, "grad_norm": 0.18413880039768285, "learning_rate": 9.35059079836955e-05, "loss": 0.3913, "step": 962 }, { "epoch": 0.2480600186753389, "grad_norm": 0.1330576765822883, "learning_rate": 9.348372731460023e-05, "loss": 0.3176, "step": 963 }, { "epoch": 0.2483176095566217, "grad_norm": 0.1715696984366364, "learning_rate": 9.346151147089353e-05, "loss": 0.4301, "step": 964 }, { "epoch": 0.2485752004379045, "grad_norm": 0.15438138766517245, "learning_rate": 9.34392604705461e-05, "loss": 0.3565, "step": 965 }, { "epoch": 0.2485752004379045, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8043478260869565, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4443359375, "eval_runtime": 17.4644, "eval_samples_per_second": 2.519, "eval_steps_per_second": 0.172, "step": 965 }, { "epoch": 0.2488327913191873, "grad_norm": 0.16409412908054974, "learning_rate": 9.341697433155714e-05, "loss": 0.4135, "step": 966 }, { "epoch": 0.2490903822004701, "grad_norm": 0.1866985573588762, "learning_rate": 9.33946530719542e-05, "loss": 0.4067, "step": 967 }, { "epoch": 0.2493479730817529, "grad_norm": 0.21365475825974745, "learning_rate": 9.337229670979326e-05, "loss": 0.5011, "step": 968 }, { "epoch": 0.2496055639630357, "grad_norm": 0.23948434704234775, "learning_rate": 9.334990526315872e-05, "loss": 0.4017, "step": 969 }, { "epoch": 0.2498631548443185, "grad_norm": 0.17961717581685058, "learning_rate": 9.332747875016332e-05, "loss": 0.4603, "step": 970 }, { "epoch": 0.2498631548443185, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8395061728395061, "eval_PRM F1 AUC": 0.6705081194342588, "eval_PRM F1 AUC (fixed)": 0.8053954950235724, "eval_PRM F1 Neg": 0.48, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8607594936708861, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42489346861839294, "eval_runtime": 16.9263, "eval_samples_per_second": 2.6, "eval_steps_per_second": 0.177, "step": 970 }, { "epoch": 0.25012074572560133, "grad_norm": 0.18685993902268822, "learning_rate": 9.330501718894822e-05, "loss": 0.4057, "step": 971 }, { "epoch": 0.25037833660688413, "grad_norm": 0.13572225823285414, "learning_rate": 9.328252059768287e-05, "loss": 0.3287, "step": 972 }, { "epoch": 0.25063592748816693, "grad_norm": 0.17561696599857984, "learning_rate": 9.325998899456511e-05, "loss": 0.3267, "step": 973 }, { "epoch": 0.25089351836944973, "grad_norm": 0.2187092719272626, "learning_rate": 9.323742239782105e-05, "loss": 0.3878, "step": 974 }, { "epoch": 0.25115110925073253, "grad_norm": 0.17469577094967373, "learning_rate": 9.321482082570517e-05, "loss": 0.3959, "step": 975 }, { "epoch": 0.25115110925073253, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8106338397066528, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.45703125, "eval_runtime": 17.0878, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 975 }, { "epoch": 0.25140870013201533, "grad_norm": 0.19474948276705212, "learning_rate": 9.319218429650016e-05, "loss": 0.3772, "step": 976 }, { "epoch": 0.2516662910132981, "grad_norm": 0.1656104569164003, "learning_rate": 9.316951282851707e-05, "loss": 0.4089, "step": 977 }, { "epoch": 0.2519238818945809, "grad_norm": 0.1418895601874937, "learning_rate": 9.314680644009517e-05, "loss": 0.36, "step": 978 }, { "epoch": 0.2521814727758637, "grad_norm": 0.17363933837883128, "learning_rate": 9.312406514960197e-05, "loss": 0.3555, "step": 979 }, { "epoch": 0.2524390636571465, "grad_norm": 0.13397604357233978, "learning_rate": 9.310128897543324e-05, "loss": 0.4131, "step": 980 }, { "epoch": 0.2524390636571465, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 AUC (fixed)": 0.8171817705605028, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4318181872367859, "eval_runtime": 16.9598, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 980 }, { "epoch": 0.2526966545384293, "grad_norm": 0.16272419299786625, "learning_rate": 9.307847793601296e-05, "loss": 0.3888, "step": 981 }, { "epoch": 0.2529542454197121, "grad_norm": 0.20637938124124308, "learning_rate": 9.305563204979329e-05, "loss": 0.4093, "step": 982 }, { "epoch": 0.2532118363009949, "grad_norm": 0.10892419838862474, "learning_rate": 9.303275133525459e-05, "loss": 0.3415, "step": 983 }, { "epoch": 0.2534694271822778, "grad_norm": 0.12897192014996747, "learning_rate": 9.300983581090541e-05, "loss": 0.3571, "step": 984 }, { "epoch": 0.25372701806356057, "grad_norm": 0.11750622088823434, "learning_rate": 9.298688549528245e-05, "loss": 0.3772, "step": 985 }, { "epoch": 0.25372701806356057, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 AUC (fixed)": 0.823729701414353, "eval_PRM F1 Neg": 0.6, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.4033203125, "eval_runtime": 17.8449, "eval_samples_per_second": 2.466, "eval_steps_per_second": 0.168, "step": 985 }, { "epoch": 0.25398460894484337, "grad_norm": 0.1891010004062452, "learning_rate": 9.296390040695055e-05, "loss": 0.3341, "step": 986 }, { "epoch": 0.25424219982612617, "grad_norm": 0.1354763589527095, "learning_rate": 9.294088056450269e-05, "loss": 0.388, "step": 987 }, { "epoch": 0.25449979070740897, "grad_norm": 0.1870413461225831, "learning_rate": 9.291782598655992e-05, "loss": 0.4452, "step": 988 }, { "epoch": 0.25475738158869177, "grad_norm": 0.1294604296779203, "learning_rate": 9.289473669177145e-05, "loss": 0.338, "step": 989 }, { "epoch": 0.25501497246997457, "grad_norm": 0.1366314980600317, "learning_rate": 9.287161269881451e-05, "loss": 0.3888, "step": 990 }, { "epoch": 0.25501497246997457, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8370874803562074, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3888494372367859, "eval_runtime": 17.5944, "eval_samples_per_second": 2.501, "eval_steps_per_second": 0.171, "step": 990 }, { "epoch": 0.25527256335125736, "grad_norm": 0.1349113771077854, "learning_rate": 9.284845402639446e-05, "loss": 0.3752, "step": 991 }, { "epoch": 0.25553015423254016, "grad_norm": 0.1731884430207601, "learning_rate": 9.282526069324467e-05, "loss": 0.3876, "step": 992 }, { "epoch": 0.25578774511382296, "grad_norm": 0.1775726982010048, "learning_rate": 9.280203271812656e-05, "loss": 0.3675, "step": 993 }, { "epoch": 0.25604533599510576, "grad_norm": 0.14993967493503185, "learning_rate": 9.277877011982955e-05, "loss": 0.4215, "step": 994 }, { "epoch": 0.25630292687638856, "grad_norm": 0.1343320533787638, "learning_rate": 9.275547291717112e-05, "loss": 0.3518, "step": 995 }, { "epoch": 0.25630292687638856, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8446830801466737, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3720703125, "eval_runtime": 16.9861, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 995 }, { "epoch": 0.25656051775767136, "grad_norm": 0.1626833754173271, "learning_rate": 9.273214112899673e-05, "loss": 0.4218, "step": 996 }, { "epoch": 0.25681810863895416, "grad_norm": 0.14982404885775505, "learning_rate": 9.270877477417976e-05, "loss": 0.3784, "step": 997 }, { "epoch": 0.257075699520237, "grad_norm": 0.13228815032922078, "learning_rate": 9.26853738716216e-05, "loss": 0.3225, "step": 998 }, { "epoch": 0.2573332904015198, "grad_norm": 0.14245961303650523, "learning_rate": 9.266193844025157e-05, "loss": 0.3533, "step": 999 }, { "epoch": 0.2575908812828026, "grad_norm": 0.1561824029866387, "learning_rate": 9.263846849902696e-05, "loss": 0.4104, "step": 1000 }, { "epoch": 0.2575908812828026, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8486118386589837, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.3876953125, "eval_runtime": 16.9787, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 1000 }, { "epoch": 0.2578484721640854, "grad_norm": 0.2067931536176895, "learning_rate": 9.261496406693291e-05, "loss": 0.4059, "step": 1001 }, { "epoch": 0.2581060630453682, "grad_norm": 0.1386399808387454, "learning_rate": 9.259142516298249e-05, "loss": 0.3399, "step": 1002 }, { "epoch": 0.258363653926651, "grad_norm": 0.14591159357587608, "learning_rate": 9.256785180621668e-05, "loss": 0.3407, "step": 1003 }, { "epoch": 0.2586212448079338, "grad_norm": 0.14826515123499576, "learning_rate": 9.254424401570428e-05, "loss": 0.4042, "step": 1004 }, { "epoch": 0.2588788356892166, "grad_norm": 0.1909193283313938, "learning_rate": 9.2520601810542e-05, "loss": 0.3987, "step": 1005 }, { "epoch": 0.2588788356892166, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8415400733368256, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3910689055919647, "eval_runtime": 16.9389, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 1005 }, { "epoch": 0.2591364265704994, "grad_norm": 0.16849892375783673, "learning_rate": 9.249692520985433e-05, "loss": 0.3537, "step": 1006 }, { "epoch": 0.2593940174517822, "grad_norm": 0.16021345094153908, "learning_rate": 9.247321423279365e-05, "loss": 0.4003, "step": 1007 }, { "epoch": 0.259651608333065, "grad_norm": 0.17522704107805528, "learning_rate": 9.244946889854007e-05, "loss": 0.3845, "step": 1008 }, { "epoch": 0.2599091992143478, "grad_norm": 0.21505356665104383, "learning_rate": 9.242568922630157e-05, "loss": 0.4019, "step": 1009 }, { "epoch": 0.2601667900956306, "grad_norm": 0.20190155730209533, "learning_rate": 9.240187523531383e-05, "loss": 0.3778, "step": 1010 }, { "epoch": 0.2601667900956306, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8336825563122053, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.41415128111839294, "eval_runtime": 16.6358, "eval_samples_per_second": 2.645, "eval_steps_per_second": 0.18, "step": 1010 }, { "epoch": 0.2604243809769134, "grad_norm": 0.1304894840593479, "learning_rate": 9.237802694484035e-05, "loss": 0.3954, "step": 1011 }, { "epoch": 0.2606819718581962, "grad_norm": 0.16729151782918208, "learning_rate": 9.235414437417234e-05, "loss": 0.3729, "step": 1012 }, { "epoch": 0.26093956273947905, "grad_norm": 0.13464803129255679, "learning_rate": 9.233022754262879e-05, "loss": 0.3414, "step": 1013 }, { "epoch": 0.26119715362076185, "grad_norm": 0.21650707312132442, "learning_rate": 9.230627646955633e-05, "loss": 0.4102, "step": 1014 }, { "epoch": 0.26145474450204464, "grad_norm": 0.18996640661419206, "learning_rate": 9.228229117432934e-05, "loss": 0.4218, "step": 1015 }, { "epoch": 0.26145474450204464, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 AUC (fixed)": 0.8313253012048192, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42649146914482117, "eval_runtime": 17.2388, "eval_samples_per_second": 2.552, "eval_steps_per_second": 0.174, "step": 1015 }, { "epoch": 0.26171233538332744, "grad_norm": 0.20091968234874621, "learning_rate": 9.225827167634988e-05, "loss": 0.4052, "step": 1016 }, { "epoch": 0.26196992626461024, "grad_norm": 0.12694680575243175, "learning_rate": 9.223421799504766e-05, "loss": 0.3392, "step": 1017 }, { "epoch": 0.26222751714589304, "grad_norm": 0.16143599885245627, "learning_rate": 9.221013014988002e-05, "loss": 0.4284, "step": 1018 }, { "epoch": 0.26248510802717584, "grad_norm": 0.16508042764720718, "learning_rate": 9.2186008160332e-05, "loss": 0.3993, "step": 1019 }, { "epoch": 0.26274269890845864, "grad_norm": 0.17263770646244828, "learning_rate": 9.216185204591623e-05, "loss": 0.4116, "step": 1020 }, { "epoch": 0.26274269890845864, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8133333333333334, "eval_PRM F1 AUC": 0.7370350969093766, "eval_PRM F1 AUC (fixed)": 0.8255631220534312, "eval_PRM F1 Neg": 0.5483870967741935, "eval_PRM NPV": 0.4358974358974359, "eval_PRM Precision": 0.9104477611940298, "eval_PRM Recall": 0.7349397590361446, "eval_PRM Specificty": 0.7391304347826086, "eval_loss": 0.44895240664482117, "eval_runtime": 16.7685, "eval_samples_per_second": 2.624, "eval_steps_per_second": 0.179, "step": 1020 }, { "epoch": 0.26300028978974144, "grad_norm": 0.2604772518482746, "learning_rate": 9.213766182617291e-05, "loss": 0.3891, "step": 1021 }, { "epoch": 0.26325788067102424, "grad_norm": 0.34843739606905194, "learning_rate": 9.211343752066987e-05, "loss": 0.3742, "step": 1022 }, { "epoch": 0.26351547155230703, "grad_norm": 0.24911731597936657, "learning_rate": 9.20891791490025e-05, "loss": 0.4635, "step": 1023 }, { "epoch": 0.26377306243358983, "grad_norm": 0.1428673547192327, "learning_rate": 9.206488673079374e-05, "loss": 0.41, "step": 1024 }, { "epoch": 0.26403065331487263, "grad_norm": 0.1742718145669165, "learning_rate": 9.204056028569408e-05, "loss": 0.4359, "step": 1025 }, { "epoch": 0.26403065331487263, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8452069146149817, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.41335228085517883, "eval_runtime": 17.5963, "eval_samples_per_second": 2.501, "eval_steps_per_second": 0.17, "step": 1025 }, { "epoch": 0.26428824419615543, "grad_norm": 0.210658527552093, "learning_rate": 9.201619983338153e-05, "loss": 0.4333, "step": 1026 }, { "epoch": 0.2645458350774383, "grad_norm": 0.20888251125539192, "learning_rate": 9.199180539356158e-05, "loss": 0.4023, "step": 1027 }, { "epoch": 0.2648034259587211, "grad_norm": 0.11542874262581096, "learning_rate": 9.196737698596729e-05, "loss": 0.3623, "step": 1028 }, { "epoch": 0.2650610168400039, "grad_norm": 0.11029223772798089, "learning_rate": 9.194291463035913e-05, "loss": 0.2974, "step": 1029 }, { "epoch": 0.2653186077212867, "grad_norm": 0.13294700436961546, "learning_rate": 9.191841834652506e-05, "loss": 0.4041, "step": 1030 }, { "epoch": 0.2653186077212867, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8334206390780514, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42959871888160706, "eval_runtime": 17.6048, "eval_samples_per_second": 2.499, "eval_steps_per_second": 0.17, "step": 1030 }, { "epoch": 0.2655761986025695, "grad_norm": 0.15032790930629672, "learning_rate": 9.189388815428046e-05, "loss": 0.4129, "step": 1031 }, { "epoch": 0.2658337894838523, "grad_norm": 0.14931824160886123, "learning_rate": 9.186932407346816e-05, "loss": 0.3766, "step": 1032 }, { "epoch": 0.2660913803651351, "grad_norm": 0.14988426793842805, "learning_rate": 9.18447261239584e-05, "loss": 0.4318, "step": 1033 }, { "epoch": 0.2663489712464179, "grad_norm": 0.17020066830486527, "learning_rate": 9.18200943256488e-05, "loss": 0.3892, "step": 1034 }, { "epoch": 0.2666065621277007, "grad_norm": 0.1712453662894019, "learning_rate": 9.179542869846441e-05, "loss": 0.4141, "step": 1035 }, { "epoch": 0.2666065621277007, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 AUC (fixed)": 0.8308014667365112, "eval_PRM F1 Neg": 0.6, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.4091796875, "eval_runtime": 17.1588, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 1035 }, { "epoch": 0.2668641530089835, "grad_norm": 0.13669254651581447, "learning_rate": 9.177072926235757e-05, "loss": 0.384, "step": 1036 }, { "epoch": 0.26712174389026627, "grad_norm": 0.16069639755617673, "learning_rate": 9.174599603730803e-05, "loss": 0.3246, "step": 1037 }, { "epoch": 0.26737933477154907, "grad_norm": 0.2247863127680151, "learning_rate": 9.172122904332285e-05, "loss": 0.3559, "step": 1038 }, { "epoch": 0.26763692565283187, "grad_norm": 0.16978345730453467, "learning_rate": 9.169642830043641e-05, "loss": 0.4354, "step": 1039 }, { "epoch": 0.26789451653411467, "grad_norm": 0.18000893954151356, "learning_rate": 9.167159382871039e-05, "loss": 0.3767, "step": 1040 }, { "epoch": 0.26789451653411467, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 AUC (fixed)": 0.8213724463069669, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.4064275622367859, "eval_runtime": 16.9395, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 1040 }, { "epoch": 0.2681521074153975, "grad_norm": 0.15685931245812837, "learning_rate": 9.164672564823373e-05, "loss": 0.456, "step": 1041 }, { "epoch": 0.2684096982966803, "grad_norm": 0.14901852400421192, "learning_rate": 9.162182377912267e-05, "loss": 0.3767, "step": 1042 }, { "epoch": 0.2686672891779631, "grad_norm": 0.13445209403749314, "learning_rate": 9.159688824152071e-05, "loss": 0.3573, "step": 1043 }, { "epoch": 0.2689248800592459, "grad_norm": 0.17431203821454808, "learning_rate": 9.157191905559852e-05, "loss": 0.4132, "step": 1044 }, { "epoch": 0.2691824709405287, "grad_norm": 0.24346105759432404, "learning_rate": 9.154691624155407e-05, "loss": 0.3811, "step": 1045 }, { "epoch": 0.2691824709405287, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.875, "eval_PRM F1 AUC": 0.7695128339444735, "eval_PRM F1 AUC (fixed)": 0.8169198533263489, "eval_PRM F1 Neg": 0.6153846153846154, "eval_PRM NPV": 0.5517241379310345, "eval_PRM Precision": 0.9090909090909091, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.4085582494735718, "eval_runtime": 17.7287, "eval_samples_per_second": 2.482, "eval_steps_per_second": 0.169, "step": 1045 }, { "epoch": 0.2694400618218115, "grad_norm": 0.1862374759893012, "learning_rate": 9.152187981961249e-05, "loss": 0.4444, "step": 1046 }, { "epoch": 0.2696976527030943, "grad_norm": 0.19340815671260683, "learning_rate": 9.149680981002609e-05, "loss": 0.4632, "step": 1047 }, { "epoch": 0.2699552435843771, "grad_norm": 0.1521736630568345, "learning_rate": 9.147170623307436e-05, "loss": 0.3079, "step": 1048 }, { "epoch": 0.2702128344656599, "grad_norm": 0.22388242364619593, "learning_rate": 9.144656910906396e-05, "loss": 0.4221, "step": 1049 }, { "epoch": 0.2704704253469427, "grad_norm": 0.2529846606801436, "learning_rate": 9.142139845832865e-05, "loss": 0.4404, "step": 1050 }, { "epoch": 0.2704704253469427, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8520710059171598, "eval_PRM F1 AUC": 0.6293871136720797, "eval_PRM F1 AUC (fixed)": 0.8208486118386591, "eval_PRM F1 Neg": 0.4186046511627907, "eval_PRM NPV": 0.45, "eval_PRM Precision": 0.8372093023255814, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.42311790585517883, "eval_runtime": 17.482, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 1050 }, { "epoch": 0.2707280162282255, "grad_norm": 0.17440932166602557, "learning_rate": 9.139619430122934e-05, "loss": 0.4214, "step": 1051 }, { "epoch": 0.2709856071095083, "grad_norm": 0.1566511663979366, "learning_rate": 9.137095665815405e-05, "loss": 0.4382, "step": 1052 }, { "epoch": 0.2712431979907911, "grad_norm": 0.1301890238471345, "learning_rate": 9.134568554951783e-05, "loss": 0.3407, "step": 1053 }, { "epoch": 0.2715007888720739, "grad_norm": 0.1849987303899487, "learning_rate": 9.13203809957629e-05, "loss": 0.3871, "step": 1054 }, { "epoch": 0.2717583797533567, "grad_norm": 0.1803736153989277, "learning_rate": 9.129504301735843e-05, "loss": 0.4206, "step": 1055 }, { "epoch": 0.2717583797533567, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.8166579360921948, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4222301244735718, "eval_runtime": 17.0144, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 1055 }, { "epoch": 0.27201597063463956, "grad_norm": 0.12021042483741588, "learning_rate": 9.12696716348007e-05, "loss": 0.4008, "step": 1056 }, { "epoch": 0.27227356151592236, "grad_norm": 0.18208081270330123, "learning_rate": 9.124426686861297e-05, "loss": 0.428, "step": 1057 }, { "epoch": 0.27253115239720516, "grad_norm": 0.25078268910891494, "learning_rate": 9.121882873934553e-05, "loss": 0.4336, "step": 1058 }, { "epoch": 0.27278874327848796, "grad_norm": 0.12547677332239998, "learning_rate": 9.119335726757564e-05, "loss": 0.3865, "step": 1059 }, { "epoch": 0.27304633415977075, "grad_norm": 0.11937745843039797, "learning_rate": 9.116785247390756e-05, "loss": 0.3921, "step": 1060 }, { "epoch": 0.27304633415977075, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.826348873755893, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.40696021914482117, "eval_runtime": 16.9725, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 1060 }, { "epoch": 0.27330392504105355, "grad_norm": 0.2627937741367757, "learning_rate": 9.114231437897244e-05, "loss": 0.5265, "step": 1061 }, { "epoch": 0.27356151592233635, "grad_norm": 0.1355591220720796, "learning_rate": 9.111674300342846e-05, "loss": 0.442, "step": 1062 }, { "epoch": 0.27381910680361915, "grad_norm": 0.1598848159314281, "learning_rate": 9.109113836796066e-05, "loss": 0.3194, "step": 1063 }, { "epoch": 0.27407669768490195, "grad_norm": 0.18613848933268956, "learning_rate": 9.106550049328097e-05, "loss": 0.4081, "step": 1064 }, { "epoch": 0.27433428856618475, "grad_norm": 0.17605562826410903, "learning_rate": 9.103982940012827e-05, "loss": 0.3616, "step": 1065 }, { "epoch": 0.27433428856618475, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8247773703509691, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4161931872367859, "eval_runtime": 17.1407, "eval_samples_per_second": 2.567, "eval_steps_per_second": 0.175, "step": 1065 }, { "epoch": 0.27459187944746755, "grad_norm": 0.13440588506280207, "learning_rate": 9.101412510926826e-05, "loss": 0.3541, "step": 1066 }, { "epoch": 0.27484947032875034, "grad_norm": 0.1264456406693554, "learning_rate": 9.09883876414935e-05, "loss": 0.4368, "step": 1067 }, { "epoch": 0.27510706121003314, "grad_norm": 0.1755640275626186, "learning_rate": 9.096261701762342e-05, "loss": 0.3912, "step": 1068 }, { "epoch": 0.27536465209131594, "grad_norm": 0.14262925831191228, "learning_rate": 9.093681325850424e-05, "loss": 0.3582, "step": 1069 }, { "epoch": 0.2756222429725988, "grad_norm": 0.13270810591162102, "learning_rate": 9.091097638500899e-05, "loss": 0.358, "step": 1070 }, { "epoch": 0.2756222429725988, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.823729701414353, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.44797584414482117, "eval_runtime": 16.9445, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 1070 }, { "epoch": 0.2758798338538816, "grad_norm": 0.29696661127794793, "learning_rate": 9.088510641803746e-05, "loss": 0.4006, "step": 1071 }, { "epoch": 0.2761374247351644, "grad_norm": 0.16416354495271582, "learning_rate": 9.085920337851628e-05, "loss": 0.349, "step": 1072 }, { "epoch": 0.2763950156164472, "grad_norm": 0.2389788938976279, "learning_rate": 9.083326728739877e-05, "loss": 0.4834, "step": 1073 }, { "epoch": 0.27665260649773, "grad_norm": 0.15513737344864312, "learning_rate": 9.080729816566502e-05, "loss": 0.3941, "step": 1074 }, { "epoch": 0.2769101973790128, "grad_norm": 0.12851916399871888, "learning_rate": 9.078129603432181e-05, "loss": 0.2987, "step": 1075 }, { "epoch": 0.2769101973790128, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 AUC (fixed)": 0.8156102671555788, "eval_PRM F1 Neg": 0.52, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.43838778138160706, "eval_runtime": 16.9665, "eval_samples_per_second": 2.593, "eval_steps_per_second": 0.177, "step": 1075 }, { "epoch": 0.2771677882602956, "grad_norm": 0.1591420230521014, "learning_rate": 9.075526091440263e-05, "loss": 0.3497, "step": 1076 }, { "epoch": 0.2774253791415784, "grad_norm": 0.17850950086356343, "learning_rate": 9.07291928269677e-05, "loss": 0.3665, "step": 1077 }, { "epoch": 0.2776829700228612, "grad_norm": 0.19765132445593747, "learning_rate": 9.070309179310383e-05, "loss": 0.3594, "step": 1078 }, { "epoch": 0.277940560904144, "grad_norm": 0.13591152152682912, "learning_rate": 9.067695783392453e-05, "loss": 0.3993, "step": 1079 }, { "epoch": 0.2781981517854268, "grad_norm": 0.17645809479483776, "learning_rate": 9.065079097056996e-05, "loss": 0.4008, "step": 1080 }, { "epoch": 0.2781981517854268, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.819800942902043, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.44264915585517883, "eval_runtime": 17.0278, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 1080 }, { "epoch": 0.2784557426667096, "grad_norm": 0.1742505264308386, "learning_rate": 9.062459122420683e-05, "loss": 0.3511, "step": 1081 }, { "epoch": 0.2787133335479924, "grad_norm": 0.19008003382534122, "learning_rate": 9.059835861602853e-05, "loss": 0.3842, "step": 1082 }, { "epoch": 0.2789709244292752, "grad_norm": 0.15138887112369492, "learning_rate": 9.057209316725498e-05, "loss": 0.4147, "step": 1083 }, { "epoch": 0.279228515310558, "grad_norm": 0.1613638075776943, "learning_rate": 9.054579489913268e-05, "loss": 0.4365, "step": 1084 }, { "epoch": 0.27948610619184083, "grad_norm": 0.16072174490961555, "learning_rate": 9.051946383293466e-05, "loss": 0.4441, "step": 1085 }, { "epoch": 0.27948610619184083, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 AUC (fixed)": 0.8213724463069669, "eval_PRM F1 Neg": 0.52, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4340376555919647, "eval_runtime": 17.4527, "eval_samples_per_second": 2.521, "eval_steps_per_second": 0.172, "step": 1085 }, { "epoch": 0.27974369707312363, "grad_norm": 0.1483662115680414, "learning_rate": 9.049309998996051e-05, "loss": 0.4089, "step": 1086 }, { "epoch": 0.28000128795440643, "grad_norm": 0.15321106916321484, "learning_rate": 9.046670339153634e-05, "loss": 0.3954, "step": 1087 }, { "epoch": 0.28025887883568923, "grad_norm": 0.15886847839102722, "learning_rate": 9.04402740590147e-05, "loss": 0.3894, "step": 1088 }, { "epoch": 0.28051646971697203, "grad_norm": 0.16250330935063964, "learning_rate": 9.041381201377468e-05, "loss": 0.468, "step": 1089 }, { "epoch": 0.2807740605982548, "grad_norm": 0.15623090822225083, "learning_rate": 9.03873172772218e-05, "loss": 0.3899, "step": 1090 }, { "epoch": 0.2807740605982548, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 AUC (fixed)": 0.8122053431115767, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4406072497367859, "eval_runtime": 17.0174, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 1090 }, { "epoch": 0.2810316514795376, "grad_norm": 0.15709351106877914, "learning_rate": 9.036078987078805e-05, "loss": 0.3625, "step": 1091 }, { "epoch": 0.2812892423608204, "grad_norm": 0.15802775459264787, "learning_rate": 9.033422981593181e-05, "loss": 0.3267, "step": 1092 }, { "epoch": 0.2815468332421032, "grad_norm": 0.1674648588059315, "learning_rate": 9.03076371341379e-05, "loss": 0.3682, "step": 1093 }, { "epoch": 0.281804424123386, "grad_norm": 0.1572499644765613, "learning_rate": 9.02810118469175e-05, "loss": 0.4096, "step": 1094 }, { "epoch": 0.2820620150046688, "grad_norm": 0.12563999943582055, "learning_rate": 9.025435397580824e-05, "loss": 0.3172, "step": 1095 }, { "epoch": 0.2820620150046688, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.7857517024620219, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4828657805919647, "eval_runtime": 16.9504, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 1095 }, { "epoch": 0.2823196058859516, "grad_norm": 0.18983275713366182, "learning_rate": 9.0227663542374e-05, "loss": 0.3968, "step": 1096 }, { "epoch": 0.2825771967672344, "grad_norm": 0.10634112725509623, "learning_rate": 9.020094056820508e-05, "loss": 0.2934, "step": 1097 }, { "epoch": 0.2828347876485172, "grad_norm": 0.23858461675868176, "learning_rate": 9.017418507491806e-05, "loss": 0.372, "step": 1098 }, { "epoch": 0.28309237852980007, "grad_norm": 0.17301605162005754, "learning_rate": 9.014739708415587e-05, "loss": 0.3716, "step": 1099 }, { "epoch": 0.28334996941108287, "grad_norm": 0.17341199523060663, "learning_rate": 9.012057661758769e-05, "loss": 0.4462, "step": 1100 }, { "epoch": 0.28334996941108287, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.84472049689441, "eval_PRM F1 AUC": 0.6922472498690415, "eval_PRM F1 AUC (fixed)": 0.7773703509690937, "eval_PRM F1 Neg": 0.5098039215686274, "eval_PRM NPV": 0.4642857142857143, "eval_PRM Precision": 0.8717948717948718, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.470703125, "eval_runtime": 17.1644, "eval_samples_per_second": 2.563, "eval_steps_per_second": 0.175, "step": 1100 }, { "epoch": 0.28360756029236567, "grad_norm": 0.16654404049101154, "learning_rate": 9.009372369690897e-05, "loss": 0.3597, "step": 1101 }, { "epoch": 0.28386515117364847, "grad_norm": 0.17791366931087743, "learning_rate": 9.006683834384142e-05, "loss": 0.3955, "step": 1102 }, { "epoch": 0.28412274205493127, "grad_norm": 0.26790999717018765, "learning_rate": 9.003992058013302e-05, "loss": 0.4953, "step": 1103 }, { "epoch": 0.28438033293621406, "grad_norm": 0.2471056020762633, "learning_rate": 9.00129704275579e-05, "loss": 0.4532, "step": 1104 }, { "epoch": 0.28463792381749686, "grad_norm": 0.172927513163023, "learning_rate": 8.998598790791644e-05, "loss": 0.3315, "step": 1105 }, { "epoch": 0.28463792381749686, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8375, "eval_PRM F1 AUC": 0.6862231534834993, "eval_PRM F1 AUC (fixed)": 0.7592980618124673, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.4482758620689655, "eval_PRM Precision": 0.8701298701298701, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4874822497367859, "eval_runtime": 16.8878, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 1105 }, { "epoch": 0.28489551469877966, "grad_norm": 0.17711079002730504, "learning_rate": 8.995897304303519e-05, "loss": 0.4616, "step": 1106 }, { "epoch": 0.28515310558006246, "grad_norm": 0.14990346735992197, "learning_rate": 8.993192585476687e-05, "loss": 0.2471, "step": 1107 }, { "epoch": 0.28541069646134526, "grad_norm": 0.17692223898478826, "learning_rate": 8.99048463649903e-05, "loss": 0.3902, "step": 1108 }, { "epoch": 0.28566828734262806, "grad_norm": 0.1637599027848208, "learning_rate": 8.98777345956105e-05, "loss": 0.447, "step": 1109 }, { "epoch": 0.28592587822391086, "grad_norm": 0.35664184288409917, "learning_rate": 8.985059056855858e-05, "loss": 0.4892, "step": 1110 }, { "epoch": 0.28592587822391086, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8654970760233918, "eval_PRM F1 AUC": 0.6414353064431639, "eval_PRM F1 AUC (fixed)": 0.7655840754321634, "eval_PRM F1 Neg": 0.43902439024390244, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8409090909090909, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5237926244735718, "eval_runtime": 17.068, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 1110 }, { "epoch": 0.28618346910519366, "grad_norm": 0.33498489598855613, "learning_rate": 8.982341430579172e-05, "loss": 0.5845, "step": 1111 }, { "epoch": 0.28644105998647645, "grad_norm": 0.2522230040086564, "learning_rate": 8.979620582929318e-05, "loss": 0.5213, "step": 1112 }, { "epoch": 0.2866986508677593, "grad_norm": 0.12854418234531897, "learning_rate": 8.976896516107229e-05, "loss": 0.3658, "step": 1113 }, { "epoch": 0.2869562417490421, "grad_norm": 0.15217942213386607, "learning_rate": 8.974169232316445e-05, "loss": 0.3509, "step": 1114 }, { "epoch": 0.2872138326303249, "grad_norm": 0.14638860334343684, "learning_rate": 8.9714387337631e-05, "loss": 0.4169, "step": 1115 }, { "epoch": 0.2872138326303249, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.7750130958617077, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4607599377632141, "eval_runtime": 17.0619, "eval_samples_per_second": 2.579, "eval_steps_per_second": 0.176, "step": 1115 }, { "epoch": 0.2874714235116077, "grad_norm": 0.19013707721833667, "learning_rate": 8.968705022655937e-05, "loss": 0.3119, "step": 1116 }, { "epoch": 0.2877290143928905, "grad_norm": 0.17302133014684773, "learning_rate": 8.965968101206291e-05, "loss": 0.3745, "step": 1117 }, { "epoch": 0.2879866052741733, "grad_norm": 0.1397272078529865, "learning_rate": 8.9632279716281e-05, "loss": 0.4289, "step": 1118 }, { "epoch": 0.2882441961554561, "grad_norm": 0.12129589043490052, "learning_rate": 8.960484636137894e-05, "loss": 0.3844, "step": 1119 }, { "epoch": 0.2885017870367389, "grad_norm": 0.1342621292452447, "learning_rate": 8.957738096954795e-05, "loss": 0.347, "step": 1120 }, { "epoch": 0.2885017870367389, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8035620743844946, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4545454680919647, "eval_runtime": 17.7692, "eval_samples_per_second": 2.476, "eval_steps_per_second": 0.169, "step": 1120 }, { "epoch": 0.2887593779180217, "grad_norm": 0.2146920067691594, "learning_rate": 8.954988356300518e-05, "loss": 0.448, "step": 1121 }, { "epoch": 0.2890169687993045, "grad_norm": 0.12042846139948085, "learning_rate": 8.952235416399369e-05, "loss": 0.3452, "step": 1122 }, { "epoch": 0.2892745596805873, "grad_norm": 0.2246769363893663, "learning_rate": 8.94947927947824e-05, "loss": 0.4023, "step": 1123 }, { "epoch": 0.2895321505618701, "grad_norm": 0.16829886390351667, "learning_rate": 8.94671994776661e-05, "loss": 0.4088, "step": 1124 }, { "epoch": 0.2897897414431529, "grad_norm": 0.19259174366772489, "learning_rate": 8.943957423496541e-05, "loss": 0.3848, "step": 1125 }, { "epoch": 0.2897897414431529, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8085385018334206, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4265802502632141, "eval_runtime": 17.042, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 1125 }, { "epoch": 0.2900473323244357, "grad_norm": 0.15085277159710533, "learning_rate": 8.94119170890268e-05, "loss": 0.4532, "step": 1126 }, { "epoch": 0.2903049232057185, "grad_norm": 0.15134893601674007, "learning_rate": 8.938422806222253e-05, "loss": 0.4272, "step": 1127 }, { "epoch": 0.29056251408700134, "grad_norm": 0.1827157497719352, "learning_rate": 8.935650717695063e-05, "loss": 0.3573, "step": 1128 }, { "epoch": 0.29082010496828414, "grad_norm": 0.15689178610227686, "learning_rate": 8.932875445563495e-05, "loss": 0.4795, "step": 1129 }, { "epoch": 0.29107769584956694, "grad_norm": 0.19929403334166856, "learning_rate": 8.930096992072505e-05, "loss": 0.4173, "step": 1130 }, { "epoch": 0.29107769584956694, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 AUC (fixed)": 0.7998952331063385, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4345703125, "eval_runtime": 17.6207, "eval_samples_per_second": 2.497, "eval_steps_per_second": 0.17, "step": 1130 }, { "epoch": 0.29133528673084974, "grad_norm": 0.18946647806924455, "learning_rate": 8.927315359469626e-05, "loss": 0.3222, "step": 1131 }, { "epoch": 0.29159287761213254, "grad_norm": 0.20696200780240526, "learning_rate": 8.924530550004956e-05, "loss": 0.3743, "step": 1132 }, { "epoch": 0.29185046849341534, "grad_norm": 0.1987515888651939, "learning_rate": 8.921742565931172e-05, "loss": 0.35, "step": 1133 }, { "epoch": 0.29210805937469814, "grad_norm": 0.16159976235476287, "learning_rate": 8.918951409503513e-05, "loss": 0.3929, "step": 1134 }, { "epoch": 0.29236565025598094, "grad_norm": 0.16238900311613275, "learning_rate": 8.916157082979784e-05, "loss": 0.3747, "step": 1135 }, { "epoch": 0.29236565025598094, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.6511262441068623, "eval_PRM F1 AUC (fixed)": 0.8017286537454165, "eval_PRM F1 Neg": 0.45454545454545453, "eval_PRM NPV": 0.47619047619047616, "eval_PRM Precision": 0.8470588235294118, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4612926244735718, "eval_runtime": 16.8421, "eval_samples_per_second": 2.613, "eval_steps_per_second": 0.178, "step": 1135 }, { "epoch": 0.29262324113726373, "grad_norm": 0.18428072984802213, "learning_rate": 8.913359588620357e-05, "loss": 0.4846, "step": 1136 }, { "epoch": 0.29288083201854653, "grad_norm": 0.1900315353785097, "learning_rate": 8.910558928688166e-05, "loss": 0.3433, "step": 1137 }, { "epoch": 0.29313842289982933, "grad_norm": 0.13568771290802525, "learning_rate": 8.907755105448704e-05, "loss": 0.364, "step": 1138 }, { "epoch": 0.29339601378111213, "grad_norm": 0.13052243820266574, "learning_rate": 8.904948121170023e-05, "loss": 0.3534, "step": 1139 }, { "epoch": 0.29365360466239493, "grad_norm": 0.22566695500407144, "learning_rate": 8.902137978122735e-05, "loss": 0.5242, "step": 1140 }, { "epoch": 0.29365360466239493, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.7899423782084861, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4554332494735718, "eval_runtime": 16.6283, "eval_samples_per_second": 2.646, "eval_steps_per_second": 0.18, "step": 1140 }, { "epoch": 0.29391119554367773, "grad_norm": 0.1692190710500419, "learning_rate": 8.899324678580004e-05, "loss": 0.4123, "step": 1141 }, { "epoch": 0.2941687864249606, "grad_norm": 0.20765894455220776, "learning_rate": 8.896508224817549e-05, "loss": 0.3285, "step": 1142 }, { "epoch": 0.2944263773062434, "grad_norm": 0.13904671627369197, "learning_rate": 8.893688619113639e-05, "loss": 0.4232, "step": 1143 }, { "epoch": 0.2946839681875262, "grad_norm": 0.13868165860035878, "learning_rate": 8.890865863749094e-05, "loss": 0.3716, "step": 1144 }, { "epoch": 0.294941559068809, "grad_norm": 0.1563081737442769, "learning_rate": 8.888039961007282e-05, "loss": 0.3796, "step": 1145 }, { "epoch": 0.294941559068809, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.7857517024620221, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.45871803164482117, "eval_runtime": 16.8684, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 1145 }, { "epoch": 0.2951991499500918, "grad_norm": 0.17148236643686612, "learning_rate": 8.885210913174116e-05, "loss": 0.4471, "step": 1146 }, { "epoch": 0.2954567408313746, "grad_norm": 0.18441483048141605, "learning_rate": 8.882378722538052e-05, "loss": 0.3662, "step": 1147 }, { "epoch": 0.2957143317126574, "grad_norm": 0.1267849212135647, "learning_rate": 8.879543391390091e-05, "loss": 0.3472, "step": 1148 }, { "epoch": 0.2959719225939402, "grad_norm": 0.21454118416807022, "learning_rate": 8.876704922023773e-05, "loss": 0.559, "step": 1149 }, { "epoch": 0.29622951347522297, "grad_norm": 0.13037442744739258, "learning_rate": 8.873863316735176e-05, "loss": 0.3644, "step": 1150 }, { "epoch": 0.29622951347522297, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.7967522262964902, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46084871888160706, "eval_runtime": 17.0718, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 1150 }, { "epoch": 0.29648710435650577, "grad_norm": 0.13833008365614993, "learning_rate": 8.871018577822915e-05, "loss": 0.4311, "step": 1151 }, { "epoch": 0.29674469523778857, "grad_norm": 0.14610234625415291, "learning_rate": 8.868170707588142e-05, "loss": 0.4, "step": 1152 }, { "epoch": 0.29700228611907137, "grad_norm": 0.17081565687354094, "learning_rate": 8.865319708334539e-05, "loss": 0.3739, "step": 1153 }, { "epoch": 0.29725987700035417, "grad_norm": 0.18591235797268513, "learning_rate": 8.86246558236832e-05, "loss": 0.4815, "step": 1154 }, { "epoch": 0.29751746788163697, "grad_norm": 0.15041370244571453, "learning_rate": 8.859608331998229e-05, "loss": 0.3936, "step": 1155 }, { "epoch": 0.29751746788163697, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8019905709795704, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4398970305919647, "eval_runtime": 17.1175, "eval_samples_per_second": 2.57, "eval_steps_per_second": 0.175, "step": 1155 }, { "epoch": 0.2977750587629198, "grad_norm": 0.18498795475592514, "learning_rate": 8.856747959535537e-05, "loss": 0.3891, "step": 1156 }, { "epoch": 0.2980326496442026, "grad_norm": 0.1865577774791989, "learning_rate": 8.85388446729404e-05, "loss": 0.3755, "step": 1157 }, { "epoch": 0.2982902405254854, "grad_norm": 0.14158700429660712, "learning_rate": 8.851017857590057e-05, "loss": 0.3832, "step": 1158 }, { "epoch": 0.2985478314067682, "grad_norm": 0.11877620381015096, "learning_rate": 8.848148132742431e-05, "loss": 0.3249, "step": 1159 }, { "epoch": 0.298805422288051, "grad_norm": 0.13393740338330443, "learning_rate": 8.845275295072523e-05, "loss": 0.3774, "step": 1160 }, { "epoch": 0.298805422288051, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8137768465165007, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.43741121888160706, "eval_runtime": 17.6799, "eval_samples_per_second": 2.489, "eval_steps_per_second": 0.17, "step": 1160 }, { "epoch": 0.2990630131693338, "grad_norm": 0.2809457665636938, "learning_rate": 8.842399346904214e-05, "loss": 0.5072, "step": 1161 }, { "epoch": 0.2993206040506166, "grad_norm": 0.1421598886917343, "learning_rate": 8.839520290563898e-05, "loss": 0.3696, "step": 1162 }, { "epoch": 0.2995781949318994, "grad_norm": 0.19354837911463907, "learning_rate": 8.836638128380485e-05, "loss": 0.4889, "step": 1163 }, { "epoch": 0.2998357858131822, "grad_norm": 0.1403723474570022, "learning_rate": 8.8337528626854e-05, "loss": 0.3794, "step": 1164 }, { "epoch": 0.300093376694465, "grad_norm": 0.16073944963198727, "learning_rate": 8.830864495812575e-05, "loss": 0.4333, "step": 1165 }, { "epoch": 0.300093376694465, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8150864326872709, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4271129369735718, "eval_runtime": 16.944, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 1165 }, { "epoch": 0.3003509675757478, "grad_norm": 0.1350182376247347, "learning_rate": 8.827973030098448e-05, "loss": 0.3809, "step": 1166 }, { "epoch": 0.3006085584570306, "grad_norm": 0.14958855249156072, "learning_rate": 8.825078467881969e-05, "loss": 0.4395, "step": 1167 }, { "epoch": 0.3008661493383134, "grad_norm": 0.128554203239887, "learning_rate": 8.822180811504593e-05, "loss": 0.3676, "step": 1168 }, { "epoch": 0.3011237402195962, "grad_norm": 0.17459651454266562, "learning_rate": 8.819280063310274e-05, "loss": 0.4544, "step": 1169 }, { "epoch": 0.301381331100879, "grad_norm": 0.18874387236409038, "learning_rate": 8.816376225645471e-05, "loss": 0.4498, "step": 1170 }, { "epoch": 0.301381331100879, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.7975379779989523, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.44717684388160706, "eval_runtime": 17.5798, "eval_samples_per_second": 2.503, "eval_steps_per_second": 0.171, "step": 1170 }, { "epoch": 0.30163892198216186, "grad_norm": 0.17317334322066305, "learning_rate": 8.813469300859136e-05, "loss": 0.4307, "step": 1171 }, { "epoch": 0.30189651286344465, "grad_norm": 0.15562637374979635, "learning_rate": 8.810559291302724e-05, "loss": 0.4605, "step": 1172 }, { "epoch": 0.30215410374472745, "grad_norm": 0.14318991515102034, "learning_rate": 8.807646199330187e-05, "loss": 0.4409, "step": 1173 }, { "epoch": 0.30241169462601025, "grad_norm": 0.11595524745244784, "learning_rate": 8.804730027297961e-05, "loss": 0.3555, "step": 1174 }, { "epoch": 0.30266928550729305, "grad_norm": 0.16136396366631714, "learning_rate": 8.801810777564982e-05, "loss": 0.3936, "step": 1175 }, { "epoch": 0.30266928550729305, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.7828706128863279, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4664417505264282, "eval_runtime": 17.0863, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 1175 }, { "epoch": 0.30292687638857585, "grad_norm": 0.1968764338436339, "learning_rate": 8.798888452492674e-05, "loss": 0.4913, "step": 1176 }, { "epoch": 0.30318446726985865, "grad_norm": 0.13855772989577, "learning_rate": 8.795963054444947e-05, "loss": 0.4691, "step": 1177 }, { "epoch": 0.30344205815114145, "grad_norm": 0.16407096095524348, "learning_rate": 8.793034585788199e-05, "loss": 0.3687, "step": 1178 }, { "epoch": 0.30369964903242425, "grad_norm": 0.1218858383609149, "learning_rate": 8.790103048891307e-05, "loss": 0.3499, "step": 1179 }, { "epoch": 0.30395723991370704, "grad_norm": 0.16665699691334412, "learning_rate": 8.787168446125638e-05, "loss": 0.3798, "step": 1180 }, { "epoch": 0.30395723991370704, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.7627029858564693, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4906782805919647, "eval_runtime": 17.0084, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 1180 }, { "epoch": 0.30421483079498984, "grad_norm": 0.15397147526861624, "learning_rate": 8.784230779865029e-05, "loss": 0.3445, "step": 1181 }, { "epoch": 0.30447242167627264, "grad_norm": 0.21275502542260502, "learning_rate": 8.781290052485802e-05, "loss": 0.4511, "step": 1182 }, { "epoch": 0.30473001255755544, "grad_norm": 0.16415926499365743, "learning_rate": 8.778346266366757e-05, "loss": 0.3753, "step": 1183 }, { "epoch": 0.30498760343883824, "grad_norm": 0.12378140355671932, "learning_rate": 8.775399423889161e-05, "loss": 0.3193, "step": 1184 }, { "epoch": 0.3052451943201211, "grad_norm": 0.16098141515356412, "learning_rate": 8.77244952743676e-05, "loss": 0.4169, "step": 1185 }, { "epoch": 0.3052451943201211, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.7705605028810895, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.48757103085517883, "eval_runtime": 17.5867, "eval_samples_per_second": 2.502, "eval_steps_per_second": 0.171, "step": 1185 }, { "epoch": 0.3055027852014039, "grad_norm": 0.17324325398639254, "learning_rate": 8.769496579395764e-05, "loss": 0.3733, "step": 1186 }, { "epoch": 0.3057603760826867, "grad_norm": 0.14197743620468575, "learning_rate": 8.766540582154859e-05, "loss": 0.369, "step": 1187 }, { "epoch": 0.3060179669639695, "grad_norm": 0.16480132985351342, "learning_rate": 8.76358153810519e-05, "loss": 0.394, "step": 1188 }, { "epoch": 0.3062755578452523, "grad_norm": 0.2826096008580452, "learning_rate": 8.760619449640372e-05, "loss": 0.468, "step": 1189 }, { "epoch": 0.3065331487265351, "grad_norm": 0.18957887520775457, "learning_rate": 8.757654319156482e-05, "loss": 0.4294, "step": 1190 }, { "epoch": 0.3065331487265351, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8072289156626505, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4574751555919647, "eval_runtime": 17.1127, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 1190 }, { "epoch": 0.3067907396078179, "grad_norm": 0.14414649332121532, "learning_rate": 8.754686149052057e-05, "loss": 0.3039, "step": 1191 }, { "epoch": 0.3070483304891007, "grad_norm": 0.17509755549957035, "learning_rate": 8.751714941728091e-05, "loss": 0.3898, "step": 1192 }, { "epoch": 0.3073059213703835, "grad_norm": 0.1932275456795746, "learning_rate": 8.748740699588034e-05, "loss": 0.3568, "step": 1193 }, { "epoch": 0.3075635122516663, "grad_norm": 0.1774795799754782, "learning_rate": 8.745763425037797e-05, "loss": 0.3454, "step": 1194 }, { "epoch": 0.3078211031329491, "grad_norm": 0.2659508438059728, "learning_rate": 8.742783120485739e-05, "loss": 0.3625, "step": 1195 }, { "epoch": 0.3078211031329491, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.8124672603457307, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4498401880264282, "eval_runtime": 16.9365, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 1195 }, { "epoch": 0.3080786940142319, "grad_norm": 0.21356756307895253, "learning_rate": 8.739799788342669e-05, "loss": 0.3284, "step": 1196 }, { "epoch": 0.3083362848955147, "grad_norm": 0.17366284083597983, "learning_rate": 8.736813431021849e-05, "loss": 0.3822, "step": 1197 }, { "epoch": 0.3085938757767975, "grad_norm": 0.22473261015938767, "learning_rate": 8.733824050938987e-05, "loss": 0.4305, "step": 1198 }, { "epoch": 0.30885146665808033, "grad_norm": 0.1812789568753846, "learning_rate": 8.730831650512235e-05, "loss": 0.3994, "step": 1199 }, { "epoch": 0.30910905753936313, "grad_norm": 0.20540965466740607, "learning_rate": 8.727836232162187e-05, "loss": 0.3863, "step": 1200 }, { "epoch": 0.30910905753936313, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8459926663174437, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.43190696835517883, "eval_runtime": 16.8974, "eval_samples_per_second": 2.604, "eval_steps_per_second": 0.178, "step": 1200 }, { "epoch": 0.30936664842064593, "grad_norm": 0.1896679470155028, "learning_rate": 8.724837798311882e-05, "loss": 0.4249, "step": 1201 }, { "epoch": 0.3096242393019287, "grad_norm": 0.1291647190340969, "learning_rate": 8.721836351386798e-05, "loss": 0.3658, "step": 1202 }, { "epoch": 0.3098818301832115, "grad_norm": 0.14056234051345792, "learning_rate": 8.718831893814843e-05, "loss": 0.4249, "step": 1203 }, { "epoch": 0.3101394210644943, "grad_norm": 0.20666558657223139, "learning_rate": 8.71582442802637e-05, "loss": 0.4737, "step": 1204 }, { "epoch": 0.3103970119457771, "grad_norm": 0.16662802933282916, "learning_rate": 8.71281395645416e-05, "loss": 0.4764, "step": 1205 }, { "epoch": 0.3103970119457771, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8496595075955998, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4136185944080353, "eval_runtime": 16.9638, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 1205 }, { "epoch": 0.3106546028270599, "grad_norm": 0.16339072732165263, "learning_rate": 8.709800481533427e-05, "loss": 0.4464, "step": 1206 }, { "epoch": 0.3109121937083427, "grad_norm": 0.1815034469123639, "learning_rate": 8.706784005701814e-05, "loss": 0.4031, "step": 1207 }, { "epoch": 0.3111697845896255, "grad_norm": 0.13853133121765238, "learning_rate": 8.703764531399392e-05, "loss": 0.431, "step": 1208 }, { "epoch": 0.3114273754709083, "grad_norm": 0.13783723603341652, "learning_rate": 8.700742061068657e-05, "loss": 0.382, "step": 1209 }, { "epoch": 0.3116849663521911, "grad_norm": 0.1405843355948723, "learning_rate": 8.697716597154527e-05, "loss": 0.3798, "step": 1210 }, { "epoch": 0.3116849663521911, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8512310110005238, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.41237571835517883, "eval_runtime": 17.4804, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 1210 }, { "epoch": 0.3119425572334739, "grad_norm": 0.18397417100794597, "learning_rate": 8.694688142104346e-05, "loss": 0.36, "step": 1211 }, { "epoch": 0.3122001481147567, "grad_norm": 0.10642471958300147, "learning_rate": 8.691656698367871e-05, "loss": 0.4115, "step": 1212 }, { "epoch": 0.3124577389960395, "grad_norm": 0.1994724055535455, "learning_rate": 8.688622268397286e-05, "loss": 0.4739, "step": 1213 }, { "epoch": 0.31271532987732237, "grad_norm": 0.11369822753136088, "learning_rate": 8.68558485464718e-05, "loss": 0.4602, "step": 1214 }, { "epoch": 0.31297292075860517, "grad_norm": 0.11256651847643659, "learning_rate": 8.682544459574562e-05, "loss": 0.3026, "step": 1215 }, { "epoch": 0.31297292075860517, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8342063907805134, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4140625, "eval_runtime": 17.2116, "eval_samples_per_second": 2.556, "eval_steps_per_second": 0.174, "step": 1215 }, { "epoch": 0.31323051163988797, "grad_norm": 0.17862063780763238, "learning_rate": 8.679501085638853e-05, "loss": 0.4273, "step": 1216 }, { "epoch": 0.31348810252117076, "grad_norm": 0.1577348090762122, "learning_rate": 8.676454735301878e-05, "loss": 0.3978, "step": 1217 }, { "epoch": 0.31374569340245356, "grad_norm": 0.15925934019021948, "learning_rate": 8.673405411027877e-05, "loss": 0.3517, "step": 1218 }, { "epoch": 0.31400328428373636, "grad_norm": 0.16926013606207752, "learning_rate": 8.670353115283492e-05, "loss": 0.3725, "step": 1219 }, { "epoch": 0.31426087516501916, "grad_norm": 0.18883500614297238, "learning_rate": 8.667297850537768e-05, "loss": 0.38, "step": 1220 }, { "epoch": 0.31426087516501916, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8255631220534311, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.41725853085517883, "eval_runtime": 17.4378, "eval_samples_per_second": 2.523, "eval_steps_per_second": 0.172, "step": 1220 }, { "epoch": 0.31451846604630196, "grad_norm": 0.14939234966264475, "learning_rate": 8.664239619262152e-05, "loss": 0.3146, "step": 1221 }, { "epoch": 0.31477605692758476, "grad_norm": 0.14149866397194702, "learning_rate": 8.661178423930491e-05, "loss": 0.3476, "step": 1222 }, { "epoch": 0.31503364780886756, "grad_norm": 0.14442653026119623, "learning_rate": 8.658114267019032e-05, "loss": 0.4064, "step": 1223 }, { "epoch": 0.31529123869015035, "grad_norm": 0.14810123407861983, "learning_rate": 8.655047151006412e-05, "loss": 0.3844, "step": 1224 }, { "epoch": 0.31554882957143315, "grad_norm": 0.17168154326680385, "learning_rate": 8.65197707837367e-05, "loss": 0.3731, "step": 1225 }, { "epoch": 0.31554882957143315, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.8258250392875851, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4500177502632141, "eval_runtime": 17.8052, "eval_samples_per_second": 2.471, "eval_steps_per_second": 0.168, "step": 1225 }, { "epoch": 0.31580642045271595, "grad_norm": 0.3030975977119537, "learning_rate": 8.648904051604228e-05, "loss": 0.4581, "step": 1226 }, { "epoch": 0.31606401133399875, "grad_norm": 0.1751484085095841, "learning_rate": 8.645828073183901e-05, "loss": 0.4038, "step": 1227 }, { "epoch": 0.3163216022152816, "grad_norm": 0.10830543210017876, "learning_rate": 8.642749145600896e-05, "loss": 0.2773, "step": 1228 }, { "epoch": 0.3165791930965644, "grad_norm": 0.12772794170071314, "learning_rate": 8.639667271345798e-05, "loss": 0.3576, "step": 1229 }, { "epoch": 0.3168367839778472, "grad_norm": 0.14268356543286403, "learning_rate": 8.636582452911582e-05, "loss": 0.3755, "step": 1230 }, { "epoch": 0.3168367839778472, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.817705605028811, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42356178164482117, "eval_runtime": 16.7115, "eval_samples_per_second": 2.633, "eval_steps_per_second": 0.18, "step": 1230 }, { "epoch": 0.31709437485913, "grad_norm": 0.12163397658951906, "learning_rate": 8.6334946927936e-05, "loss": 0.3552, "step": 1231 }, { "epoch": 0.3173519657404128, "grad_norm": 0.16776555706104138, "learning_rate": 8.630403993489586e-05, "loss": 0.3961, "step": 1232 }, { "epoch": 0.3176095566216956, "grad_norm": 0.17970020587684662, "learning_rate": 8.627310357499651e-05, "loss": 0.4193, "step": 1233 }, { "epoch": 0.3178671475029784, "grad_norm": 0.1806456252773367, "learning_rate": 8.624213787326283e-05, "loss": 0.3441, "step": 1234 }, { "epoch": 0.3181247383842612, "grad_norm": 0.13372390871625306, "learning_rate": 8.621114285474341e-05, "loss": 0.3791, "step": 1235 }, { "epoch": 0.3181247383842612, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8140387637506549, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.42666903138160706, "eval_runtime": 17.774, "eval_samples_per_second": 2.476, "eval_steps_per_second": 0.169, "step": 1235 }, { "epoch": 0.318382329265544, "grad_norm": 0.16891276628395552, "learning_rate": 8.618011854451056e-05, "loss": 0.3737, "step": 1236 }, { "epoch": 0.3186399201468268, "grad_norm": 0.12078289545573649, "learning_rate": 8.614906496766028e-05, "loss": 0.2555, "step": 1237 }, { "epoch": 0.3188975110281096, "grad_norm": 0.22927635404931196, "learning_rate": 8.611798214931228e-05, "loss": 0.4498, "step": 1238 }, { "epoch": 0.3191551019093924, "grad_norm": 0.14416880745920815, "learning_rate": 8.60868701146099e-05, "loss": 0.3825, "step": 1239 }, { "epoch": 0.3194126927906752, "grad_norm": 0.18370493477302663, "learning_rate": 8.60557288887201e-05, "loss": 0.4087, "step": 1240 }, { "epoch": 0.3194126927906752, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8192771084337349, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42551490664482117, "eval_runtime": 17.4223, "eval_samples_per_second": 2.525, "eval_steps_per_second": 0.172, "step": 1240 }, { "epoch": 0.319670283671958, "grad_norm": 0.13499526977426504, "learning_rate": 8.602455849683343e-05, "loss": 0.3337, "step": 1241 }, { "epoch": 0.31992787455324084, "grad_norm": 0.1650001933459186, "learning_rate": 8.599335896416411e-05, "loss": 0.3741, "step": 1242 }, { "epoch": 0.32018546543452364, "grad_norm": 0.2131474507015171, "learning_rate": 8.596213031594991e-05, "loss": 0.4309, "step": 1243 }, { "epoch": 0.32044305631580644, "grad_norm": 0.16270471474180964, "learning_rate": 8.593087257745206e-05, "loss": 0.3022, "step": 1244 }, { "epoch": 0.32070064719708924, "grad_norm": 0.28199811651187745, "learning_rate": 8.589958577395548e-05, "loss": 0.5201, "step": 1245 }, { "epoch": 0.32070064719708924, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8234677841801991, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4303089380264282, "eval_runtime": 17.5743, "eval_samples_per_second": 2.504, "eval_steps_per_second": 0.171, "step": 1245 }, { "epoch": 0.32095823807837204, "grad_norm": 0.17211826248051826, "learning_rate": 8.586826993076845e-05, "loss": 0.4354, "step": 1246 }, { "epoch": 0.32121582895965484, "grad_norm": 0.1558940660053975, "learning_rate": 8.583692507322283e-05, "loss": 0.4052, "step": 1247 }, { "epoch": 0.32147341984093764, "grad_norm": 0.15693953542368577, "learning_rate": 8.580555122667393e-05, "loss": 0.3479, "step": 1248 }, { "epoch": 0.32173101072222043, "grad_norm": 0.12866745799305607, "learning_rate": 8.57741484165005e-05, "loss": 0.3977, "step": 1249 }, { "epoch": 0.32198860160350323, "grad_norm": 0.1576725019290017, "learning_rate": 8.57427166681047e-05, "loss": 0.3907, "step": 1250 }, { "epoch": 0.32198860160350323, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.821896280775275, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4234730005264282, "eval_runtime": 16.929, "eval_samples_per_second": 2.599, "eval_steps_per_second": 0.177, "step": 1250 }, { "epoch": 0.32224619248478603, "grad_norm": 0.13994496627475964, "learning_rate": 8.571125600691214e-05, "loss": 0.4031, "step": 1251 }, { "epoch": 0.32250378336606883, "grad_norm": 0.19596879488832833, "learning_rate": 8.567976645837182e-05, "loss": 0.4396, "step": 1252 }, { "epoch": 0.32276137424735163, "grad_norm": 0.12227294951033923, "learning_rate": 8.564824804795607e-05, "loss": 0.3479, "step": 1253 }, { "epoch": 0.3230189651286344, "grad_norm": 0.14608353702519508, "learning_rate": 8.561670080116058e-05, "loss": 0.3804, "step": 1254 }, { "epoch": 0.3232765560099172, "grad_norm": 0.18672799730283188, "learning_rate": 8.558512474350437e-05, "loss": 0.3226, "step": 1255 }, { "epoch": 0.3232765560099172, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8174436877946569, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42018821835517883, "eval_runtime": 17.1514, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 1255 }, { "epoch": 0.3235341468912, "grad_norm": 0.11825448718166798, "learning_rate": 8.55535199005298e-05, "loss": 0.3897, "step": 1256 }, { "epoch": 0.3237917377724829, "grad_norm": 0.13160022422288747, "learning_rate": 8.552188629780244e-05, "loss": 0.3846, "step": 1257 }, { "epoch": 0.3240493286537657, "grad_norm": 0.15730486806555002, "learning_rate": 8.549022396091117e-05, "loss": 0.4055, "step": 1258 }, { "epoch": 0.3243069195350485, "grad_norm": 0.1749720457799955, "learning_rate": 8.545853291546815e-05, "loss": 0.3278, "step": 1259 }, { "epoch": 0.3245645104163313, "grad_norm": 0.12655220053680086, "learning_rate": 8.542681318710868e-05, "loss": 0.34, "step": 1260 }, { "epoch": 0.3245645104163313, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8208486118386591, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4215198755264282, "eval_runtime": 16.6848, "eval_samples_per_second": 2.637, "eval_steps_per_second": 0.18, "step": 1260 }, { "epoch": 0.3248221012976141, "grad_norm": 0.18477328036303636, "learning_rate": 8.53950648014913e-05, "loss": 0.4419, "step": 1261 }, { "epoch": 0.3250796921788969, "grad_norm": 0.13539757208711653, "learning_rate": 8.536328778429776e-05, "loss": 0.3835, "step": 1262 }, { "epoch": 0.32533728306017967, "grad_norm": 0.14506415255471578, "learning_rate": 8.533148216123294e-05, "loss": 0.3345, "step": 1263 }, { "epoch": 0.32559487394146247, "grad_norm": 0.17447624941093595, "learning_rate": 8.529964795802485e-05, "loss": 0.448, "step": 1264 }, { "epoch": 0.32585246482274527, "grad_norm": 0.13471232226570085, "learning_rate": 8.526778520042465e-05, "loss": 0.3891, "step": 1265 }, { "epoch": 0.32585246482274527, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8292299633315872, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4249822497367859, "eval_runtime": 17.2677, "eval_samples_per_second": 2.548, "eval_steps_per_second": 0.174, "step": 1265 }, { "epoch": 0.32611005570402807, "grad_norm": 0.14133878815996587, "learning_rate": 8.523589391420659e-05, "loss": 0.3642, "step": 1266 }, { "epoch": 0.32636764658531087, "grad_norm": 0.15809887204198128, "learning_rate": 8.520397412516796e-05, "loss": 0.4276, "step": 1267 }, { "epoch": 0.32662523746659367, "grad_norm": 0.17408018223997435, "learning_rate": 8.517202585912916e-05, "loss": 0.3671, "step": 1268 }, { "epoch": 0.32688282834787646, "grad_norm": 0.14759042263439778, "learning_rate": 8.514004914193359e-05, "loss": 0.3888, "step": 1269 }, { "epoch": 0.32714041922915926, "grad_norm": 0.142151912473614, "learning_rate": 8.510804399944768e-05, "loss": 0.3761, "step": 1270 }, { "epoch": 0.32714041922915926, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8289680460974332, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4115767180919647, "eval_runtime": 17.5498, "eval_samples_per_second": 2.507, "eval_steps_per_second": 0.171, "step": 1270 }, { "epoch": 0.3273980101104421, "grad_norm": 0.16297593692085313, "learning_rate": 8.507601045756085e-05, "loss": 0.3486, "step": 1271 }, { "epoch": 0.3276556009917249, "grad_norm": 0.1488473489630805, "learning_rate": 8.504394854218549e-05, "loss": 0.3507, "step": 1272 }, { "epoch": 0.3279131918730077, "grad_norm": 0.14840130142532929, "learning_rate": 8.501185827925695e-05, "loss": 0.3529, "step": 1273 }, { "epoch": 0.3281707827542905, "grad_norm": 0.24385263451908412, "learning_rate": 8.49797396947335e-05, "loss": 0.4821, "step": 1274 }, { "epoch": 0.3284283736355733, "grad_norm": 0.1930800362732749, "learning_rate": 8.49475928145963e-05, "loss": 0.4544, "step": 1275 }, { "epoch": 0.3284283736355733, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8318491356731273, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.41512784361839294, "eval_runtime": 17.0142, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 1275 }, { "epoch": 0.3286859645168561, "grad_norm": 0.19851611447060466, "learning_rate": 8.491541766484948e-05, "loss": 0.3297, "step": 1276 }, { "epoch": 0.3289435553981389, "grad_norm": 0.21440471176504394, "learning_rate": 8.48832142715199e-05, "loss": 0.4597, "step": 1277 }, { "epoch": 0.3292011462794217, "grad_norm": 0.18507804814086945, "learning_rate": 8.485098266065744e-05, "loss": 0.3727, "step": 1278 }, { "epoch": 0.3294587371607045, "grad_norm": 0.1530855606606991, "learning_rate": 8.481872285833466e-05, "loss": 0.4036, "step": 1279 }, { "epoch": 0.3297163280419873, "grad_norm": 0.15978439362907434, "learning_rate": 8.478643489064696e-05, "loss": 0.3761, "step": 1280 }, { "epoch": 0.3297163280419873, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8389209009952854, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.41139915585517883, "eval_runtime": 17.4856, "eval_samples_per_second": 2.516, "eval_steps_per_second": 0.172, "step": 1280 }, { "epoch": 0.3299739189232701, "grad_norm": 0.16227483798866657, "learning_rate": 8.475411878371257e-05, "loss": 0.3174, "step": 1281 }, { "epoch": 0.3302315098045529, "grad_norm": 0.21017507599791935, "learning_rate": 8.472177456367247e-05, "loss": 0.4298, "step": 1282 }, { "epoch": 0.3304891006858357, "grad_norm": 0.13204248189334422, "learning_rate": 8.468940225669032e-05, "loss": 0.3534, "step": 1283 }, { "epoch": 0.3307466915671185, "grad_norm": 0.14258606263414392, "learning_rate": 8.465700188895258e-05, "loss": 0.3688, "step": 1284 }, { "epoch": 0.3310042824484013, "grad_norm": 0.1305835169588656, "learning_rate": 8.462457348666835e-05, "loss": 0.3611, "step": 1285 }, { "epoch": 0.3310042824484013, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8528025144054479, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4419389069080353, "eval_runtime": 17.0583, "eval_samples_per_second": 2.579, "eval_steps_per_second": 0.176, "step": 1285 }, { "epoch": 0.33126187332968415, "grad_norm": 0.16092013947178962, "learning_rate": 8.459211707606944e-05, "loss": 0.372, "step": 1286 }, { "epoch": 0.33151946421096695, "grad_norm": 0.17778770214874737, "learning_rate": 8.45596326834103e-05, "loss": 0.3949, "step": 1287 }, { "epoch": 0.33177705509224975, "grad_norm": 0.18362134703055624, "learning_rate": 8.452712033496804e-05, "loss": 0.3685, "step": 1288 }, { "epoch": 0.33203464597353255, "grad_norm": 0.17087794860624836, "learning_rate": 8.449458005704234e-05, "loss": 0.385, "step": 1289 }, { "epoch": 0.33229223685481535, "grad_norm": 0.18615913920379806, "learning_rate": 8.446201187595553e-05, "loss": 0.4307, "step": 1290 }, { "epoch": 0.33229223685481535, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.854635935044526, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.39657315611839294, "eval_runtime": 16.9029, "eval_samples_per_second": 2.603, "eval_steps_per_second": 0.177, "step": 1290 }, { "epoch": 0.33254982773609815, "grad_norm": 0.1460038447016405, "learning_rate": 8.442941581805244e-05, "loss": 0.4036, "step": 1291 }, { "epoch": 0.33280741861738095, "grad_norm": 0.11943139862815354, "learning_rate": 8.439679190970052e-05, "loss": 0.3282, "step": 1292 }, { "epoch": 0.33306500949866374, "grad_norm": 0.17332064832884891, "learning_rate": 8.436414017728969e-05, "loss": 0.427, "step": 1293 }, { "epoch": 0.33332260037994654, "grad_norm": 0.15322325576197193, "learning_rate": 8.433146064723244e-05, "loss": 0.3419, "step": 1294 }, { "epoch": 0.33358019126122934, "grad_norm": 0.13911380716005922, "learning_rate": 8.42987533459637e-05, "loss": 0.4263, "step": 1295 }, { "epoch": 0.33358019126122934, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8425877422734416, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3982599377632141, "eval_runtime": 16.8784, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 1295 }, { "epoch": 0.33383778214251214, "grad_norm": 0.18206489318644195, "learning_rate": 8.426601829994084e-05, "loss": 0.3426, "step": 1296 }, { "epoch": 0.33409537302379494, "grad_norm": 0.18250021523584306, "learning_rate": 8.423325553564376e-05, "loss": 0.4747, "step": 1297 }, { "epoch": 0.33435296390507774, "grad_norm": 0.11819516066568826, "learning_rate": 8.42004650795747e-05, "loss": 0.3437, "step": 1298 }, { "epoch": 0.33461055478636054, "grad_norm": 0.19065441482794301, "learning_rate": 8.416764695825835e-05, "loss": 0.4615, "step": 1299 }, { "epoch": 0.3348681456676434, "grad_norm": 0.1380286940212448, "learning_rate": 8.413480119824173e-05, "loss": 0.3242, "step": 1300 }, { "epoch": 0.3348681456676434, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.8331587218438973, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4088245630264282, "eval_runtime": 17.1128, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 1300 }, { "epoch": 0.3351257365489262, "grad_norm": 0.15578851670667726, "learning_rate": 8.410192782609429e-05, "loss": 0.3764, "step": 1301 }, { "epoch": 0.335383327430209, "grad_norm": 0.215388303388419, "learning_rate": 8.406902686840772e-05, "loss": 0.3254, "step": 1302 }, { "epoch": 0.3356409183114918, "grad_norm": 0.13339317338676554, "learning_rate": 8.403609835179613e-05, "loss": 0.4124, "step": 1303 }, { "epoch": 0.3358985091927746, "grad_norm": 0.14146535775312236, "learning_rate": 8.400314230289583e-05, "loss": 0.4055, "step": 1304 }, { "epoch": 0.3361561000740574, "grad_norm": 0.14849592257542354, "learning_rate": 8.397015874836547e-05, "loss": 0.3757, "step": 1305 }, { "epoch": 0.3361561000740574, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8242535358826611, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4293323755264282, "eval_runtime": 17.386, "eval_samples_per_second": 2.531, "eval_steps_per_second": 0.173, "step": 1305 }, { "epoch": 0.3364136909553402, "grad_norm": 0.17936713734274362, "learning_rate": 8.39371477148859e-05, "loss": 0.4234, "step": 1306 }, { "epoch": 0.336671281836623, "grad_norm": 0.13451082024384375, "learning_rate": 8.390410922916024e-05, "loss": 0.371, "step": 1307 }, { "epoch": 0.3369288727179058, "grad_norm": 0.1309211290832178, "learning_rate": 8.387104331791376e-05, "loss": 0.3937, "step": 1308 }, { "epoch": 0.3371864635991886, "grad_norm": 0.2278044101515965, "learning_rate": 8.383795000789398e-05, "loss": 0.4203, "step": 1309 }, { "epoch": 0.3374440544804714, "grad_norm": 0.1840985853408649, "learning_rate": 8.380482932587055e-05, "loss": 0.3201, "step": 1310 }, { "epoch": 0.3374440544804714, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8414634146341463, "eval_PRM F1 AUC": 0.6547930853850183, "eval_PRM F1 AUC (fixed)": 0.8169198533263489, "eval_PRM F1 Neg": 0.4583333333333333, "eval_PRM NPV": 0.44, "eval_PRM Precision": 0.8518518518518519, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42311790585517883, "eval_runtime": 16.929, "eval_samples_per_second": 2.599, "eval_steps_per_second": 0.177, "step": 1310 }, { "epoch": 0.3377016453617542, "grad_norm": 0.1305953076616349, "learning_rate": 8.377168129863525e-05, "loss": 0.3281, "step": 1311 }, { "epoch": 0.337959236243037, "grad_norm": 0.1649868811408297, "learning_rate": 8.373850595300202e-05, "loss": 0.3613, "step": 1312 }, { "epoch": 0.3382168271243198, "grad_norm": 0.19185949815093697, "learning_rate": 8.370530331580686e-05, "loss": 0.3323, "step": 1313 }, { "epoch": 0.33847441800560263, "grad_norm": 0.1833500953398535, "learning_rate": 8.367207341390785e-05, "loss": 0.4303, "step": 1314 }, { "epoch": 0.3387320088868854, "grad_norm": 0.14749333207401943, "learning_rate": 8.363881627418515e-05, "loss": 0.3659, "step": 1315 }, { "epoch": 0.3387320088868854, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8323729701414352, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46297940611839294, "eval_runtime": 17.1502, "eval_samples_per_second": 2.566, "eval_steps_per_second": 0.175, "step": 1315 }, { "epoch": 0.3389895997681682, "grad_norm": 0.1798958834222602, "learning_rate": 8.360553192354094e-05, "loss": 0.3787, "step": 1316 }, { "epoch": 0.339247190649451, "grad_norm": 0.15965668527631885, "learning_rate": 8.357222038889938e-05, "loss": 0.3776, "step": 1317 }, { "epoch": 0.3395047815307338, "grad_norm": 0.13709013840232095, "learning_rate": 8.35388816972067e-05, "loss": 0.3272, "step": 1318 }, { "epoch": 0.3397623724120166, "grad_norm": 0.17306432176073624, "learning_rate": 8.3505515875431e-05, "loss": 0.3394, "step": 1319 }, { "epoch": 0.3400199632932994, "grad_norm": 0.20485278000248477, "learning_rate": 8.347212295056239e-05, "loss": 0.3999, "step": 1320 }, { "epoch": 0.3400199632932994, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8082765845992667, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.5025745630264282, "eval_runtime": 17.4317, "eval_samples_per_second": 2.524, "eval_steps_per_second": 0.172, "step": 1320 }, { "epoch": 0.3402775541745822, "grad_norm": 0.21742616600145087, "learning_rate": 8.343870294961289e-05, "loss": 0.3972, "step": 1321 }, { "epoch": 0.340535145055865, "grad_norm": 0.15347377286264746, "learning_rate": 8.34052558996164e-05, "loss": 0.3675, "step": 1322 }, { "epoch": 0.3407927359371478, "grad_norm": 0.11522537504058397, "learning_rate": 8.337178182762875e-05, "loss": 0.2629, "step": 1323 }, { "epoch": 0.3410503268184306, "grad_norm": 0.17747280570334042, "learning_rate": 8.333828076072758e-05, "loss": 0.3105, "step": 1324 }, { "epoch": 0.3413079176997134, "grad_norm": 0.14334080436061902, "learning_rate": 8.33047527260124e-05, "loss": 0.297, "step": 1325 }, { "epoch": 0.3413079176997134, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8343558282208589, "eval_PRM F1 AUC": 0.6487689889994761, "eval_PRM F1 AUC (fixed)": 0.7998952331063385, "eval_PRM F1 Neg": 0.4489795918367347, "eval_PRM NPV": 0.4230769230769231, "eval_PRM Precision": 0.85, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4607599377632141, "eval_runtime": 16.9502, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 1325 }, { "epoch": 0.3415655085809962, "grad_norm": 0.12958132437691017, "learning_rate": 8.327119775060448e-05, "loss": 0.3461, "step": 1326 }, { "epoch": 0.341823099462279, "grad_norm": 0.16596786806410102, "learning_rate": 8.323761586164695e-05, "loss": 0.4507, "step": 1327 }, { "epoch": 0.3420806903435618, "grad_norm": 0.16310848530413852, "learning_rate": 8.320400708630469e-05, "loss": 0.3616, "step": 1328 }, { "epoch": 0.34233828122484466, "grad_norm": 0.1531680955964758, "learning_rate": 8.317037145176429e-05, "loss": 0.3164, "step": 1329 }, { "epoch": 0.34259587210612746, "grad_norm": 0.157358284374019, "learning_rate": 8.313670898523411e-05, "loss": 0.4087, "step": 1330 }, { "epoch": 0.34259587210612746, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8017286537454165, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.48268821835517883, "eval_runtime": 16.476, "eval_samples_per_second": 2.671, "eval_steps_per_second": 0.182, "step": 1330 }, { "epoch": 0.34285346298741026, "grad_norm": 0.15273514663059792, "learning_rate": 8.310301971394423e-05, "loss": 0.3618, "step": 1331 }, { "epoch": 0.34311105386869306, "grad_norm": 0.1485857094378795, "learning_rate": 8.306930366514636e-05, "loss": 0.3632, "step": 1332 }, { "epoch": 0.34336864474997586, "grad_norm": 0.17822254981407065, "learning_rate": 8.30355608661139e-05, "loss": 0.4401, "step": 1333 }, { "epoch": 0.34362623563125866, "grad_norm": 0.1308862540507762, "learning_rate": 8.300179134414188e-05, "loss": 0.3314, "step": 1334 }, { "epoch": 0.34388382651254146, "grad_norm": 0.2297224618715055, "learning_rate": 8.296799512654695e-05, "loss": 0.3424, "step": 1335 }, { "epoch": 0.34388382651254146, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8027763226820326, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.49440696835517883, "eval_runtime": 17.6253, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 1335 }, { "epoch": 0.34414141739382426, "grad_norm": 0.14532675301528403, "learning_rate": 8.293417224066737e-05, "loss": 0.3423, "step": 1336 }, { "epoch": 0.34439900827510705, "grad_norm": 0.11052412566857149, "learning_rate": 8.290032271386294e-05, "loss": 0.3278, "step": 1337 }, { "epoch": 0.34465659915638985, "grad_norm": 0.14583081075008858, "learning_rate": 8.286644657351505e-05, "loss": 0.3772, "step": 1338 }, { "epoch": 0.34491419003767265, "grad_norm": 0.20985079572005483, "learning_rate": 8.283254384702659e-05, "loss": 0.419, "step": 1339 }, { "epoch": 0.34517178091895545, "grad_norm": 0.2044333659003953, "learning_rate": 8.279861456182194e-05, "loss": 0.426, "step": 1340 }, { "epoch": 0.34517178091895545, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8132530120481928, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4859730005264282, "eval_runtime": 16.4089, "eval_samples_per_second": 2.681, "eval_steps_per_second": 0.183, "step": 1340 }, { "epoch": 0.34542937180023825, "grad_norm": 0.1488553394812171, "learning_rate": 8.276465874534702e-05, "loss": 0.3617, "step": 1341 }, { "epoch": 0.34568696268152105, "grad_norm": 0.14487188948309115, "learning_rate": 8.273067642506914e-05, "loss": 0.3837, "step": 1342 }, { "epoch": 0.3459445535628039, "grad_norm": 0.19509054206903778, "learning_rate": 8.269666762847712e-05, "loss": 0.4664, "step": 1343 }, { "epoch": 0.3462021444440867, "grad_norm": 0.1877184003038439, "learning_rate": 8.266263238308115e-05, "loss": 0.356, "step": 1344 }, { "epoch": 0.3464597353253695, "grad_norm": 0.12332032428633803, "learning_rate": 8.262857071641283e-05, "loss": 0.3118, "step": 1345 }, { "epoch": 0.3464597353253695, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 AUC (fixed)": 0.8111576741749608, "eval_PRM F1 Neg": 0.52, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.453125, "eval_runtime": 16.8925, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 1345 }, { "epoch": 0.3467173262066523, "grad_norm": 0.1311427978034802, "learning_rate": 8.259448265602513e-05, "loss": 0.3584, "step": 1346 }, { "epoch": 0.3469749170879351, "grad_norm": 0.23254126235500683, "learning_rate": 8.256036822949237e-05, "loss": 0.3641, "step": 1347 }, { "epoch": 0.3472325079692179, "grad_norm": 0.17118025943518272, "learning_rate": 8.252622746441021e-05, "loss": 0.3598, "step": 1348 }, { "epoch": 0.3474900988505007, "grad_norm": 0.162229989839118, "learning_rate": 8.249206038839559e-05, "loss": 0.4044, "step": 1349 }, { "epoch": 0.3477476897317835, "grad_norm": 0.20043217561988813, "learning_rate": 8.245786702908675e-05, "loss": 0.4092, "step": 1350 }, { "epoch": 0.3477476897317835, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8875739644970414, "eval_PRM F1 AUC": 0.7126767941330541, "eval_PRM F1 AUC (fixed)": 0.8260869565217392, "eval_PRM F1 Neg": 0.5581395348837209, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.872093023255814, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.46120384335517883, "eval_runtime": 16.3219, "eval_samples_per_second": 2.696, "eval_steps_per_second": 0.184, "step": 1350 }, { "epoch": 0.3480052806130663, "grad_norm": 0.1468694486131412, "learning_rate": 8.24236474141432e-05, "loss": 0.355, "step": 1351 }, { "epoch": 0.3482628714943491, "grad_norm": 0.11661797452146432, "learning_rate": 8.238940157124568e-05, "loss": 0.2925, "step": 1352 }, { "epoch": 0.3485204623756319, "grad_norm": 0.21304593212659667, "learning_rate": 8.235512952809613e-05, "loss": 0.464, "step": 1353 }, { "epoch": 0.3487780532569147, "grad_norm": 0.16172080694612898, "learning_rate": 8.23208313124177e-05, "loss": 0.3323, "step": 1354 }, { "epoch": 0.3490356441381975, "grad_norm": 0.22435519944824392, "learning_rate": 8.228650695195472e-05, "loss": 0.3813, "step": 1355 }, { "epoch": 0.3490356441381975, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8318491356731273, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4624467194080353, "eval_runtime": 17.4116, "eval_samples_per_second": 2.527, "eval_steps_per_second": 0.172, "step": 1355 }, { "epoch": 0.3492932350194803, "grad_norm": 0.19975174090905976, "learning_rate": 8.225215647447265e-05, "loss": 0.5092, "step": 1356 }, { "epoch": 0.34955082590076314, "grad_norm": 0.3079830518811906, "learning_rate": 8.221777990775809e-05, "loss": 0.4776, "step": 1357 }, { "epoch": 0.34980841678204594, "grad_norm": 0.17480055910468015, "learning_rate": 8.218337727961873e-05, "loss": 0.3814, "step": 1358 }, { "epoch": 0.35006600766332874, "grad_norm": 0.14224167471586507, "learning_rate": 8.214894861788336e-05, "loss": 0.3662, "step": 1359 }, { "epoch": 0.35032359854461154, "grad_norm": 0.15896607144738206, "learning_rate": 8.21144939504018e-05, "loss": 0.4329, "step": 1360 }, { "epoch": 0.35032359854461154, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8395061728395061, "eval_PRM F1 AUC": 0.6705081194342588, "eval_PRM F1 AUC (fixed)": 0.8344683080146674, "eval_PRM F1 Neg": 0.48, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8607594936708861, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42800071835517883, "eval_runtime": 17.6248, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 1360 }, { "epoch": 0.35058118942589434, "grad_norm": 0.18087938119665922, "learning_rate": 8.208001330504496e-05, "loss": 0.3368, "step": 1361 }, { "epoch": 0.35083878030717713, "grad_norm": 0.1909163053669263, "learning_rate": 8.204550670970469e-05, "loss": 0.3536, "step": 1362 }, { "epoch": 0.35109637118845993, "grad_norm": 0.19560014969971432, "learning_rate": 8.201097419229389e-05, "loss": 0.3739, "step": 1363 }, { "epoch": 0.35135396206974273, "grad_norm": 0.16676037559523177, "learning_rate": 8.197641578074642e-05, "loss": 0.4326, "step": 1364 }, { "epoch": 0.35161155295102553, "grad_norm": 0.14036581651181826, "learning_rate": 8.194183150301706e-05, "loss": 0.2584, "step": 1365 }, { "epoch": 0.35161155295102553, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8606600314300681, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.42196378111839294, "eval_runtime": 17.4568, "eval_samples_per_second": 2.521, "eval_steps_per_second": 0.172, "step": 1365 }, { "epoch": 0.35186914383230833, "grad_norm": 0.2348522807595575, "learning_rate": 8.190722138708152e-05, "loss": 0.4836, "step": 1366 }, { "epoch": 0.3521267347135911, "grad_norm": 0.12127022912515531, "learning_rate": 8.187258546093645e-05, "loss": 0.3511, "step": 1367 }, { "epoch": 0.3523843255948739, "grad_norm": 0.24288760008600477, "learning_rate": 8.183792375259931e-05, "loss": 0.4685, "step": 1368 }, { "epoch": 0.3526419164761567, "grad_norm": 0.2538830643188772, "learning_rate": 8.180323629010848e-05, "loss": 0.4104, "step": 1369 }, { "epoch": 0.3528995073574395, "grad_norm": 0.1321031597475086, "learning_rate": 8.176852310152314e-05, "loss": 0.33, "step": 1370 }, { "epoch": 0.3528995073574395, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8716605552645363, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.41823509335517883, "eval_runtime": 16.8512, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 1370 }, { "epoch": 0.3531570982387223, "grad_norm": 0.17062861788107217, "learning_rate": 8.173378421492329e-05, "loss": 0.3892, "step": 1371 }, { "epoch": 0.3534146891200052, "grad_norm": 0.13316230294852624, "learning_rate": 8.169901965840971e-05, "loss": 0.3915, "step": 1372 }, { "epoch": 0.353672280001288, "grad_norm": 0.17518396719677154, "learning_rate": 8.166422946010396e-05, "loss": 0.393, "step": 1373 }, { "epoch": 0.3539298708825708, "grad_norm": 0.15370184459909259, "learning_rate": 8.162941364814831e-05, "loss": 0.3648, "step": 1374 }, { "epoch": 0.3541874617638536, "grad_norm": 0.1330686698203916, "learning_rate": 8.159457225070577e-05, "loss": 0.3917, "step": 1375 }, { "epoch": 0.3541874617638536, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8666841278156102, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.3955078125, "eval_runtime": 17.3397, "eval_samples_per_second": 2.538, "eval_steps_per_second": 0.173, "step": 1375 }, { "epoch": 0.35444505264513637, "grad_norm": 0.16703914422429106, "learning_rate": 8.155970529596006e-05, "loss": 0.3635, "step": 1376 }, { "epoch": 0.35470264352641917, "grad_norm": 0.15493303473551956, "learning_rate": 8.152481281211557e-05, "loss": 0.4039, "step": 1377 }, { "epoch": 0.35496023440770197, "grad_norm": 0.13203534949022494, "learning_rate": 8.148989482739731e-05, "loss": 0.3889, "step": 1378 }, { "epoch": 0.35521782528898477, "grad_norm": 0.12849488823611613, "learning_rate": 8.145495137005097e-05, "loss": 0.3698, "step": 1379 }, { "epoch": 0.35547541617026757, "grad_norm": 0.1290611628936926, "learning_rate": 8.141998246834277e-05, "loss": 0.3191, "step": 1380 }, { "epoch": 0.35547541617026757, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8635411210057622, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.3990589380264282, "eval_runtime": 17.0379, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 1380 }, { "epoch": 0.35573300705155037, "grad_norm": 0.15518361514459356, "learning_rate": 8.138498815055958e-05, "loss": 0.3809, "step": 1381 }, { "epoch": 0.35599059793283316, "grad_norm": 0.21866681354392167, "learning_rate": 8.134996844500881e-05, "loss": 0.4957, "step": 1382 }, { "epoch": 0.35624818881411596, "grad_norm": 0.16691264432842712, "learning_rate": 8.131492338001839e-05, "loss": 0.4661, "step": 1383 }, { "epoch": 0.35650577969539876, "grad_norm": 0.14048437549847448, "learning_rate": 8.12798529839368e-05, "loss": 0.3434, "step": 1384 }, { "epoch": 0.35676337057668156, "grad_norm": 0.18509547515632593, "learning_rate": 8.124475728513297e-05, "loss": 0.3905, "step": 1385 }, { "epoch": 0.35676337057668156, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8556836039811421, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.40500709414482117, "eval_runtime": 17.4343, "eval_samples_per_second": 2.524, "eval_steps_per_second": 0.172, "step": 1385 }, { "epoch": 0.3570209614579644, "grad_norm": 0.15721466762663772, "learning_rate": 8.120963631199631e-05, "loss": 0.3667, "step": 1386 }, { "epoch": 0.3572785523392472, "grad_norm": 0.1294660087901017, "learning_rate": 8.117449009293668e-05, "loss": 0.3801, "step": 1387 }, { "epoch": 0.35753614322053, "grad_norm": 0.12639460991421722, "learning_rate": 8.113931865638438e-05, "loss": 0.3921, "step": 1388 }, { "epoch": 0.3577937341018128, "grad_norm": 0.12543637129674107, "learning_rate": 8.110412203079007e-05, "loss": 0.337, "step": 1389 }, { "epoch": 0.3580513249830956, "grad_norm": 0.22228695759655492, "learning_rate": 8.106890024462481e-05, "loss": 0.4571, "step": 1390 }, { "epoch": 0.3580513249830956, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8953488372093024, "eval_PRM F1 AUC": 0.7029858564693556, "eval_PRM F1 AUC (fixed)": 0.8407543216343635, "eval_PRM F1 Neg": 0.55, "eval_PRM NPV": 0.6470588235294118, "eval_PRM Precision": 0.8651685393258427, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4252485930919647, "eval_runtime": 16.6542, "eval_samples_per_second": 2.642, "eval_steps_per_second": 0.18, "step": 1390 }, { "epoch": 0.3583089158643784, "grad_norm": 0.1562264555854055, "learning_rate": 8.103365332638001e-05, "loss": 0.4251, "step": 1391 }, { "epoch": 0.3585665067456612, "grad_norm": 0.1409574109322409, "learning_rate": 8.099838130456741e-05, "loss": 0.4266, "step": 1392 }, { "epoch": 0.358824097626944, "grad_norm": 0.1480149775372459, "learning_rate": 8.096308420771908e-05, "loss": 0.4172, "step": 1393 }, { "epoch": 0.3590816885082268, "grad_norm": 0.14849229891070298, "learning_rate": 8.09277620643873e-05, "loss": 0.4201, "step": 1394 }, { "epoch": 0.3593392793895096, "grad_norm": 0.13992412467538312, "learning_rate": 8.089241490314468e-05, "loss": 0.357, "step": 1395 }, { "epoch": 0.3593392793895096, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8368255631220534, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4189453125, "eval_runtime": 17.0231, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 1395 }, { "epoch": 0.3595968702707924, "grad_norm": 0.24889386699297159, "learning_rate": 8.085704275258404e-05, "loss": 0.3891, "step": 1396 }, { "epoch": 0.3598544611520752, "grad_norm": 0.19551401137825344, "learning_rate": 8.082164564131845e-05, "loss": 0.3578, "step": 1397 }, { "epoch": 0.360112052033358, "grad_norm": 0.1455011681980945, "learning_rate": 8.078622359798111e-05, "loss": 0.4047, "step": 1398 }, { "epoch": 0.3603696429146408, "grad_norm": 0.15255777338413923, "learning_rate": 8.075077665122544e-05, "loss": 0.4584, "step": 1399 }, { "epoch": 0.36062723379592365, "grad_norm": 0.13169993763746787, "learning_rate": 8.071530482972495e-05, "loss": 0.3419, "step": 1400 }, { "epoch": 0.36062723379592365, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8901734104046243, "eval_PRM F1 AUC": 0.6812467260345731, "eval_PRM F1 AUC (fixed)": 0.8457307490832897, "eval_PRM F1 Neg": 0.5128205128205128, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8555555555555555, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4606267809867859, "eval_runtime": 16.8656, "eval_samples_per_second": 2.609, "eval_steps_per_second": 0.178, "step": 1400 }, { "epoch": 0.36088482467720645, "grad_norm": 0.248537432624282, "learning_rate": 8.067980816217335e-05, "loss": 0.4773, "step": 1401 }, { "epoch": 0.36114241555848925, "grad_norm": 0.14391151961224946, "learning_rate": 8.064428667728439e-05, "loss": 0.3399, "step": 1402 }, { "epoch": 0.36140000643977205, "grad_norm": 0.11489270862321287, "learning_rate": 8.060874040379189e-05, "loss": 0.2953, "step": 1403 }, { "epoch": 0.36165759732105485, "grad_norm": 0.14371898662361124, "learning_rate": 8.057316937044977e-05, "loss": 0.3642, "step": 1404 }, { "epoch": 0.36191518820233765, "grad_norm": 0.16909939720540157, "learning_rate": 8.053757360603191e-05, "loss": 0.4007, "step": 1405 }, { "epoch": 0.36191518820233765, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8901734104046243, "eval_PRM F1 AUC": 0.6812467260345731, "eval_PRM F1 AUC (fixed)": 0.8428496595075955, "eval_PRM F1 Neg": 0.5128205128205128, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8555555555555555, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.43918678164482117, "eval_runtime": 17.4826, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 1405 }, { "epoch": 0.36217277908362044, "grad_norm": 0.12207382964204679, "learning_rate": 8.050195313933229e-05, "loss": 0.3562, "step": 1406 }, { "epoch": 0.36243036996490324, "grad_norm": 0.21599704646494047, "learning_rate": 8.046630799916476e-05, "loss": 0.439, "step": 1407 }, { "epoch": 0.36268796084618604, "grad_norm": 0.12557432987607228, "learning_rate": 8.043063821436322e-05, "loss": 0.3448, "step": 1408 }, { "epoch": 0.36294555172746884, "grad_norm": 0.1281397816731501, "learning_rate": 8.039494381378146e-05, "loss": 0.4453, "step": 1409 }, { "epoch": 0.36320314260875164, "grad_norm": 0.20623591962417667, "learning_rate": 8.035922482629318e-05, "loss": 0.4297, "step": 1410 }, { "epoch": 0.36320314260875164, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 AUC (fixed)": 0.8368255631220535, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.4267578125, "eval_runtime": 17.069, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 1410 }, { "epoch": 0.36346073349003444, "grad_norm": 0.26617095280275, "learning_rate": 8.032348128079203e-05, "loss": 0.4439, "step": 1411 }, { "epoch": 0.36371832437131724, "grad_norm": 0.24196498497379682, "learning_rate": 8.028771320619144e-05, "loss": 0.3918, "step": 1412 }, { "epoch": 0.36397591525260004, "grad_norm": 0.20264336724441273, "learning_rate": 8.025192063142472e-05, "loss": 0.384, "step": 1413 }, { "epoch": 0.36423350613388283, "grad_norm": 0.1747867526069207, "learning_rate": 8.0216103585445e-05, "loss": 0.3817, "step": 1414 }, { "epoch": 0.3644910970151657, "grad_norm": 0.12921580660774498, "learning_rate": 8.018026209722518e-05, "loss": 0.4061, "step": 1415 }, { "epoch": 0.3644910970151657, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8901734104046243, "eval_PRM F1 AUC": 0.6812467260345731, "eval_PRM F1 AUC (fixed)": 0.8428496595075957, "eval_PRM F1 Neg": 0.5128205128205128, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8555555555555555, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4754527807235718, "eval_runtime": 17.1859, "eval_samples_per_second": 2.56, "eval_steps_per_second": 0.175, "step": 1415 }, { "epoch": 0.3647486878964485, "grad_norm": 0.15186777923244818, "learning_rate": 8.014439619575802e-05, "loss": 0.3493, "step": 1416 }, { "epoch": 0.3650062787777313, "grad_norm": 0.13991241954942993, "learning_rate": 8.01085059100559e-05, "loss": 0.4061, "step": 1417 }, { "epoch": 0.3652638696590141, "grad_norm": 0.18737472839361183, "learning_rate": 8.0072591269151e-05, "loss": 0.4265, "step": 1418 }, { "epoch": 0.3655214605402969, "grad_norm": 0.2526565469001541, "learning_rate": 8.003665230209521e-05, "loss": 0.4409, "step": 1419 }, { "epoch": 0.3657790514215797, "grad_norm": 0.3072026599547163, "learning_rate": 8.000068903796008e-05, "loss": 0.5149, "step": 1420 }, { "epoch": 0.3657790514215797, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9028571428571428, "eval_PRM F1 AUC": 0.6932949188056574, "eval_PRM F1 AUC (fixed)": 0.8360398114195915, "eval_PRM F1 Neg": 0.5405405405405406, "eval_PRM NPV": 0.7142857142857143, "eval_PRM Precision": 0.8586956521739131, "eval_PRM Recall": 0.9518072289156626, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.5146928429603577, "eval_runtime": 16.8778, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 1420 }, { "epoch": 0.3660366423028625, "grad_norm": 0.23539512575766042, "learning_rate": 7.996470150583677e-05, "loss": 0.3786, "step": 1421 }, { "epoch": 0.3662942331841453, "grad_norm": 0.2869517163629186, "learning_rate": 7.992868973483617e-05, "loss": 0.4579, "step": 1422 }, { "epoch": 0.3665518240654281, "grad_norm": 0.15910221046319536, "learning_rate": 7.989265375408865e-05, "loss": 0.2962, "step": 1423 }, { "epoch": 0.3668094149467109, "grad_norm": 0.12244119385302561, "learning_rate": 7.985659359274428e-05, "loss": 0.3364, "step": 1424 }, { "epoch": 0.3670670058279937, "grad_norm": 0.24856937781701635, "learning_rate": 7.982050927997264e-05, "loss": 0.4419, "step": 1425 }, { "epoch": 0.3670670058279937, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8427672955974843, "eval_PRM F1 AUC": 0.707962283918282, "eval_PRM F1 AUC (fixed)": 0.8148245154531168, "eval_PRM F1 Neg": 0.5283018867924528, "eval_PRM NPV": 0.4666666666666667, "eval_PRM Precision": 0.881578947368421, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.47336646914482117, "eval_runtime": 17.1663, "eval_samples_per_second": 2.563, "eval_steps_per_second": 0.175, "step": 1425 }, { "epoch": 0.3673245967092765, "grad_norm": 0.19065314776790587, "learning_rate": 7.978440084496282e-05, "loss": 0.4672, "step": 1426 }, { "epoch": 0.3675821875905593, "grad_norm": 0.273501848901122, "learning_rate": 7.974826831692349e-05, "loss": 0.3886, "step": 1427 }, { "epoch": 0.36783977847184207, "grad_norm": 0.2644704759962792, "learning_rate": 7.971211172508276e-05, "loss": 0.4214, "step": 1428 }, { "epoch": 0.3680973693531249, "grad_norm": 0.1804329120699411, "learning_rate": 7.967593109868817e-05, "loss": 0.3521, "step": 1429 }, { "epoch": 0.3683549602344077, "grad_norm": 0.1552484757585082, "learning_rate": 7.96397264670068e-05, "loss": 0.3474, "step": 1430 }, { "epoch": 0.3683549602344077, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8137768465165007, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4945845305919647, "eval_runtime": 17.4764, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 1430 }, { "epoch": 0.3686125511156905, "grad_norm": 0.1563692167955651, "learning_rate": 7.96034978593251e-05, "loss": 0.3822, "step": 1431 }, { "epoch": 0.3688701419969733, "grad_norm": 0.23519815994241292, "learning_rate": 7.956724530494887e-05, "loss": 0.5294, "step": 1432 }, { "epoch": 0.3691277328782561, "grad_norm": 0.23637085121877152, "learning_rate": 7.953096883320337e-05, "loss": 0.447, "step": 1433 }, { "epoch": 0.3693853237595389, "grad_norm": 0.15927649520450732, "learning_rate": 7.949466847343312e-05, "loss": 0.3643, "step": 1434 }, { "epoch": 0.3696429146408217, "grad_norm": 0.1410503602874715, "learning_rate": 7.9458344255002e-05, "loss": 0.4049, "step": 1435 }, { "epoch": 0.3696429146408217, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8106338397066527, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.53125, "eval_runtime": 17.4485, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 1435 }, { "epoch": 0.3699005055221045, "grad_norm": 0.16668598813851612, "learning_rate": 7.942199620729324e-05, "loss": 0.3445, "step": 1436 }, { "epoch": 0.3701580964033873, "grad_norm": 0.1612253745918565, "learning_rate": 7.938562435970924e-05, "loss": 0.3776, "step": 1437 }, { "epoch": 0.3704156872846701, "grad_norm": 0.28443159463950224, "learning_rate": 7.934922874167174e-05, "loss": 0.4961, "step": 1438 }, { "epoch": 0.3706732781659529, "grad_norm": 0.14007728381863407, "learning_rate": 7.931280938262169e-05, "loss": 0.403, "step": 1439 }, { "epoch": 0.3709308690472357, "grad_norm": 0.14141042342640664, "learning_rate": 7.927636631201922e-05, "loss": 0.3409, "step": 1440 }, { "epoch": 0.3709308690472357, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8211105290728129, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4620916247367859, "eval_runtime": 16.8284, "eval_samples_per_second": 2.615, "eval_steps_per_second": 0.178, "step": 1440 }, { "epoch": 0.3711884599285185, "grad_norm": 0.14529145441729857, "learning_rate": 7.923989955934363e-05, "loss": 0.3953, "step": 1441 }, { "epoch": 0.3714460508098013, "grad_norm": 0.15416532815020742, "learning_rate": 7.920340915409343e-05, "loss": 0.4573, "step": 1442 }, { "epoch": 0.3717036416910841, "grad_norm": 0.1302577270600015, "learning_rate": 7.916689512578622e-05, "loss": 0.3999, "step": 1443 }, { "epoch": 0.37196123257236696, "grad_norm": 0.13671813951190143, "learning_rate": 7.913035750395871e-05, "loss": 0.4069, "step": 1444 }, { "epoch": 0.37221882345364976, "grad_norm": 0.14748956050659248, "learning_rate": 7.909379631816673e-05, "loss": 0.3742, "step": 1445 }, { "epoch": 0.37221882345364976, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8399685699319015, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4311967194080353, "eval_runtime": 17.2863, "eval_samples_per_second": 2.545, "eval_steps_per_second": 0.174, "step": 1445 }, { "epoch": 0.37247641433493256, "grad_norm": 0.15565297815252133, "learning_rate": 7.905721159798513e-05, "loss": 0.3619, "step": 1446 }, { "epoch": 0.37273400521621536, "grad_norm": 0.12794157339496393, "learning_rate": 7.902060337300785e-05, "loss": 0.348, "step": 1447 }, { "epoch": 0.37299159609749816, "grad_norm": 0.11967357669264121, "learning_rate": 7.898397167284777e-05, "loss": 0.2732, "step": 1448 }, { "epoch": 0.37324918697878096, "grad_norm": 0.14743365189708196, "learning_rate": 7.89473165271368e-05, "loss": 0.4309, "step": 1449 }, { "epoch": 0.37350677786006375, "grad_norm": 0.10644913856291996, "learning_rate": 7.891063796552584e-05, "loss": 0.3255, "step": 1450 }, { "epoch": 0.37350677786006375, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8493975903614457, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4223189055919647, "eval_runtime": 17.5741, "eval_samples_per_second": 2.504, "eval_steps_per_second": 0.171, "step": 1450 }, { "epoch": 0.37376436874134655, "grad_norm": 0.11634918095601579, "learning_rate": 7.887393601768468e-05, "loss": 0.3652, "step": 1451 }, { "epoch": 0.37402195962262935, "grad_norm": 0.13996813488006055, "learning_rate": 7.883721071330206e-05, "loss": 0.3554, "step": 1452 }, { "epoch": 0.37427955050391215, "grad_norm": 0.11089529188487263, "learning_rate": 7.880046208208563e-05, "loss": 0.3703, "step": 1453 }, { "epoch": 0.37453714138519495, "grad_norm": 0.15341674881029121, "learning_rate": 7.876369015376186e-05, "loss": 0.4314, "step": 1454 }, { "epoch": 0.37479473226647775, "grad_norm": 0.13386574169282345, "learning_rate": 7.872689495807608e-05, "loss": 0.3764, "step": 1455 }, { "epoch": 0.37479473226647775, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8465165007857517, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4137073755264282, "eval_runtime": 17.0281, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 1455 }, { "epoch": 0.37505232314776055, "grad_norm": 0.1369699845273803, "learning_rate": 7.869007652479248e-05, "loss": 0.3622, "step": 1456 }, { "epoch": 0.37530991402904335, "grad_norm": 0.1432036817017207, "learning_rate": 7.865323488369399e-05, "loss": 0.3757, "step": 1457 }, { "epoch": 0.3755675049103262, "grad_norm": 0.1412145563921165, "learning_rate": 7.861637006458238e-05, "loss": 0.3928, "step": 1458 }, { "epoch": 0.375825095791609, "grad_norm": 0.12195903826389952, "learning_rate": 7.85794820972781e-05, "loss": 0.341, "step": 1459 }, { "epoch": 0.3760826866728918, "grad_norm": 0.1864896327378782, "learning_rate": 7.854257101162037e-05, "loss": 0.3809, "step": 1460 }, { "epoch": 0.3760826866728918, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8444211629125197, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4232954680919647, "eval_runtime": 17.4616, "eval_samples_per_second": 2.52, "eval_steps_per_second": 0.172, "step": 1460 }, { "epoch": 0.3763402775541746, "grad_norm": 0.1726069041489504, "learning_rate": 7.85056368374671e-05, "loss": 0.3744, "step": 1461 }, { "epoch": 0.3765978684354574, "grad_norm": 0.1768878202250996, "learning_rate": 7.846867960469486e-05, "loss": 0.4118, "step": 1462 }, { "epoch": 0.3768554593167402, "grad_norm": 0.14048413412020386, "learning_rate": 7.843169934319889e-05, "loss": 0.3427, "step": 1463 }, { "epoch": 0.377113050198023, "grad_norm": 0.14797672911035345, "learning_rate": 7.839469608289308e-05, "loss": 0.3458, "step": 1464 }, { "epoch": 0.3773706410793058, "grad_norm": 0.13129653898918622, "learning_rate": 7.835766985370986e-05, "loss": 0.3825, "step": 1465 }, { "epoch": 0.3773706410793058, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8323729701414352, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.44424715638160706, "eval_runtime": 17.7255, "eval_samples_per_second": 2.482, "eval_steps_per_second": 0.169, "step": 1465 }, { "epoch": 0.3776282319605886, "grad_norm": 0.13781871183081718, "learning_rate": 7.832062068560028e-05, "loss": 0.3717, "step": 1466 }, { "epoch": 0.3778858228418714, "grad_norm": 0.20946442389558764, "learning_rate": 7.828354860853399e-05, "loss": 0.4241, "step": 1467 }, { "epoch": 0.3781434137231542, "grad_norm": 0.22425415062460602, "learning_rate": 7.82464536524991e-05, "loss": 0.4122, "step": 1468 }, { "epoch": 0.378401004604437, "grad_norm": 0.18346985460789594, "learning_rate": 7.820933584750223e-05, "loss": 0.3973, "step": 1469 }, { "epoch": 0.3786585954857198, "grad_norm": 0.1356984484517548, "learning_rate": 7.817219522356854e-05, "loss": 0.4181, "step": 1470 }, { "epoch": 0.3786585954857198, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8273965426925092, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4406072497367859, "eval_runtime": 16.7708, "eval_samples_per_second": 2.624, "eval_steps_per_second": 0.179, "step": 1470 }, { "epoch": 0.3789161863670026, "grad_norm": 0.2461318462755359, "learning_rate": 7.813503181074158e-05, "loss": 0.4901, "step": 1471 }, { "epoch": 0.37917377724828544, "grad_norm": 0.13730957758256832, "learning_rate": 7.80978456390834e-05, "loss": 0.3965, "step": 1472 }, { "epoch": 0.37943136812956824, "grad_norm": 0.13577545564335572, "learning_rate": 7.80606367386744e-05, "loss": 0.3513, "step": 1473 }, { "epoch": 0.37968895901085103, "grad_norm": 0.14977198244614462, "learning_rate": 7.802340513961342e-05, "loss": 0.4169, "step": 1474 }, { "epoch": 0.37994654989213383, "grad_norm": 0.12419756970413116, "learning_rate": 7.798615087201762e-05, "loss": 0.3863, "step": 1475 }, { "epoch": 0.37994654989213383, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8161341016238868, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4322620630264282, "eval_runtime": 17.6592, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 1475 }, { "epoch": 0.38020414077341663, "grad_norm": 0.16280587191534948, "learning_rate": 7.794887396602252e-05, "loss": 0.4245, "step": 1476 }, { "epoch": 0.38046173165469943, "grad_norm": 0.15436708642834077, "learning_rate": 7.791157445178193e-05, "loss": 0.4161, "step": 1477 }, { "epoch": 0.38071932253598223, "grad_norm": 0.1496496597279818, "learning_rate": 7.787425235946798e-05, "loss": 0.4246, "step": 1478 }, { "epoch": 0.38097691341726503, "grad_norm": 0.21329535676825526, "learning_rate": 7.783690771927104e-05, "loss": 0.3321, "step": 1479 }, { "epoch": 0.3812345042985478, "grad_norm": 0.12684358469860735, "learning_rate": 7.779954056139971e-05, "loss": 0.387, "step": 1480 }, { "epoch": 0.3812345042985478, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8313253012048193, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.43723365664482117, "eval_runtime": 18.0962, "eval_samples_per_second": 2.431, "eval_steps_per_second": 0.166, "step": 1480 }, { "epoch": 0.3814920951798306, "grad_norm": 0.11934879648265088, "learning_rate": 7.776215091608085e-05, "loss": 0.342, "step": 1481 }, { "epoch": 0.3817496860611134, "grad_norm": 0.16889361774625997, "learning_rate": 7.772473881355947e-05, "loss": 0.4303, "step": 1482 }, { "epoch": 0.3820072769423962, "grad_norm": 0.12341310482287064, "learning_rate": 7.768730428409875e-05, "loss": 0.3424, "step": 1483 }, { "epoch": 0.382264867823679, "grad_norm": 0.16214057586910535, "learning_rate": 7.764984735798002e-05, "loss": 0.4162, "step": 1484 }, { "epoch": 0.3825224587049618, "grad_norm": 0.1208546046888841, "learning_rate": 7.761236806550272e-05, "loss": 0.3617, "step": 1485 }, { "epoch": 0.3825224587049618, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8302776322682033, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.45028409361839294, "eval_runtime": 17.6577, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 1485 }, { "epoch": 0.3827800495862446, "grad_norm": 0.15767325243358565, "learning_rate": 7.75748664369844e-05, "loss": 0.4262, "step": 1486 }, { "epoch": 0.3830376404675275, "grad_norm": 0.10555063986862433, "learning_rate": 7.753734250276066e-05, "loss": 0.318, "step": 1487 }, { "epoch": 0.3832952313488103, "grad_norm": 0.1354873949060526, "learning_rate": 7.749979629318516e-05, "loss": 0.3506, "step": 1488 }, { "epoch": 0.38355282223009307, "grad_norm": 0.18341235620462912, "learning_rate": 7.746222783862955e-05, "loss": 0.3883, "step": 1489 }, { "epoch": 0.38381041311137587, "grad_norm": 0.13452528724333285, "learning_rate": 7.74246371694835e-05, "loss": 0.4169, "step": 1490 }, { "epoch": 0.38381041311137587, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.8326348873755893, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4368785619735718, "eval_runtime": 17.0948, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 1490 }, { "epoch": 0.38406800399265867, "grad_norm": 0.10541879108481858, "learning_rate": 7.738702431615464e-05, "loss": 0.3607, "step": 1491 }, { "epoch": 0.38432559487394147, "grad_norm": 0.13964032755496925, "learning_rate": 7.734938930906854e-05, "loss": 0.3649, "step": 1492 }, { "epoch": 0.38458318575522427, "grad_norm": 0.13444725763073687, "learning_rate": 7.731173217866873e-05, "loss": 0.408, "step": 1493 }, { "epoch": 0.38484077663650706, "grad_norm": 0.1593150120697173, "learning_rate": 7.727405295541656e-05, "loss": 0.441, "step": 1494 }, { "epoch": 0.38509836751778986, "grad_norm": 0.16149687865603315, "learning_rate": 7.723635166979133e-05, "loss": 0.3732, "step": 1495 }, { "epoch": 0.38509836751778986, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8279203771608171, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.43918678164482117, "eval_runtime": 16.9888, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 1495 }, { "epoch": 0.38535595839907266, "grad_norm": 0.20619527904331075, "learning_rate": 7.719862835229014e-05, "loss": 0.3437, "step": 1496 }, { "epoch": 0.38561354928035546, "grad_norm": 0.16822993120525714, "learning_rate": 7.71608830334279e-05, "loss": 0.48, "step": 1497 }, { "epoch": 0.38587114016163826, "grad_norm": 0.1326659987894727, "learning_rate": 7.712311574373739e-05, "loss": 0.3539, "step": 1498 }, { "epoch": 0.38612873104292106, "grad_norm": 0.12479794909144715, "learning_rate": 7.708532651376905e-05, "loss": 0.3429, "step": 1499 }, { "epoch": 0.38638632192420386, "grad_norm": 0.18732989325973226, "learning_rate": 7.704751537409118e-05, "loss": 0.3829, "step": 1500 }, { "epoch": 0.38638632192420386, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8349921424829753, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.47958096861839294, "eval_runtime": 16.9726, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 1500 }, { "epoch": 0.3866439128054867, "grad_norm": 0.14813726272362412, "learning_rate": 7.700968235528974e-05, "loss": 0.3274, "step": 1501 }, { "epoch": 0.3869015036867695, "grad_norm": 0.14870013875814994, "learning_rate": 7.697182748796841e-05, "loss": 0.3253, "step": 1502 }, { "epoch": 0.3871590945680523, "grad_norm": 0.1388231416079047, "learning_rate": 7.69339508027485e-05, "loss": 0.3516, "step": 1503 }, { "epoch": 0.3874166854493351, "grad_norm": 0.17073717793569934, "learning_rate": 7.689605233026904e-05, "loss": 0.4615, "step": 1504 }, { "epoch": 0.3876742763306179, "grad_norm": 0.17478034003219137, "learning_rate": 7.685813210118664e-05, "loss": 0.3228, "step": 1505 }, { "epoch": 0.3876742763306179, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.8292299633315872, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4525923430919647, "eval_runtime": 16.8921, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 1505 }, { "epoch": 0.3879318672119007, "grad_norm": 0.12140507377051665, "learning_rate": 7.682019014617552e-05, "loss": 0.3143, "step": 1506 }, { "epoch": 0.3881894580931835, "grad_norm": 0.1348108929045567, "learning_rate": 7.678222649592748e-05, "loss": 0.2916, "step": 1507 }, { "epoch": 0.3884470489744663, "grad_norm": 0.17072839530221123, "learning_rate": 7.674424118115184e-05, "loss": 0.4133, "step": 1508 }, { "epoch": 0.3887046398557491, "grad_norm": 0.15192570680931522, "learning_rate": 7.670623423257548e-05, "loss": 0.3208, "step": 1509 }, { "epoch": 0.3889622307370319, "grad_norm": 0.13923376996908815, "learning_rate": 7.666820568094276e-05, "loss": 0.351, "step": 1510 }, { "epoch": 0.3889622307370319, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.8294918805657412, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4459339380264282, "eval_runtime": 16.8476, "eval_samples_per_second": 2.612, "eval_steps_per_second": 0.178, "step": 1510 }, { "epoch": 0.3892198216183147, "grad_norm": 0.13332215585380947, "learning_rate": 7.663015555701551e-05, "loss": 0.3455, "step": 1511 }, { "epoch": 0.3894774124995975, "grad_norm": 0.19612724440214718, "learning_rate": 7.659208389157307e-05, "loss": 0.3095, "step": 1512 }, { "epoch": 0.3897350033808803, "grad_norm": 0.14546584285987435, "learning_rate": 7.65539907154121e-05, "loss": 0.2957, "step": 1513 }, { "epoch": 0.3899925942621631, "grad_norm": 0.12757353650303827, "learning_rate": 7.651587605934675e-05, "loss": 0.3045, "step": 1514 }, { "epoch": 0.39025018514344595, "grad_norm": 0.12789245470553237, "learning_rate": 7.647773995420851e-05, "loss": 0.3683, "step": 1515 }, { "epoch": 0.39025018514344595, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.8273965426925091, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4732776880264282, "eval_runtime": 17.0298, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 1515 }, { "epoch": 0.39050777602472875, "grad_norm": 0.1760140052598356, "learning_rate": 7.64395824308462e-05, "loss": 0.3746, "step": 1516 }, { "epoch": 0.39076536690601155, "grad_norm": 0.1829722918935349, "learning_rate": 7.640140352012601e-05, "loss": 0.4585, "step": 1517 }, { "epoch": 0.39102295778729435, "grad_norm": 0.15989859792499364, "learning_rate": 7.63632032529314e-05, "loss": 0.3583, "step": 1518 }, { "epoch": 0.39128054866857714, "grad_norm": 0.2318240239340174, "learning_rate": 7.632498166016315e-05, "loss": 0.4468, "step": 1519 }, { "epoch": 0.39153813954985994, "grad_norm": 0.21266224428898567, "learning_rate": 7.628673877273919e-05, "loss": 0.4787, "step": 1520 }, { "epoch": 0.39153813954985994, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8305395495023573, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4439808130264282, "eval_runtime": 18.0339, "eval_samples_per_second": 2.44, "eval_steps_per_second": 0.166, "step": 1520 }, { "epoch": 0.39179573043114274, "grad_norm": 0.17730241499672117, "learning_rate": 7.624847462159479e-05, "loss": 0.428, "step": 1521 }, { "epoch": 0.39205332131242554, "grad_norm": 0.15677206332885174, "learning_rate": 7.621018923768235e-05, "loss": 0.3751, "step": 1522 }, { "epoch": 0.39231091219370834, "grad_norm": 0.11803823706948607, "learning_rate": 7.617188265197148e-05, "loss": 0.3878, "step": 1523 }, { "epoch": 0.39256850307499114, "grad_norm": 0.18160223652927948, "learning_rate": 7.613355489544891e-05, "loss": 0.4073, "step": 1524 }, { "epoch": 0.39282609395627394, "grad_norm": 0.1492920206896327, "learning_rate": 7.609520599911853e-05, "loss": 0.3775, "step": 1525 }, { "epoch": 0.39282609395627394, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 AUC (fixed)": 0.8315872184389732, "eval_PRM F1 Neg": 0.52, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.42604759335517883, "eval_runtime": 17.6137, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 1525 }, { "epoch": 0.39308368483755673, "grad_norm": 0.16842011187970488, "learning_rate": 7.605683599400131e-05, "loss": 0.3402, "step": 1526 }, { "epoch": 0.39334127571883953, "grad_norm": 0.17681705599967015, "learning_rate": 7.60184449111353e-05, "loss": 0.3829, "step": 1527 }, { "epoch": 0.39359886660012233, "grad_norm": 0.1580442884085002, "learning_rate": 7.598003278157558e-05, "loss": 0.4697, "step": 1528 }, { "epoch": 0.39385645748140513, "grad_norm": 0.14318958138775478, "learning_rate": 7.594159963639429e-05, "loss": 0.3883, "step": 1529 }, { "epoch": 0.394114048362688, "grad_norm": 0.14560641571167493, "learning_rate": 7.590314550668054e-05, "loss": 0.3532, "step": 1530 }, { "epoch": 0.394114048362688, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8313253012048192, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.43918678164482117, "eval_runtime": 17.4066, "eval_samples_per_second": 2.528, "eval_steps_per_second": 0.172, "step": 1530 }, { "epoch": 0.3943716392439708, "grad_norm": 0.31348260951993906, "learning_rate": 7.586467042354044e-05, "loss": 0.4302, "step": 1531 }, { "epoch": 0.3946292301252536, "grad_norm": 0.1471326111950281, "learning_rate": 7.582617441809703e-05, "loss": 0.3966, "step": 1532 }, { "epoch": 0.3948868210065364, "grad_norm": 0.11533552914020075, "learning_rate": 7.578765752149028e-05, "loss": 0.3159, "step": 1533 }, { "epoch": 0.3951444118878192, "grad_norm": 0.2195564752293955, "learning_rate": 7.574911976487709e-05, "loss": 0.3733, "step": 1534 }, { "epoch": 0.395402002769102, "grad_norm": 0.13274452561393288, "learning_rate": 7.571056117943116e-05, "loss": 0.3849, "step": 1535 }, { "epoch": 0.395402002769102, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8705882352941177, "eval_PRM F1 AUC": 0.6631744368779466, "eval_PRM F1 AUC (fixed)": 0.8195390256678889, "eval_PRM F1 Neg": 0.47619047619047616, "eval_PRM NPV": 0.5263157894736842, "eval_PRM Precision": 0.8505747126436781, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4623579680919647, "eval_runtime": 17.0067, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 1535 }, { "epoch": 0.3956595936503848, "grad_norm": 0.12704848069403604, "learning_rate": 7.567198179634312e-05, "loss": 0.3363, "step": 1536 }, { "epoch": 0.3959171845316676, "grad_norm": 0.14068388225944006, "learning_rate": 7.563338164682036e-05, "loss": 0.334, "step": 1537 }, { "epoch": 0.3961747754129504, "grad_norm": 0.15795373992576903, "learning_rate": 7.559476076208711e-05, "loss": 0.3081, "step": 1538 }, { "epoch": 0.3964323662942332, "grad_norm": 0.16876522939624136, "learning_rate": 7.555611917338434e-05, "loss": 0.4269, "step": 1539 }, { "epoch": 0.396689957175516, "grad_norm": 0.13384599664271368, "learning_rate": 7.551745691196981e-05, "loss": 0.3986, "step": 1540 }, { "epoch": 0.396689957175516, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.863905325443787, "eval_PRM F1 AUC": 0.6571503404924044, "eval_PRM F1 AUC (fixed)": 0.8129910948140388, "eval_PRM F1 Neg": 0.46511627906976744, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8488372093023255, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.447265625, "eval_runtime": 17.4495, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 1540 }, { "epoch": 0.39694754805679877, "grad_norm": 0.16338996613859239, "learning_rate": 7.547877400911799e-05, "loss": 0.3772, "step": 1541 }, { "epoch": 0.39720513893808157, "grad_norm": 0.15692663587738873, "learning_rate": 7.544007049611999e-05, "loss": 0.4148, "step": 1542 }, { "epoch": 0.39746272981936437, "grad_norm": 0.16902886403744088, "learning_rate": 7.540134640428365e-05, "loss": 0.4509, "step": 1543 }, { "epoch": 0.3977203207006472, "grad_norm": 0.14802471052858074, "learning_rate": 7.536260176493348e-05, "loss": 0.3891, "step": 1544 }, { "epoch": 0.39797791158193, "grad_norm": 0.1854248374969804, "learning_rate": 7.532383660941054e-05, "loss": 0.3896, "step": 1545 }, { "epoch": 0.39797791158193, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 AUC (fixed)": 0.8053954950235727, "eval_PRM F1 Neg": 0.52, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4311967194080353, "eval_runtime": 16.9098, "eval_samples_per_second": 2.602, "eval_steps_per_second": 0.177, "step": 1545 }, { "epoch": 0.3982355024632128, "grad_norm": 0.1248294787353036, "learning_rate": 7.528505096907253e-05, "loss": 0.3557, "step": 1546 }, { "epoch": 0.3984930933444956, "grad_norm": 0.13446807468887198, "learning_rate": 7.524624487529371e-05, "loss": 0.258, "step": 1547 }, { "epoch": 0.3987506842257784, "grad_norm": 0.25790835297708575, "learning_rate": 7.520741835946492e-05, "loss": 0.4442, "step": 1548 }, { "epoch": 0.3990082751070612, "grad_norm": 0.20385543492449934, "learning_rate": 7.516857145299341e-05, "loss": 0.4546, "step": 1549 }, { "epoch": 0.399265865988344, "grad_norm": 0.13787763557116675, "learning_rate": 7.512970418730308e-05, "loss": 0.3824, "step": 1550 }, { "epoch": 0.399265865988344, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.8072289156626506, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4410511255264282, "eval_runtime": 17.4579, "eval_samples_per_second": 2.52, "eval_steps_per_second": 0.172, "step": 1550 }, { "epoch": 0.3995234568696268, "grad_norm": 0.18875613552634338, "learning_rate": 7.509081659383417e-05, "loss": 0.4108, "step": 1551 }, { "epoch": 0.3997810477509096, "grad_norm": 0.15752008515308788, "learning_rate": 7.505190870404343e-05, "loss": 0.386, "step": 1552 }, { "epoch": 0.4000386386321924, "grad_norm": 0.1865070689677509, "learning_rate": 7.501298054940402e-05, "loss": 0.4915, "step": 1553 }, { "epoch": 0.4002962295134752, "grad_norm": 0.2158730203522799, "learning_rate": 7.497403216140546e-05, "loss": 0.3127, "step": 1554 }, { "epoch": 0.400553820394758, "grad_norm": 0.15779216555998116, "learning_rate": 7.493506357155367e-05, "loss": 0.39, "step": 1555 }, { "epoch": 0.400553820394758, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.7998952331063385, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4584517180919647, "eval_runtime": 17.5469, "eval_samples_per_second": 2.508, "eval_steps_per_second": 0.171, "step": 1555 }, { "epoch": 0.4008114112760408, "grad_norm": 0.18250485405576147, "learning_rate": 7.489607481137092e-05, "loss": 0.4606, "step": 1556 }, { "epoch": 0.4010690021573236, "grad_norm": 0.21602588864209615, "learning_rate": 7.485706591239576e-05, "loss": 0.4445, "step": 1557 }, { "epoch": 0.40132659303860646, "grad_norm": 0.145986255910209, "learning_rate": 7.481803690618304e-05, "loss": 0.3959, "step": 1558 }, { "epoch": 0.40158418391988926, "grad_norm": 0.13965147507705808, "learning_rate": 7.47789878243039e-05, "loss": 0.3901, "step": 1559 }, { "epoch": 0.40184177480117206, "grad_norm": 0.1567287618178594, "learning_rate": 7.473991869834569e-05, "loss": 0.4307, "step": 1560 }, { "epoch": 0.40184177480117206, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8518518518518519, "eval_PRM F1 AUC": 0.6982713462545836, "eval_PRM F1 AUC (fixed)": 0.784442116291252, "eval_PRM F1 Neg": 0.52, "eval_PRM NPV": 0.48148148148148145, "eval_PRM Precision": 0.8734177215189873, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4617365002632141, "eval_runtime": 17.6017, "eval_samples_per_second": 2.5, "eval_steps_per_second": 0.17, "step": 1560 }, { "epoch": 0.40209936568245486, "grad_norm": 0.15503475434533706, "learning_rate": 7.4700829559912e-05, "loss": 0.3195, "step": 1561 }, { "epoch": 0.40235695656373766, "grad_norm": 0.12567350065579952, "learning_rate": 7.46617204406226e-05, "loss": 0.4115, "step": 1562 }, { "epoch": 0.40261454744502045, "grad_norm": 0.1428551942004378, "learning_rate": 7.46225913721134e-05, "loss": 0.4404, "step": 1563 }, { "epoch": 0.40287213832630325, "grad_norm": 0.142247960429266, "learning_rate": 7.458344238603647e-05, "loss": 0.2924, "step": 1564 }, { "epoch": 0.40312972920758605, "grad_norm": 0.13459576882337287, "learning_rate": 7.454427351405999e-05, "loss": 0.3549, "step": 1565 }, { "epoch": 0.40312972920758605, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.7731796752226296, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4788707494735718, "eval_runtime": 17.5542, "eval_samples_per_second": 2.507, "eval_steps_per_second": 0.171, "step": 1565 }, { "epoch": 0.40338732008886885, "grad_norm": 0.13858706409440535, "learning_rate": 7.450508478786823e-05, "loss": 0.3659, "step": 1566 }, { "epoch": 0.40364491097015165, "grad_norm": 0.19273360591692804, "learning_rate": 7.44658762391615e-05, "loss": 0.4856, "step": 1567 }, { "epoch": 0.40390250185143445, "grad_norm": 0.13939068530565746, "learning_rate": 7.442664789965618e-05, "loss": 0.3402, "step": 1568 }, { "epoch": 0.40416009273271725, "grad_norm": 0.21326993610270198, "learning_rate": 7.438739980108462e-05, "loss": 0.3306, "step": 1569 }, { "epoch": 0.40441768361400005, "grad_norm": 0.19263415958749042, "learning_rate": 7.434813197519515e-05, "loss": 0.4201, "step": 1570 }, { "epoch": 0.40441768361400005, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.7776322682032477, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.48819246888160706, "eval_runtime": 17.0945, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 1570 }, { "epoch": 0.40467527449528284, "grad_norm": 0.15754979874438907, "learning_rate": 7.430884445375213e-05, "loss": 0.3645, "step": 1571 }, { "epoch": 0.40493286537656564, "grad_norm": 0.16096630191648154, "learning_rate": 7.426953726853574e-05, "loss": 0.434, "step": 1572 }, { "epoch": 0.4051904562578485, "grad_norm": 0.1338077817919584, "learning_rate": 7.423021045134217e-05, "loss": 0.3886, "step": 1573 }, { "epoch": 0.4054480471391313, "grad_norm": 0.1628053863002934, "learning_rate": 7.419086403398345e-05, "loss": 0.4004, "step": 1574 }, { "epoch": 0.4057056380204141, "grad_norm": 0.17163041822104835, "learning_rate": 7.415149804828743e-05, "loss": 0.3323, "step": 1575 }, { "epoch": 0.4057056380204141, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8025144054478786, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.44460228085517883, "eval_runtime": 16.8998, "eval_samples_per_second": 2.604, "eval_steps_per_second": 0.178, "step": 1575 }, { "epoch": 0.4059632289016969, "grad_norm": 0.16332083288047294, "learning_rate": 7.411211252609784e-05, "loss": 0.3958, "step": 1576 }, { "epoch": 0.4062208197829797, "grad_norm": 0.15460537114332742, "learning_rate": 7.407270749927419e-05, "loss": 0.4033, "step": 1577 }, { "epoch": 0.4064784106642625, "grad_norm": 0.15829083941586652, "learning_rate": 7.403328299969178e-05, "loss": 0.4258, "step": 1578 }, { "epoch": 0.4067360015455453, "grad_norm": 0.13557165560228338, "learning_rate": 7.399383905924165e-05, "loss": 0.3718, "step": 1579 }, { "epoch": 0.4069935924268281, "grad_norm": 0.17537373944145013, "learning_rate": 7.395437570983057e-05, "loss": 0.368, "step": 1580 }, { "epoch": 0.4069935924268281, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8103719224724987, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4269353747367859, "eval_runtime": 17.0434, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 1580 }, { "epoch": 0.4072511833081109, "grad_norm": 0.12957445452887748, "learning_rate": 7.391489298338099e-05, "loss": 0.4112, "step": 1581 }, { "epoch": 0.4075087741893937, "grad_norm": 0.11821400041916534, "learning_rate": 7.387539091183111e-05, "loss": 0.3644, "step": 1582 }, { "epoch": 0.4077663650706765, "grad_norm": 0.14788700254788611, "learning_rate": 7.383586952713465e-05, "loss": 0.3645, "step": 1583 }, { "epoch": 0.4080239559519593, "grad_norm": 0.1551040982083199, "learning_rate": 7.379632886126108e-05, "loss": 0.4002, "step": 1584 }, { "epoch": 0.4082815468332421, "grad_norm": 0.10497177562538057, "learning_rate": 7.375676894619538e-05, "loss": 0.3119, "step": 1585 }, { "epoch": 0.4082815468332421, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8103719224724987, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4283558130264282, "eval_runtime": 16.3114, "eval_samples_per_second": 2.698, "eval_steps_per_second": 0.184, "step": 1585 }, { "epoch": 0.4085391377145249, "grad_norm": 0.12819481736529953, "learning_rate": 7.371718981393815e-05, "loss": 0.2799, "step": 1586 }, { "epoch": 0.40879672859580773, "grad_norm": 0.10443032547451916, "learning_rate": 7.367759149650551e-05, "loss": 0.3153, "step": 1587 }, { "epoch": 0.40905431947709053, "grad_norm": 0.12706831256199655, "learning_rate": 7.363797402592913e-05, "loss": 0.3287, "step": 1588 }, { "epoch": 0.40931191035837333, "grad_norm": 0.1643945767425304, "learning_rate": 7.359833743425611e-05, "loss": 0.3943, "step": 1589 }, { "epoch": 0.40956950123965613, "grad_norm": 0.12591902655255258, "learning_rate": 7.355868175354911e-05, "loss": 0.2785, "step": 1590 }, { "epoch": 0.40956950123965613, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8145625982189628, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.43723365664482117, "eval_runtime": 17.6155, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 1590 }, { "epoch": 0.40982709212093893, "grad_norm": 0.1724523208618192, "learning_rate": 7.351900701588612e-05, "loss": 0.404, "step": 1591 }, { "epoch": 0.41008468300222173, "grad_norm": 0.13524163491552585, "learning_rate": 7.347931325336066e-05, "loss": 0.3376, "step": 1592 }, { "epoch": 0.4103422738835045, "grad_norm": 0.14062811662516628, "learning_rate": 7.343960049808156e-05, "loss": 0.3348, "step": 1593 }, { "epoch": 0.4105998647647873, "grad_norm": 0.13847837304605756, "learning_rate": 7.339986878217303e-05, "loss": 0.3726, "step": 1594 }, { "epoch": 0.4108574556460701, "grad_norm": 0.17151700961087127, "learning_rate": 7.336011813777463e-05, "loss": 0.3695, "step": 1595 }, { "epoch": 0.4108574556460701, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8137768465165007, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4410511255264282, "eval_runtime": 17.4902, "eval_samples_per_second": 2.516, "eval_steps_per_second": 0.172, "step": 1595 }, { "epoch": 0.4111150465273529, "grad_norm": 0.1906964295003375, "learning_rate": 7.332034859704123e-05, "loss": 0.3628, "step": 1596 }, { "epoch": 0.4113726374086357, "grad_norm": 0.13353012469626363, "learning_rate": 7.3280560192143e-05, "loss": 0.339, "step": 1597 }, { "epoch": 0.4116302282899185, "grad_norm": 0.1658378199815432, "learning_rate": 7.324075295526531e-05, "loss": 0.4049, "step": 1598 }, { "epoch": 0.4118878191712013, "grad_norm": 0.16627736582444355, "learning_rate": 7.320092691860886e-05, "loss": 0.4206, "step": 1599 }, { "epoch": 0.4121454100524841, "grad_norm": 0.22458568728485723, "learning_rate": 7.316108211438945e-05, "loss": 0.4673, "step": 1600 }, { "epoch": 0.4121454100524841, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8046097433211106, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.42942115664482117, "eval_runtime": 17.6587, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 1600 }, { "epoch": 0.41240300093376697, "grad_norm": 0.178880612917144, "learning_rate": 7.312121857483815e-05, "loss": 0.3725, "step": 1601 }, { "epoch": 0.41266059181504977, "grad_norm": 0.17218263635711015, "learning_rate": 7.308133633220114e-05, "loss": 0.3638, "step": 1602 }, { "epoch": 0.41291818269633257, "grad_norm": 0.167975574760578, "learning_rate": 7.304143541873974e-05, "loss": 0.3681, "step": 1603 }, { "epoch": 0.41317577357761537, "grad_norm": 0.18753898145608214, "learning_rate": 7.300151586673037e-05, "loss": 0.3991, "step": 1604 }, { "epoch": 0.41343336445889817, "grad_norm": 0.22062075160832262, "learning_rate": 7.296157770846452e-05, "loss": 0.3709, "step": 1605 }, { "epoch": 0.41343336445889817, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8229439497118911, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4056285619735718, "eval_runtime": 16.4663, "eval_samples_per_second": 2.672, "eval_steps_per_second": 0.182, "step": 1605 }, { "epoch": 0.41369095534018097, "grad_norm": 0.18977924951772585, "learning_rate": 7.292162097624874e-05, "loss": 0.4406, "step": 1606 }, { "epoch": 0.41394854622146376, "grad_norm": 0.1436728554129188, "learning_rate": 7.288164570240463e-05, "loss": 0.3726, "step": 1607 }, { "epoch": 0.41420613710274656, "grad_norm": 0.12708431246504245, "learning_rate": 7.284165191926872e-05, "loss": 0.347, "step": 1608 }, { "epoch": 0.41446372798402936, "grad_norm": 0.15636489847987395, "learning_rate": 7.28016396591926e-05, "loss": 0.377, "step": 1609 }, { "epoch": 0.41472131886531216, "grad_norm": 0.13452344495388474, "learning_rate": 7.276160895454273e-05, "loss": 0.2757, "step": 1610 }, { "epoch": 0.41472131886531216, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8378732320586696, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3943536877632141, "eval_runtime": 16.6852, "eval_samples_per_second": 2.637, "eval_steps_per_second": 0.18, "step": 1610 }, { "epoch": 0.41497890974659496, "grad_norm": 0.1542573866336418, "learning_rate": 7.272155983770055e-05, "loss": 0.2986, "step": 1611 }, { "epoch": 0.41523650062787776, "grad_norm": 0.14518737294656395, "learning_rate": 7.268149234106233e-05, "loss": 0.3802, "step": 1612 }, { "epoch": 0.41549409150916056, "grad_norm": 0.2164966644733006, "learning_rate": 7.264140649703927e-05, "loss": 0.5182, "step": 1613 }, { "epoch": 0.41575168239044336, "grad_norm": 0.18335198120490992, "learning_rate": 7.26013023380574e-05, "loss": 0.3585, "step": 1614 }, { "epoch": 0.41600927327172615, "grad_norm": 0.17322194603764646, "learning_rate": 7.25611798965575e-05, "loss": 0.4726, "step": 1615 }, { "epoch": 0.41600927327172615, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8352540597171294, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3852982819080353, "eval_runtime": 17.0236, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 1615 }, { "epoch": 0.416266864153009, "grad_norm": 0.12232906264806807, "learning_rate": 7.252103920499524e-05, "loss": 0.3421, "step": 1616 }, { "epoch": 0.4165244550342918, "grad_norm": 0.16778538057369627, "learning_rate": 7.248088029584095e-05, "loss": 0.3489, "step": 1617 }, { "epoch": 0.4167820459155746, "grad_norm": 0.106998583203376, "learning_rate": 7.24407032015798e-05, "loss": 0.3007, "step": 1618 }, { "epoch": 0.4170396367968574, "grad_norm": 0.12576274326177686, "learning_rate": 7.240050795471158e-05, "loss": 0.3505, "step": 1619 }, { "epoch": 0.4172972276781402, "grad_norm": 0.18232134881036993, "learning_rate": 7.236029458775082e-05, "loss": 0.3706, "step": 1620 }, { "epoch": 0.4172972276781402, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8425877422734416, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.37917259335517883, "eval_runtime": 17.0033, "eval_samples_per_second": 2.588, "eval_steps_per_second": 0.176, "step": 1620 }, { "epoch": 0.417554818559423, "grad_norm": 0.15309278374263297, "learning_rate": 7.232006313322667e-05, "loss": 0.3803, "step": 1621 }, { "epoch": 0.4178124094407058, "grad_norm": 0.12852489661948097, "learning_rate": 7.227981362368298e-05, "loss": 0.3517, "step": 1622 }, { "epoch": 0.4180700003219886, "grad_norm": 0.12559937661754786, "learning_rate": 7.223954609167813e-05, "loss": 0.3301, "step": 1623 }, { "epoch": 0.4183275912032714, "grad_norm": 0.1870006884323831, "learning_rate": 7.219926056978507e-05, "loss": 0.3524, "step": 1624 }, { "epoch": 0.4185851820845542, "grad_norm": 0.1503511674518234, "learning_rate": 7.21589570905914e-05, "loss": 0.3712, "step": 1625 }, { "epoch": 0.4185851820845542, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8370874803562074, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3871626555919647, "eval_runtime": 17.3038, "eval_samples_per_second": 2.543, "eval_steps_per_second": 0.173, "step": 1625 }, { "epoch": 0.418842772965837, "grad_norm": 0.1962815245174824, "learning_rate": 7.211863568669912e-05, "loss": 0.4286, "step": 1626 }, { "epoch": 0.4191003638471198, "grad_norm": 0.19892995545115355, "learning_rate": 7.207829639072483e-05, "loss": 0.4582, "step": 1627 }, { "epoch": 0.4193579547284026, "grad_norm": 0.1637905963173261, "learning_rate": 7.203793923529956e-05, "loss": 0.337, "step": 1628 }, { "epoch": 0.4196155456096854, "grad_norm": 0.12441741413677421, "learning_rate": 7.199756425306881e-05, "loss": 0.2899, "step": 1629 }, { "epoch": 0.41987313649096825, "grad_norm": 0.1482867119342889, "learning_rate": 7.195717147669245e-05, "loss": 0.3929, "step": 1630 }, { "epoch": 0.41987313649096825, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.8339444735463594, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3959517180919647, "eval_runtime": 17.1601, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 1630 }, { "epoch": 0.42013072737225104, "grad_norm": 0.11997835013993044, "learning_rate": 7.191676093884478e-05, "loss": 0.3339, "step": 1631 }, { "epoch": 0.42038831825353384, "grad_norm": 0.14754816005261343, "learning_rate": 7.18763326722145e-05, "loss": 0.4107, "step": 1632 }, { "epoch": 0.42064590913481664, "grad_norm": 0.1917188140363985, "learning_rate": 7.183588670950456e-05, "loss": 0.3919, "step": 1633 }, { "epoch": 0.42090350001609944, "grad_norm": 0.12897558441039192, "learning_rate": 7.179542308343233e-05, "loss": 0.3194, "step": 1634 }, { "epoch": 0.42116109089738224, "grad_norm": 0.16189992112396553, "learning_rate": 7.175494182672939e-05, "loss": 0.4415, "step": 1635 }, { "epoch": 0.42116109089738224, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8268727082242011, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.41903409361839294, "eval_runtime": 17.0661, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 1635 }, { "epoch": 0.42141868177866504, "grad_norm": 0.19082729608947205, "learning_rate": 7.171444297214163e-05, "loss": 0.3584, "step": 1636 }, { "epoch": 0.42167627265994784, "grad_norm": 0.15497682120873124, "learning_rate": 7.167392655242914e-05, "loss": 0.4473, "step": 1637 }, { "epoch": 0.42193386354123064, "grad_norm": 0.13942468277613548, "learning_rate": 7.163339260036624e-05, "loss": 0.4069, "step": 1638 }, { "epoch": 0.42219145442251343, "grad_norm": 0.12793360974305049, "learning_rate": 7.159284114874141e-05, "loss": 0.3088, "step": 1639 }, { "epoch": 0.42244904530379623, "grad_norm": 0.17848180270930525, "learning_rate": 7.155227223035732e-05, "loss": 0.4505, "step": 1640 }, { "epoch": 0.42244904530379623, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8239916186485071, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42409446835517883, "eval_runtime": 17.153, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 1640 }, { "epoch": 0.42270663618507903, "grad_norm": 0.1483130171252024, "learning_rate": 7.151168587803075e-05, "loss": 0.4207, "step": 1641 }, { "epoch": 0.42296422706636183, "grad_norm": 0.1273691026283171, "learning_rate": 7.147108212459257e-05, "loss": 0.3156, "step": 1642 }, { "epoch": 0.42322181794764463, "grad_norm": 0.1823027073422586, "learning_rate": 7.143046100288776e-05, "loss": 0.3893, "step": 1643 }, { "epoch": 0.42347940882892743, "grad_norm": 0.14733814208343146, "learning_rate": 7.138982254577531e-05, "loss": 0.4293, "step": 1644 }, { "epoch": 0.4237369997102103, "grad_norm": 0.1406277076224388, "learning_rate": 7.134916678612825e-05, "loss": 0.3605, "step": 1645 }, { "epoch": 0.4237369997102103, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.821110529072813, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42471590638160706, "eval_runtime": 16.8892, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 1645 }, { "epoch": 0.4239945905914931, "grad_norm": 0.1360882375814374, "learning_rate": 7.130849375683361e-05, "loss": 0.3408, "step": 1646 }, { "epoch": 0.4242521814727759, "grad_norm": 0.18513822271834893, "learning_rate": 7.126780349079242e-05, "loss": 0.42, "step": 1647 }, { "epoch": 0.4245097723540587, "grad_norm": 0.15352215299099797, "learning_rate": 7.122709602091957e-05, "loss": 0.3501, "step": 1648 }, { "epoch": 0.4247673632353415, "grad_norm": 0.15578519721296688, "learning_rate": 7.118637138014396e-05, "loss": 0.4202, "step": 1649 }, { "epoch": 0.4250249541166243, "grad_norm": 0.14793587983394899, "learning_rate": 7.11456296014083e-05, "loss": 0.3376, "step": 1650 }, { "epoch": 0.4250249541166243, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.8268727082242012, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4164595305919647, "eval_runtime": 17.2225, "eval_samples_per_second": 2.555, "eval_steps_per_second": 0.174, "step": 1650 }, { "epoch": 0.4252825449979071, "grad_norm": 0.12365968333207746, "learning_rate": 7.110487071766923e-05, "loss": 0.3149, "step": 1651 }, { "epoch": 0.4255401358791899, "grad_norm": 0.15181476791503504, "learning_rate": 7.106409476189718e-05, "loss": 0.3796, "step": 1652 }, { "epoch": 0.4257977267604727, "grad_norm": 0.13219219694307918, "learning_rate": 7.10233017670764e-05, "loss": 0.3584, "step": 1653 }, { "epoch": 0.42605531764175547, "grad_norm": 0.13367881626469846, "learning_rate": 7.098249176620495e-05, "loss": 0.2846, "step": 1654 }, { "epoch": 0.42631290852303827, "grad_norm": 0.1471472806669616, "learning_rate": 7.09416647922946e-05, "loss": 0.3626, "step": 1655 }, { "epoch": 0.42631290852303827, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8255631220534311, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.41628196835517883, "eval_runtime": 17.6557, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 1655 }, { "epoch": 0.42657049940432107, "grad_norm": 0.132500953249351, "learning_rate": 7.090082087837092e-05, "loss": 0.3475, "step": 1656 }, { "epoch": 0.42682809028560387, "grad_norm": 0.14565255961920318, "learning_rate": 7.085996005747309e-05, "loss": 0.4209, "step": 1657 }, { "epoch": 0.42708568116688667, "grad_norm": 0.13388965561706115, "learning_rate": 7.081908236265402e-05, "loss": 0.2854, "step": 1658 }, { "epoch": 0.4273432720481695, "grad_norm": 0.12532083680459524, "learning_rate": 7.077818782698029e-05, "loss": 0.3136, "step": 1659 }, { "epoch": 0.4276008629294523, "grad_norm": 0.21681625661231177, "learning_rate": 7.073727648353206e-05, "loss": 0.4566, "step": 1660 }, { "epoch": 0.4276008629294523, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8255631220534312, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4304865002632141, "eval_runtime": 17.6883, "eval_samples_per_second": 2.488, "eval_steps_per_second": 0.17, "step": 1660 }, { "epoch": 0.4278584538107351, "grad_norm": 0.11912709697393278, "learning_rate": 7.069634836540311e-05, "loss": 0.2856, "step": 1661 }, { "epoch": 0.4281160446920179, "grad_norm": 0.16207036241383604, "learning_rate": 7.065540350570078e-05, "loss": 0.3565, "step": 1662 }, { "epoch": 0.4283736355733007, "grad_norm": 0.18035727516717912, "learning_rate": 7.061444193754596e-05, "loss": 0.4184, "step": 1663 }, { "epoch": 0.4286312264545835, "grad_norm": 0.13314348308553056, "learning_rate": 7.057346369407305e-05, "loss": 0.3113, "step": 1664 }, { "epoch": 0.4288888173358663, "grad_norm": 0.13172214351737782, "learning_rate": 7.053246880842992e-05, "loss": 0.3425, "step": 1665 }, { "epoch": 0.4288888173358663, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8395061728395061, "eval_PRM F1 AUC": 0.6705081194342588, "eval_PRM F1 AUC (fixed)": 0.8129910948140388, "eval_PRM F1 Neg": 0.48, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8607594936708861, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4350142180919647, "eval_runtime": 17.1129, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 1665 }, { "epoch": 0.4291464082171491, "grad_norm": 0.242205176382298, "learning_rate": 7.049145731377794e-05, "loss": 0.3827, "step": 1666 }, { "epoch": 0.4294039990984319, "grad_norm": 0.2115397540028098, "learning_rate": 7.045042924329189e-05, "loss": 0.4184, "step": 1667 }, { "epoch": 0.4296615899797147, "grad_norm": 0.19444072765202533, "learning_rate": 7.040938463015998e-05, "loss": 0.402, "step": 1668 }, { "epoch": 0.4299191808609975, "grad_norm": 0.153718373191594, "learning_rate": 7.036832350758377e-05, "loss": 0.3376, "step": 1669 }, { "epoch": 0.4301767717422803, "grad_norm": 0.14058132234021567, "learning_rate": 7.032724590877821e-05, "loss": 0.3097, "step": 1670 }, { "epoch": 0.4301767717422803, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8153483499214248, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.45321378111839294, "eval_runtime": 16.989, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 1670 }, { "epoch": 0.4304343626235631, "grad_norm": 0.1540216398765928, "learning_rate": 7.028615186697154e-05, "loss": 0.3472, "step": 1671 }, { "epoch": 0.4306919535048459, "grad_norm": 0.24956774447817262, "learning_rate": 7.024504141540533e-05, "loss": 0.4581, "step": 1672 }, { "epoch": 0.43094954438612876, "grad_norm": 0.18407445952809962, "learning_rate": 7.020391458733442e-05, "loss": 0.3525, "step": 1673 }, { "epoch": 0.43120713526741156, "grad_norm": 0.21693048647349547, "learning_rate": 7.016277141602687e-05, "loss": 0.4354, "step": 1674 }, { "epoch": 0.43146472614869436, "grad_norm": 0.17080097106682174, "learning_rate": 7.012161193476398e-05, "loss": 0.362, "step": 1675 }, { "epoch": 0.43146472614869436, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8395061728395061, "eval_PRM F1 AUC": 0.6705081194342588, "eval_PRM F1 AUC (fixed)": 0.8213724463069669, "eval_PRM F1 Neg": 0.48, "eval_PRM NPV": 0.4444444444444444, "eval_PRM Precision": 0.8607594936708861, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4223189055919647, "eval_runtime": 17.0844, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 1675 }, { "epoch": 0.43172231702997715, "grad_norm": 0.1857300129304199, "learning_rate": 7.008043617684029e-05, "loss": 0.4717, "step": 1676 }, { "epoch": 0.43197990791125995, "grad_norm": 0.2560040048096338, "learning_rate": 7.003924417556343e-05, "loss": 0.3636, "step": 1677 }, { "epoch": 0.43223749879254275, "grad_norm": 0.2419266075430232, "learning_rate": 6.99980359642542e-05, "loss": 0.4895, "step": 1678 }, { "epoch": 0.43249508967382555, "grad_norm": 0.25027081320670364, "learning_rate": 6.995681157624652e-05, "loss": 0.4339, "step": 1679 }, { "epoch": 0.43275268055510835, "grad_norm": 0.170515222410119, "learning_rate": 6.991557104488739e-05, "loss": 0.3679, "step": 1680 }, { "epoch": 0.43275268055510835, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.8289680460974334, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4154829680919647, "eval_runtime": 17.4531, "eval_samples_per_second": 2.521, "eval_steps_per_second": 0.172, "step": 1680 }, { "epoch": 0.43301027143639115, "grad_norm": 0.18310147734471674, "learning_rate": 6.987431440353687e-05, "loss": 0.3885, "step": 1681 }, { "epoch": 0.43326786231767395, "grad_norm": 0.1967158183774711, "learning_rate": 6.983304168556802e-05, "loss": 0.3716, "step": 1682 }, { "epoch": 0.43352545319895675, "grad_norm": 0.1451668946266958, "learning_rate": 6.979175292436699e-05, "loss": 0.3713, "step": 1683 }, { "epoch": 0.43378304408023954, "grad_norm": 0.13596152863948568, "learning_rate": 6.975044815333282e-05, "loss": 0.3885, "step": 1684 }, { "epoch": 0.43404063496152234, "grad_norm": 0.15931568373498023, "learning_rate": 6.970912740587752e-05, "loss": 0.3747, "step": 1685 }, { "epoch": 0.43404063496152234, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8901734104046243, "eval_PRM F1 AUC": 0.6812467260345731, "eval_PRM F1 AUC (fixed)": 0.8431115767417496, "eval_PRM F1 Neg": 0.5128205128205128, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8555555555555555, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4402521252632141, "eval_runtime": 17.1166, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 1685 }, { "epoch": 0.43429822584280514, "grad_norm": 0.1891362594968986, "learning_rate": 6.966779071542605e-05, "loss": 0.3181, "step": 1686 }, { "epoch": 0.43455581672408794, "grad_norm": 0.19353794558001683, "learning_rate": 6.962643811541627e-05, "loss": 0.4575, "step": 1687 }, { "epoch": 0.4348134076053708, "grad_norm": 0.11494463538518664, "learning_rate": 6.958506963929885e-05, "loss": 0.3316, "step": 1688 }, { "epoch": 0.4350709984866536, "grad_norm": 0.1936566556060151, "learning_rate": 6.954368532053739e-05, "loss": 0.4077, "step": 1689 }, { "epoch": 0.4353285893679364, "grad_norm": 0.13135924029370072, "learning_rate": 6.950228519260823e-05, "loss": 0.3354, "step": 1690 }, { "epoch": 0.4353285893679364, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8347302252488212, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4311967194080353, "eval_runtime": 16.9796, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 1690 }, { "epoch": 0.4355861802492192, "grad_norm": 0.20022433677024662, "learning_rate": 6.946086928900054e-05, "loss": 0.422, "step": 1691 }, { "epoch": 0.435843771130502, "grad_norm": 0.18366629653456173, "learning_rate": 6.941943764321623e-05, "loss": 0.4589, "step": 1692 }, { "epoch": 0.4361013620117848, "grad_norm": 0.15705629577402927, "learning_rate": 6.937799028876997e-05, "loss": 0.4236, "step": 1693 }, { "epoch": 0.4363589528930676, "grad_norm": 0.13882151295266146, "learning_rate": 6.93365272591891e-05, "loss": 0.3521, "step": 1694 }, { "epoch": 0.4366165437743504, "grad_norm": 0.13239171602123623, "learning_rate": 6.929504858801366e-05, "loss": 0.4381, "step": 1695 }, { "epoch": 0.4366165437743504, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8205128205128205, "eval_PRM F1 AUC": 0.6898899947616554, "eval_PRM F1 AUC (fixed)": 0.817443687794657, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.42424242424242425, "eval_PRM Precision": 0.8767123287671232, "eval_PRM Recall": 0.7710843373493976, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.46102628111839294, "eval_runtime": 17.1442, "eval_samples_per_second": 2.566, "eval_steps_per_second": 0.175, "step": 1695 }, { "epoch": 0.4368741346556332, "grad_norm": 0.19085992745409852, "learning_rate": 6.925355430879638e-05, "loss": 0.3789, "step": 1696 }, { "epoch": 0.437131725536916, "grad_norm": 0.2579891690692368, "learning_rate": 6.921204445510254e-05, "loss": 0.3967, "step": 1697 }, { "epoch": 0.4373893164181988, "grad_norm": 0.22855319790289935, "learning_rate": 6.917051906051006e-05, "loss": 0.4178, "step": 1698 }, { "epoch": 0.4376469072994816, "grad_norm": 0.1532384890658266, "learning_rate": 6.912897815860943e-05, "loss": 0.3691, "step": 1699 }, { "epoch": 0.4379044981807644, "grad_norm": 0.17672536325016108, "learning_rate": 6.908742178300369e-05, "loss": 0.3464, "step": 1700 }, { "epoch": 0.4379044981807644, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8184913567312728, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46022728085517883, "eval_runtime": 17.3178, "eval_samples_per_second": 2.541, "eval_steps_per_second": 0.173, "step": 1700 }, { "epoch": 0.4381620890620472, "grad_norm": 0.1648239220047686, "learning_rate": 6.904584996730838e-05, "loss": 0.3914, "step": 1701 }, { "epoch": 0.43841967994333003, "grad_norm": 0.1141412049080383, "learning_rate": 6.900426274515156e-05, "loss": 0.3293, "step": 1702 }, { "epoch": 0.43867727082461283, "grad_norm": 0.20543449288842194, "learning_rate": 6.89626601501737e-05, "loss": 0.4069, "step": 1703 }, { "epoch": 0.43893486170589563, "grad_norm": 0.16173671673549217, "learning_rate": 6.892104221602778e-05, "loss": 0.3826, "step": 1704 }, { "epoch": 0.43919245258717843, "grad_norm": 0.1893225188235678, "learning_rate": 6.887940897637908e-05, "loss": 0.445, "step": 1705 }, { "epoch": 0.43919245258717843, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8336825563122053, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4788263440132141, "eval_runtime": 17.6784, "eval_samples_per_second": 2.489, "eval_steps_per_second": 0.17, "step": 1705 }, { "epoch": 0.4394500434684612, "grad_norm": 0.18630614798788867, "learning_rate": 6.883776046490538e-05, "loss": 0.4424, "step": 1706 }, { "epoch": 0.439707634349744, "grad_norm": 0.14177074104369453, "learning_rate": 6.879609671529674e-05, "loss": 0.3648, "step": 1707 }, { "epoch": 0.4399652252310268, "grad_norm": 0.1721306150266505, "learning_rate": 6.875441776125557e-05, "loss": 0.3826, "step": 1708 }, { "epoch": 0.4402228161123096, "grad_norm": 0.17543560055912663, "learning_rate": 6.871272363649657e-05, "loss": 0.3841, "step": 1709 }, { "epoch": 0.4404804069935924, "grad_norm": 0.15591326453459423, "learning_rate": 6.867101437474672e-05, "loss": 0.4122, "step": 1710 }, { "epoch": 0.4404804069935924, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.821372446306967, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.45516690611839294, "eval_runtime": 16.5233, "eval_samples_per_second": 2.663, "eval_steps_per_second": 0.182, "step": 1710 }, { "epoch": 0.4407379978748752, "grad_norm": 0.13655206129355021, "learning_rate": 6.862929000974523e-05, "loss": 0.3562, "step": 1711 }, { "epoch": 0.440995588756158, "grad_norm": 0.1282885864942731, "learning_rate": 6.858755057524354e-05, "loss": 0.3939, "step": 1712 }, { "epoch": 0.4412531796374408, "grad_norm": 0.13552173100247356, "learning_rate": 6.85457961050053e-05, "loss": 0.3675, "step": 1713 }, { "epoch": 0.4415107705187236, "grad_norm": 0.1351814625112122, "learning_rate": 6.850402663280626e-05, "loss": 0.3933, "step": 1714 }, { "epoch": 0.4417683614000064, "grad_norm": 0.14169744720786462, "learning_rate": 6.84622421924344e-05, "loss": 0.4484, "step": 1715 }, { "epoch": 0.4417683614000064, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8322981366459627, "eval_PRM F1 AUC": 0.6644840230487166, "eval_PRM F1 AUC (fixed)": 0.8135149292823467, "eval_PRM F1 Neg": 0.47058823529411764, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8589743589743589, "eval_PRM Recall": 0.8072289156626506, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4529474377632141, "eval_runtime": 16.6447, "eval_samples_per_second": 2.643, "eval_steps_per_second": 0.18, "step": 1715 }, { "epoch": 0.44202595228128927, "grad_norm": 0.2271303054406433, "learning_rate": 6.84204428176897e-05, "loss": 0.3501, "step": 1716 }, { "epoch": 0.44228354316257207, "grad_norm": 0.15378921941660625, "learning_rate": 6.837862854238432e-05, "loss": 0.3586, "step": 1717 }, { "epoch": 0.44254113404385487, "grad_norm": 0.1495132105789954, "learning_rate": 6.83367994003424e-05, "loss": 0.4018, "step": 1718 }, { "epoch": 0.44279872492513767, "grad_norm": 0.21086766758596315, "learning_rate": 6.829495542540013e-05, "loss": 0.4094, "step": 1719 }, { "epoch": 0.44305631580642046, "grad_norm": 0.13688962767599477, "learning_rate": 6.825309665140571e-05, "loss": 0.3686, "step": 1720 }, { "epoch": 0.44305631580642046, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8158721843897327, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46803978085517883, "eval_runtime": 17.5793, "eval_samples_per_second": 2.503, "eval_steps_per_second": 0.171, "step": 1720 }, { "epoch": 0.44331390668770326, "grad_norm": 0.1333967628283758, "learning_rate": 6.821122311221931e-05, "loss": 0.2785, "step": 1721 }, { "epoch": 0.44357149756898606, "grad_norm": 0.15281665920531123, "learning_rate": 6.816933484171302e-05, "loss": 0.3859, "step": 1722 }, { "epoch": 0.44382908845026886, "grad_norm": 0.17771362217536785, "learning_rate": 6.812743187377091e-05, "loss": 0.3824, "step": 1723 }, { "epoch": 0.44408667933155166, "grad_norm": 0.21778928990755528, "learning_rate": 6.808551424228884e-05, "loss": 0.451, "step": 1724 }, { "epoch": 0.44434427021283446, "grad_norm": 0.10609758424993862, "learning_rate": 6.80435819811746e-05, "loss": 0.2491, "step": 1725 }, { "epoch": 0.44434427021283446, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8129910948140388, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.48739346861839294, "eval_runtime": 17.603, "eval_samples_per_second": 2.5, "eval_steps_per_second": 0.17, "step": 1725 }, { "epoch": 0.44460186109411726, "grad_norm": 0.1495077715591695, "learning_rate": 6.80016351243478e-05, "loss": 0.4116, "step": 1726 }, { "epoch": 0.44485945197540006, "grad_norm": 0.15902314315407612, "learning_rate": 6.795967370573985e-05, "loss": 0.3691, "step": 1727 }, { "epoch": 0.44511704285668285, "grad_norm": 0.14668113698313168, "learning_rate": 6.791769775929395e-05, "loss": 0.4258, "step": 1728 }, { "epoch": 0.44537463373796565, "grad_norm": 0.14090097932135287, "learning_rate": 6.787570731896506e-05, "loss": 0.384, "step": 1729 }, { "epoch": 0.44563222461924845, "grad_norm": 0.12279551466760454, "learning_rate": 6.783370241871983e-05, "loss": 0.3591, "step": 1730 }, { "epoch": 0.44563222461924845, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8135149292823468, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.47265625, "eval_runtime": 16.9998, "eval_samples_per_second": 2.588, "eval_steps_per_second": 0.176, "step": 1730 }, { "epoch": 0.4458898155005313, "grad_norm": 0.11004166096353546, "learning_rate": 6.779168309253663e-05, "loss": 0.288, "step": 1731 }, { "epoch": 0.4461474063818141, "grad_norm": 0.1373344425290363, "learning_rate": 6.774964937440549e-05, "loss": 0.3416, "step": 1732 }, { "epoch": 0.4464049972630969, "grad_norm": 0.1861323851494907, "learning_rate": 6.77076012983281e-05, "loss": 0.4617, "step": 1733 }, { "epoch": 0.4466625881443797, "grad_norm": 0.13426266155814937, "learning_rate": 6.766553889831776e-05, "loss": 0.3921, "step": 1734 }, { "epoch": 0.4469201790256625, "grad_norm": 0.11448251857231911, "learning_rate": 6.762346220839932e-05, "loss": 0.292, "step": 1735 }, { "epoch": 0.4469201790256625, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8171817705605029, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46315696835517883, "eval_runtime": 16.9253, "eval_samples_per_second": 2.6, "eval_steps_per_second": 0.177, "step": 1735 }, { "epoch": 0.4471777699069453, "grad_norm": 0.11542488199321789, "learning_rate": 6.758137126260927e-05, "loss": 0.3977, "step": 1736 }, { "epoch": 0.4474353607882281, "grad_norm": 0.13532912048509205, "learning_rate": 6.753926609499553e-05, "loss": 0.3347, "step": 1737 }, { "epoch": 0.4476929516695109, "grad_norm": 0.12615595527688414, "learning_rate": 6.749714673961759e-05, "loss": 0.3719, "step": 1738 }, { "epoch": 0.4479505425507937, "grad_norm": 0.14492841377117893, "learning_rate": 6.745501323054639e-05, "loss": 0.3695, "step": 1739 }, { "epoch": 0.4482081334320765, "grad_norm": 0.1285255899503753, "learning_rate": 6.741286560186437e-05, "loss": 0.3797, "step": 1740 }, { "epoch": 0.4482081334320765, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8242535358826611, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.46653053164482117, "eval_runtime": 17.2999, "eval_samples_per_second": 2.543, "eval_steps_per_second": 0.173, "step": 1740 }, { "epoch": 0.4484657243133593, "grad_norm": 0.1489394526765812, "learning_rate": 6.73707038876653e-05, "loss": 0.3514, "step": 1741 }, { "epoch": 0.4487233151946421, "grad_norm": 0.12267758533739277, "learning_rate": 6.732852812205443e-05, "loss": 0.3685, "step": 1742 }, { "epoch": 0.4489809060759249, "grad_norm": 0.11871984144582193, "learning_rate": 6.728633833914834e-05, "loss": 0.3468, "step": 1743 }, { "epoch": 0.4492384969572077, "grad_norm": 0.19853299310987585, "learning_rate": 6.724413457307497e-05, "loss": 0.3548, "step": 1744 }, { "epoch": 0.44949608783849054, "grad_norm": 0.13986965004720225, "learning_rate": 6.72019168579735e-05, "loss": 0.369, "step": 1745 }, { "epoch": 0.44949608783849054, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8289680460974332, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4685724377632141, "eval_runtime": 17.1048, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 1745 }, { "epoch": 0.44975367871977334, "grad_norm": 0.24337101990458107, "learning_rate": 6.715968522799449e-05, "loss": 0.5371, "step": 1746 }, { "epoch": 0.45001126960105614, "grad_norm": 0.15656125611883218, "learning_rate": 6.711743971729967e-05, "loss": 0.3608, "step": 1747 }, { "epoch": 0.45026886048233894, "grad_norm": 0.1156802244453824, "learning_rate": 6.707518036006208e-05, "loss": 0.37, "step": 1748 }, { "epoch": 0.45052645136362174, "grad_norm": 0.1251717102580924, "learning_rate": 6.703290719046591e-05, "loss": 0.3752, "step": 1749 }, { "epoch": 0.45078404224490454, "grad_norm": 0.1589306906202831, "learning_rate": 6.699062024270654e-05, "loss": 0.3488, "step": 1750 }, { "epoch": 0.45078404224490454, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.8218962807752751, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4593394994735718, "eval_runtime": 17.002, "eval_samples_per_second": 2.588, "eval_steps_per_second": 0.176, "step": 1750 }, { "epoch": 0.45104163312618734, "grad_norm": 0.15305367646211848, "learning_rate": 6.694831955099048e-05, "loss": 0.2927, "step": 1751 }, { "epoch": 0.45129922400747013, "grad_norm": 0.14804032810620574, "learning_rate": 6.690600514953535e-05, "loss": 0.3988, "step": 1752 }, { "epoch": 0.45155681488875293, "grad_norm": 0.1560343091330646, "learning_rate": 6.686367707256993e-05, "loss": 0.4452, "step": 1753 }, { "epoch": 0.45181440577003573, "grad_norm": 0.15215229302898645, "learning_rate": 6.682133535433393e-05, "loss": 0.3454, "step": 1754 }, { "epoch": 0.45207199665131853, "grad_norm": 0.12847547778420332, "learning_rate": 6.677898002907824e-05, "loss": 0.3139, "step": 1755 }, { "epoch": 0.45207199665131853, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.818753273965427, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4617365002632141, "eval_runtime": 16.4301, "eval_samples_per_second": 2.678, "eval_steps_per_second": 0.183, "step": 1755 }, { "epoch": 0.45232958753260133, "grad_norm": 0.1477943557497144, "learning_rate": 6.673661113106466e-05, "loss": 0.4068, "step": 1756 }, { "epoch": 0.45258717841388413, "grad_norm": 0.1511303741817972, "learning_rate": 6.669422869456602e-05, "loss": 0.4087, "step": 1757 }, { "epoch": 0.4528447692951669, "grad_norm": 0.13139264127147623, "learning_rate": 6.665183275386606e-05, "loss": 0.3335, "step": 1758 }, { "epoch": 0.4531023601764498, "grad_norm": 0.18048434840499797, "learning_rate": 6.66094233432595e-05, "loss": 0.3989, "step": 1759 }, { "epoch": 0.4533599510577326, "grad_norm": 0.15954195412321842, "learning_rate": 6.656700049705185e-05, "loss": 0.3923, "step": 1760 }, { "epoch": 0.4533599510577326, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.819800942902043, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.46218040585517883, "eval_runtime": 16.9355, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 1760 }, { "epoch": 0.4536175419390154, "grad_norm": 0.2049842261251955, "learning_rate": 6.652456424955963e-05, "loss": 0.4129, "step": 1761 }, { "epoch": 0.4538751328202982, "grad_norm": 0.1426572592417938, "learning_rate": 6.648211463511011e-05, "loss": 0.4157, "step": 1762 }, { "epoch": 0.454132723701581, "grad_norm": 0.15175757619670358, "learning_rate": 6.64396516880414e-05, "loss": 0.3496, "step": 1763 }, { "epoch": 0.4543903145828638, "grad_norm": 0.13528718739541562, "learning_rate": 6.639717544270235e-05, "loss": 0.3165, "step": 1764 }, { "epoch": 0.4546479054641466, "grad_norm": 0.19530181721713039, "learning_rate": 6.635468593345265e-05, "loss": 0.4133, "step": 1765 }, { "epoch": 0.4546479054641466, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8466257668711656, "eval_PRM F1 AUC": 0.6765322158198009, "eval_PRM F1 AUC (fixed)": 0.8059193294918806, "eval_PRM F1 Neg": 0.4897959183673469, "eval_PRM NPV": 0.46153846153846156, "eval_PRM Precision": 0.8625, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4614701569080353, "eval_runtime": 17.6729, "eval_samples_per_second": 2.49, "eval_steps_per_second": 0.17, "step": 1765 }, { "epoch": 0.45490549634542937, "grad_norm": 0.14463457721223935, "learning_rate": 6.631218319466263e-05, "loss": 0.3627, "step": 1766 }, { "epoch": 0.45516308722671217, "grad_norm": 0.13385592068048957, "learning_rate": 6.626966726071342e-05, "loss": 0.4145, "step": 1767 }, { "epoch": 0.45542067810799497, "grad_norm": 0.1568733952765744, "learning_rate": 6.622713816599673e-05, "loss": 0.4013, "step": 1768 }, { "epoch": 0.45567826898927777, "grad_norm": 0.1450985715593632, "learning_rate": 6.618459594491496e-05, "loss": 0.3235, "step": 1769 }, { "epoch": 0.45593585987056057, "grad_norm": 0.15473087082418885, "learning_rate": 6.614204063188114e-05, "loss": 0.4391, "step": 1770 }, { "epoch": 0.45593585987056057, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.8048716605552645, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.47629615664482117, "eval_runtime": 17.1046, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 1770 }, { "epoch": 0.45619345075184337, "grad_norm": 0.1597197275171068, "learning_rate": 6.609947226131886e-05, "loss": 0.4044, "step": 1771 }, { "epoch": 0.45645104163312616, "grad_norm": 0.13092753418484807, "learning_rate": 6.605689086766228e-05, "loss": 0.3569, "step": 1772 }, { "epoch": 0.45670863251440896, "grad_norm": 0.2180789498457224, "learning_rate": 6.601429648535612e-05, "loss": 0.3719, "step": 1773 }, { "epoch": 0.4569662233956918, "grad_norm": 0.12425193143172036, "learning_rate": 6.597168914885557e-05, "loss": 0.3207, "step": 1774 }, { "epoch": 0.4572238142769746, "grad_norm": 0.17297479293725546, "learning_rate": 6.592906889262632e-05, "loss": 0.4564, "step": 1775 }, { "epoch": 0.4572238142769746, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8135149292823467, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.47336646914482117, "eval_runtime": 17.6046, "eval_samples_per_second": 2.499, "eval_steps_per_second": 0.17, "step": 1775 }, { "epoch": 0.4574814051582574, "grad_norm": 0.14221285111612977, "learning_rate": 6.588643575114453e-05, "loss": 0.377, "step": 1776 }, { "epoch": 0.4577389960395402, "grad_norm": 0.12181618900089665, "learning_rate": 6.584378975889671e-05, "loss": 0.2739, "step": 1777 }, { "epoch": 0.457996586920823, "grad_norm": 0.13247459693730074, "learning_rate": 6.580113095037988e-05, "loss": 0.3342, "step": 1778 }, { "epoch": 0.4582541778021058, "grad_norm": 0.13854065238318528, "learning_rate": 6.575845936010131e-05, "loss": 0.3616, "step": 1779 }, { "epoch": 0.4585117686833886, "grad_norm": 0.15817649226108169, "learning_rate": 6.571577502257868e-05, "loss": 0.3531, "step": 1780 }, { "epoch": 0.4585117686833886, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.822943949711891, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4604048430919647, "eval_runtime": 16.5001, "eval_samples_per_second": 2.667, "eval_steps_per_second": 0.182, "step": 1780 }, { "epoch": 0.4587693595646714, "grad_norm": 0.2153893590670722, "learning_rate": 6.567307797233996e-05, "loss": 0.4502, "step": 1781 }, { "epoch": 0.4590269504459542, "grad_norm": 0.12363789940639183, "learning_rate": 6.563036824392344e-05, "loss": 0.2915, "step": 1782 }, { "epoch": 0.459284541327237, "grad_norm": 0.1376832158336152, "learning_rate": 6.558764587187758e-05, "loss": 0.3941, "step": 1783 }, { "epoch": 0.4595421322085198, "grad_norm": 0.13701724803519236, "learning_rate": 6.554491089076116e-05, "loss": 0.3555, "step": 1784 }, { "epoch": 0.4597997230898026, "grad_norm": 0.16306476725703423, "learning_rate": 6.550216333514311e-05, "loss": 0.3623, "step": 1785 }, { "epoch": 0.4597997230898026, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8268727082242011, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4519708752632141, "eval_runtime": 16.8731, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 1785 }, { "epoch": 0.4600573139710854, "grad_norm": 0.227678970554314, "learning_rate": 6.545940323960253e-05, "loss": 0.372, "step": 1786 }, { "epoch": 0.4603149048523682, "grad_norm": 0.12454168871909095, "learning_rate": 6.541663063872866e-05, "loss": 0.3684, "step": 1787 }, { "epoch": 0.46057249573365105, "grad_norm": 0.1326560038115873, "learning_rate": 6.537384556712092e-05, "loss": 0.3429, "step": 1788 }, { "epoch": 0.46083008661493385, "grad_norm": 0.13872710248306508, "learning_rate": 6.533104805938873e-05, "loss": 0.3703, "step": 1789 }, { "epoch": 0.46108767749621665, "grad_norm": 0.14160275745056403, "learning_rate": 6.528823815015162e-05, "loss": 0.3379, "step": 1790 }, { "epoch": 0.46108767749621665, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8211105290728131, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4526810944080353, "eval_runtime": 17.5622, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 1790 }, { "epoch": 0.46134526837749945, "grad_norm": 0.14379831385229544, "learning_rate": 6.524541587403913e-05, "loss": 0.3287, "step": 1791 }, { "epoch": 0.46160285925878225, "grad_norm": 0.1597197496689729, "learning_rate": 6.520258126569086e-05, "loss": 0.3651, "step": 1792 }, { "epoch": 0.46186045014006505, "grad_norm": 0.1330504574870503, "learning_rate": 6.515973435975628e-05, "loss": 0.3868, "step": 1793 }, { "epoch": 0.46211804102134785, "grad_norm": 0.1331841831598561, "learning_rate": 6.511687519089489e-05, "loss": 0.339, "step": 1794 }, { "epoch": 0.46237563190263065, "grad_norm": 0.1271501170893098, "learning_rate": 6.507400379377608e-05, "loss": 0.3451, "step": 1795 }, { "epoch": 0.46237563190263065, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8355159769512834, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4457564055919647, "eval_runtime": 16.8511, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 1795 }, { "epoch": 0.46263322278391344, "grad_norm": 0.1611007448146758, "learning_rate": 6.503112020307916e-05, "loss": 0.3275, "step": 1796 }, { "epoch": 0.46289081366519624, "grad_norm": 0.17241373724739617, "learning_rate": 6.498822445349328e-05, "loss": 0.335, "step": 1797 }, { "epoch": 0.46314840454647904, "grad_norm": 0.1282580640321002, "learning_rate": 6.49453165797174e-05, "loss": 0.3707, "step": 1798 }, { "epoch": 0.46340599542776184, "grad_norm": 0.1565541491281499, "learning_rate": 6.490239661646035e-05, "loss": 0.2874, "step": 1799 }, { "epoch": 0.46366358630904464, "grad_norm": 0.2257568719269108, "learning_rate": 6.485946459844066e-05, "loss": 0.4038, "step": 1800 }, { "epoch": 0.46366358630904464, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.8520167627029858, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.43954190611839294, "eval_runtime": 17.2684, "eval_samples_per_second": 2.548, "eval_steps_per_second": 0.174, "step": 1800 }, { "epoch": 0.46392117719032744, "grad_norm": 0.10712108406232321, "learning_rate": 6.481652056038672e-05, "loss": 0.295, "step": 1801 }, { "epoch": 0.4641787680716103, "grad_norm": 0.19676996340896782, "learning_rate": 6.477356453703651e-05, "loss": 0.4024, "step": 1802 }, { "epoch": 0.4644363589528931, "grad_norm": 0.22965255884107458, "learning_rate": 6.473059656313782e-05, "loss": 0.4483, "step": 1803 }, { "epoch": 0.4646939498341759, "grad_norm": 0.15848951968242295, "learning_rate": 6.468761667344805e-05, "loss": 0.3542, "step": 1804 }, { "epoch": 0.4649515407154587, "grad_norm": 0.18317261345803337, "learning_rate": 6.464462490273425e-05, "loss": 0.4238, "step": 1805 }, { "epoch": 0.4649515407154587, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8449449973808277, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42942115664482117, "eval_runtime": 17.1382, "eval_samples_per_second": 2.567, "eval_steps_per_second": 0.175, "step": 1805 }, { "epoch": 0.4652091315967415, "grad_norm": 0.1541276110317898, "learning_rate": 6.460162128577307e-05, "loss": 0.3201, "step": 1806 }, { "epoch": 0.4654667224780243, "grad_norm": 0.14413939819416827, "learning_rate": 6.455860585735077e-05, "loss": 0.3699, "step": 1807 }, { "epoch": 0.4657243133593071, "grad_norm": 0.16889055449492826, "learning_rate": 6.451557865226312e-05, "loss": 0.4235, "step": 1808 }, { "epoch": 0.4659819042405899, "grad_norm": 0.14938021769171567, "learning_rate": 6.447253970531549e-05, "loss": 0.3125, "step": 1809 }, { "epoch": 0.4662394951218727, "grad_norm": 0.1447876236528027, "learning_rate": 6.442948905132266e-05, "loss": 0.3264, "step": 1810 }, { "epoch": 0.4662394951218727, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8365636458878996, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4340376555919647, "eval_runtime": 17.2421, "eval_samples_per_second": 2.552, "eval_steps_per_second": 0.174, "step": 1810 }, { "epoch": 0.4664970860031555, "grad_norm": 0.1325408382794767, "learning_rate": 6.438642672510893e-05, "loss": 0.3658, "step": 1811 }, { "epoch": 0.4667546768844383, "grad_norm": 0.26555436438544056, "learning_rate": 6.434335276150806e-05, "loss": 0.4826, "step": 1812 }, { "epoch": 0.4670122677657211, "grad_norm": 0.16278004797099416, "learning_rate": 6.430026719536317e-05, "loss": 0.4357, "step": 1813 }, { "epoch": 0.4672698586470039, "grad_norm": 0.1353678196751081, "learning_rate": 6.425717006152682e-05, "loss": 0.3525, "step": 1814 }, { "epoch": 0.4675274495282867, "grad_norm": 0.13010076318143934, "learning_rate": 6.421406139486085e-05, "loss": 0.363, "step": 1815 }, { "epoch": 0.4675274495282867, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8484848484848485, "eval_PRM F1 AUC": 0.6608171817705605, "eval_PRM F1 AUC (fixed)": 0.8245154531168151, "eval_PRM F1 Neg": 0.46808510638297873, "eval_PRM NPV": 0.4583333333333333, "eval_PRM Precision": 0.8536585365853658, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.44992896914482117, "eval_runtime": 17.036, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 1815 }, { "epoch": 0.4677850404095695, "grad_norm": 0.13151199976813194, "learning_rate": 6.417094123023654e-05, "loss": 0.3905, "step": 1816 }, { "epoch": 0.46804263129085233, "grad_norm": 0.14265186376423084, "learning_rate": 6.412780960253436e-05, "loss": 0.3891, "step": 1817 }, { "epoch": 0.4683002221721351, "grad_norm": 0.17111863843915304, "learning_rate": 6.408466654664415e-05, "loss": 0.3883, "step": 1818 }, { "epoch": 0.4685578130534179, "grad_norm": 0.1397310900299257, "learning_rate": 6.40415120974649e-05, "loss": 0.3345, "step": 1819 }, { "epoch": 0.4688154039347007, "grad_norm": 0.17201275409945146, "learning_rate": 6.39983462899049e-05, "loss": 0.323, "step": 1820 }, { "epoch": 0.4688154039347007, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8520710059171598, "eval_PRM F1 AUC": 0.6293871136720797, "eval_PRM F1 AUC (fixed)": 0.816657936092195, "eval_PRM F1 Neg": 0.4186046511627907, "eval_PRM NPV": 0.45, "eval_PRM Precision": 0.8372093023255814, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4682173430919647, "eval_runtime": 17.599, "eval_samples_per_second": 2.5, "eval_steps_per_second": 0.17, "step": 1820 }, { "epoch": 0.4690729948159835, "grad_norm": 0.18324031697918397, "learning_rate": 6.395516915888158e-05, "loss": 0.38, "step": 1821 }, { "epoch": 0.4693305856972663, "grad_norm": 0.10402598490385051, "learning_rate": 6.391198073932155e-05, "loss": 0.2868, "step": 1822 }, { "epoch": 0.4695881765785491, "grad_norm": 0.19550688722467557, "learning_rate": 6.38687810661605e-05, "loss": 0.4449, "step": 1823 }, { "epoch": 0.4698457674598319, "grad_norm": 0.15513202151171826, "learning_rate": 6.382557017434332e-05, "loss": 0.3444, "step": 1824 }, { "epoch": 0.4701033583411147, "grad_norm": 0.20472026675462934, "learning_rate": 6.37823480988239e-05, "loss": 0.4232, "step": 1825 }, { "epoch": 0.4701033583411147, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8520710059171598, "eval_PRM F1 AUC": 0.6293871136720797, "eval_PRM F1 AUC (fixed)": 0.8022524882137244, "eval_PRM F1 Neg": 0.4186046511627907, "eval_PRM NPV": 0.45, "eval_PRM Precision": 0.8372093023255814, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.49032315611839294, "eval_runtime": 17.5908, "eval_samples_per_second": 2.501, "eval_steps_per_second": 0.171, "step": 1825 }, { "epoch": 0.4703609492223975, "grad_norm": 0.13222147954250396, "learning_rate": 6.373911487456519e-05, "loss": 0.3488, "step": 1826 }, { "epoch": 0.4706185401036803, "grad_norm": 0.19463858262847702, "learning_rate": 6.369587053653917e-05, "loss": 0.3901, "step": 1827 }, { "epoch": 0.4708761309849631, "grad_norm": 0.16713114547710084, "learning_rate": 6.365261511972682e-05, "loss": 0.3422, "step": 1828 }, { "epoch": 0.4711337218662459, "grad_norm": 0.14381957333856812, "learning_rate": 6.360934865911805e-05, "loss": 0.3333, "step": 1829 }, { "epoch": 0.4713913127475287, "grad_norm": 0.14879261794702997, "learning_rate": 6.356607118971171e-05, "loss": 0.3748, "step": 1830 }, { "epoch": 0.4713913127475287, "eval_PRM Accuracy": 0.7358490566037735, "eval_PRM F1": 0.8313253012048193, "eval_PRM F1 AUC": 0.6113148245154532, "eval_PRM F1 AUC (fixed)": 0.7930853850183341, "eval_PRM F1 Neg": 0.391304347826087, "eval_PRM NPV": 0.391304347826087, "eval_PRM Precision": 0.8313253012048193, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.48544034361839294, "eval_runtime": 17.2198, "eval_samples_per_second": 2.555, "eval_steps_per_second": 0.174, "step": 1830 }, { "epoch": 0.47164890362881157, "grad_norm": 0.16114587572311603, "learning_rate": 6.352278274651561e-05, "loss": 0.3811, "step": 1831 }, { "epoch": 0.47190649451009437, "grad_norm": 0.17018309477316115, "learning_rate": 6.347948336454637e-05, "loss": 0.4354, "step": 1832 }, { "epoch": 0.47216408539137716, "grad_norm": 0.15779706174679867, "learning_rate": 6.343617307882946e-05, "loss": 0.4028, "step": 1833 }, { "epoch": 0.47242167627265996, "grad_norm": 0.17386543056112677, "learning_rate": 6.339285192439922e-05, "loss": 0.382, "step": 1834 }, { "epoch": 0.47267926715394276, "grad_norm": 0.20285470789435855, "learning_rate": 6.334951993629875e-05, "loss": 0.3702, "step": 1835 }, { "epoch": 0.47267926715394276, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8383233532934131, "eval_PRM F1 AUC": 0.6173389209009953, "eval_PRM F1 AUC (fixed)": 0.787847040335254, "eval_PRM F1 Neg": 0.4, "eval_PRM NPV": 0.4090909090909091, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.48659446835517883, "eval_runtime": 16.8924, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 1835 }, { "epoch": 0.47293685803522556, "grad_norm": 0.19036692887251433, "learning_rate": 6.33061771495799e-05, "loss": 0.4635, "step": 1836 }, { "epoch": 0.47319444891650836, "grad_norm": 0.15085058845992372, "learning_rate": 6.326282359930329e-05, "loss": 0.4045, "step": 1837 }, { "epoch": 0.47345203979779116, "grad_norm": 0.1634747287161456, "learning_rate": 6.321945932053822e-05, "loss": 0.4149, "step": 1838 }, { "epoch": 0.47370963067907396, "grad_norm": 0.15987001172484994, "learning_rate": 6.317608434836269e-05, "loss": 0.3668, "step": 1839 }, { "epoch": 0.47396722156035676, "grad_norm": 0.15395071881226133, "learning_rate": 6.313269871786333e-05, "loss": 0.4, "step": 1840 }, { "epoch": 0.47396722156035676, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8402366863905325, "eval_PRM F1 AUC": 0.6016238868517548, "eval_PRM F1 AUC (fixed)": 0.7998952331063384, "eval_PRM F1 Neg": 0.37209302325581395, "eval_PRM NPV": 0.4, "eval_PRM Precision": 0.8255813953488372, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.48623934388160706, "eval_runtime": 17.0864, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 1840 }, { "epoch": 0.47422481244163955, "grad_norm": 0.14729279011932994, "learning_rate": 6.308930246413541e-05, "loss": 0.3851, "step": 1841 }, { "epoch": 0.47448240332292235, "grad_norm": 0.13822956072911927, "learning_rate": 6.304589562228275e-05, "loss": 0.2891, "step": 1842 }, { "epoch": 0.47473999420420515, "grad_norm": 0.13417641940253733, "learning_rate": 6.300247822741781e-05, "loss": 0.3132, "step": 1843 }, { "epoch": 0.47499758508548795, "grad_norm": 0.22982622155544408, "learning_rate": 6.29590503146615e-05, "loss": 0.4701, "step": 1844 }, { "epoch": 0.47525517596677075, "grad_norm": 0.19843530597553397, "learning_rate": 6.291561191914333e-05, "loss": 0.4478, "step": 1845 }, { "epoch": 0.47525517596677075, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8402366863905325, "eval_PRM F1 AUC": 0.6016238868517548, "eval_PRM F1 AUC (fixed)": 0.8088004190675746, "eval_PRM F1 Neg": 0.37209302325581395, "eval_PRM NPV": 0.4, "eval_PRM Precision": 0.8255813953488372, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.34782608695652173, "eval_loss": 0.4679509997367859, "eval_runtime": 17.0249, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 1845 }, { "epoch": 0.4755127668480536, "grad_norm": 0.11264666106935119, "learning_rate": 6.28721630760012e-05, "loss": 0.3427, "step": 1846 }, { "epoch": 0.4757703577293364, "grad_norm": 0.1349364170169096, "learning_rate": 6.282870382038154e-05, "loss": 0.3329, "step": 1847 }, { "epoch": 0.4760279486106192, "grad_norm": 0.16180123321346426, "learning_rate": 6.278523418743912e-05, "loss": 0.3588, "step": 1848 }, { "epoch": 0.476285539491902, "grad_norm": 0.13140213702797432, "learning_rate": 6.27417542123372e-05, "loss": 0.339, "step": 1849 }, { "epoch": 0.4765431303731848, "grad_norm": 0.1037858414628389, "learning_rate": 6.269826393024734e-05, "loss": 0.3324, "step": 1850 }, { "epoch": 0.4765431303731848, "eval_PRM Accuracy": 0.7452830188679245, "eval_PRM F1": 0.8383233532934131, "eval_PRM F1 AUC": 0.6173389209009953, "eval_PRM F1 AUC (fixed)": 0.821634363541121, "eval_PRM F1 Neg": 0.4, "eval_PRM NPV": 0.4090909090909091, "eval_PRM Precision": 0.8333333333333334, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4505504369735718, "eval_runtime": 17.7774, "eval_samples_per_second": 2.475, "eval_steps_per_second": 0.169, "step": 1850 }, { "epoch": 0.4768007212544676, "grad_norm": 0.13442708294755987, "learning_rate": 6.265476337634942e-05, "loss": 0.3804, "step": 1851 }, { "epoch": 0.4770583121357504, "grad_norm": 0.14046213413324507, "learning_rate": 6.261125258583171e-05, "loss": 0.3875, "step": 1852 }, { "epoch": 0.4773159030170332, "grad_norm": 0.12731210386232347, "learning_rate": 6.25677315938907e-05, "loss": 0.3364, "step": 1853 }, { "epoch": 0.477573493898316, "grad_norm": 0.16790556359809636, "learning_rate": 6.252420043573112e-05, "loss": 0.4121, "step": 1854 }, { "epoch": 0.4778310847795988, "grad_norm": 0.1295076268772362, "learning_rate": 6.248065914656598e-05, "loss": 0.3236, "step": 1855 }, { "epoch": 0.4778310847795988, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.8250392875851231, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4330610930919647, "eval_runtime": 17.064, "eval_samples_per_second": 2.579, "eval_steps_per_second": 0.176, "step": 1855 }, { "epoch": 0.4780886756608816, "grad_norm": 0.33712955223762625, "learning_rate": 6.243710776161644e-05, "loss": 0.4001, "step": 1856 }, { "epoch": 0.4783462665421644, "grad_norm": 0.13089345607974967, "learning_rate": 6.239354631611183e-05, "loss": 0.3516, "step": 1857 }, { "epoch": 0.4786038574234472, "grad_norm": 0.1582707854570693, "learning_rate": 6.234997484528965e-05, "loss": 0.4148, "step": 1858 }, { "epoch": 0.47886144830473, "grad_norm": 0.1641678396019646, "learning_rate": 6.230639338439549e-05, "loss": 0.3725, "step": 1859 }, { "epoch": 0.47911903918601284, "grad_norm": 0.15389051019466163, "learning_rate": 6.2262801968683e-05, "loss": 0.4003, "step": 1860 }, { "epoch": 0.47911903918601284, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8190151911995809, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4265802502632141, "eval_runtime": 17.0638, "eval_samples_per_second": 2.579, "eval_steps_per_second": 0.176, "step": 1860 }, { "epoch": 0.47937663006729564, "grad_norm": 0.14601188843851445, "learning_rate": 6.22192006334139e-05, "loss": 0.3531, "step": 1861 }, { "epoch": 0.47963422094857844, "grad_norm": 0.12518165917127885, "learning_rate": 6.217558941385797e-05, "loss": 0.3189, "step": 1862 }, { "epoch": 0.47989181182986124, "grad_norm": 0.13700079810562624, "learning_rate": 6.21319683452929e-05, "loss": 0.3751, "step": 1863 }, { "epoch": 0.48014940271114404, "grad_norm": 0.16461156451103587, "learning_rate": 6.208833746300446e-05, "loss": 0.3623, "step": 1864 }, { "epoch": 0.48040699359242683, "grad_norm": 0.152150323134353, "learning_rate": 6.204469680228624e-05, "loss": 0.409, "step": 1865 }, { "epoch": 0.48040699359242683, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8124672603457308, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4321732819080353, "eval_runtime": 16.7971, "eval_samples_per_second": 2.62, "eval_steps_per_second": 0.179, "step": 1865 }, { "epoch": 0.48066458447370963, "grad_norm": 0.1881542191304717, "learning_rate": 6.200104639843985e-05, "loss": 0.3628, "step": 1866 }, { "epoch": 0.48092217535499243, "grad_norm": 0.1714782159353788, "learning_rate": 6.195738628677467e-05, "loss": 0.2964, "step": 1867 }, { "epoch": 0.48117976623627523, "grad_norm": 0.14951772505118566, "learning_rate": 6.191371650260803e-05, "loss": 0.3772, "step": 1868 }, { "epoch": 0.48143735711755803, "grad_norm": 0.13888875964484063, "learning_rate": 6.187003708126504e-05, "loss": 0.3559, "step": 1869 }, { "epoch": 0.48169494799884083, "grad_norm": 0.14360209056564735, "learning_rate": 6.182634805807862e-05, "loss": 0.3915, "step": 1870 }, { "epoch": 0.48169494799884083, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8127291775798848, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4407848119735718, "eval_runtime": 17.116, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 1870 }, { "epoch": 0.4819525388801236, "grad_norm": 0.27278532576291137, "learning_rate": 6.178264946838941e-05, "loss": 0.4931, "step": 1871 }, { "epoch": 0.4822101297614064, "grad_norm": 0.1519600010926597, "learning_rate": 6.173894134754588e-05, "loss": 0.4001, "step": 1872 }, { "epoch": 0.4824677206426892, "grad_norm": 0.1443765094168506, "learning_rate": 6.169522373090412e-05, "loss": 0.4005, "step": 1873 }, { "epoch": 0.4827253115239721, "grad_norm": 0.1533942861240422, "learning_rate": 6.165149665382795e-05, "loss": 0.335, "step": 1874 }, { "epoch": 0.4829829024052549, "grad_norm": 0.17506033632877718, "learning_rate": 6.160776015168882e-05, "loss": 0.3967, "step": 1875 }, { "epoch": 0.4829829024052549, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8048716605552646, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4400745630264282, "eval_runtime": 16.9906, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 1875 }, { "epoch": 0.4832404932865377, "grad_norm": 0.19342704797793206, "learning_rate": 6.156401425986583e-05, "loss": 0.2687, "step": 1876 }, { "epoch": 0.4834980841678205, "grad_norm": 0.1562919934472492, "learning_rate": 6.152025901374565e-05, "loss": 0.4021, "step": 1877 }, { "epoch": 0.4837556750491033, "grad_norm": 0.1322374285427482, "learning_rate": 6.147649444872252e-05, "loss": 0.3605, "step": 1878 }, { "epoch": 0.48401326593038607, "grad_norm": 0.16615127167841817, "learning_rate": 6.143272060019826e-05, "loss": 0.3532, "step": 1879 }, { "epoch": 0.48427085681166887, "grad_norm": 0.19432644344268593, "learning_rate": 6.138893750358212e-05, "loss": 0.3366, "step": 1880 }, { "epoch": 0.48427085681166887, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8452380952380952, "eval_PRM F1 AUC": 0.6233630172865374, "eval_PRM F1 AUC (fixed)": 0.8074908328968046, "eval_PRM F1 Neg": 0.4090909090909091, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8352941176470589, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.47665128111839294, "eval_runtime": 16.9485, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 1880 }, { "epoch": 0.48452844769295167, "grad_norm": 0.12137651310296427, "learning_rate": 6.134514519429089e-05, "loss": 0.3158, "step": 1881 }, { "epoch": 0.48478603857423447, "grad_norm": 0.22609134483050833, "learning_rate": 6.130134370774881e-05, "loss": 0.4057, "step": 1882 }, { "epoch": 0.48504362945551727, "grad_norm": 0.22727092725357212, "learning_rate": 6.125753307938754e-05, "loss": 0.4377, "step": 1883 }, { "epoch": 0.48530122033680007, "grad_norm": 0.13675430050212425, "learning_rate": 6.12137133446461e-05, "loss": 0.3682, "step": 1884 }, { "epoch": 0.48555881121808286, "grad_norm": 0.14736923323041065, "learning_rate": 6.11698845389709e-05, "loss": 0.3221, "step": 1885 }, { "epoch": 0.48555881121808286, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.8077527501309586, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4603160619735718, "eval_runtime": 17.5576, "eval_samples_per_second": 2.506, "eval_steps_per_second": 0.171, "step": 1885 }, { "epoch": 0.48581640209936566, "grad_norm": 0.14731688432873322, "learning_rate": 6.112604669781572e-05, "loss": 0.3505, "step": 1886 }, { "epoch": 0.48607399298064846, "grad_norm": 0.13432445612157262, "learning_rate": 6.108219985664161e-05, "loss": 0.2912, "step": 1887 }, { "epoch": 0.48633158386193126, "grad_norm": 0.13238379329614677, "learning_rate": 6.103834405091689e-05, "loss": 0.3924, "step": 1888 }, { "epoch": 0.4865891747432141, "grad_norm": 0.15207481153619506, "learning_rate": 6.099447931611716e-05, "loss": 0.3241, "step": 1889 }, { "epoch": 0.4868467656244969, "grad_norm": 0.14686120579558493, "learning_rate": 6.095060568772524e-05, "loss": 0.3676, "step": 1890 }, { "epoch": 0.4868467656244969, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.7980618124672604, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.47567471861839294, "eval_runtime": 17.0825, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 1890 }, { "epoch": 0.4871043565057797, "grad_norm": 0.2205917186751997, "learning_rate": 6.090672320123113e-05, "loss": 0.488, "step": 1891 }, { "epoch": 0.4873619473870625, "grad_norm": 0.15522284421635085, "learning_rate": 6.0862831892132025e-05, "loss": 0.3853, "step": 1892 }, { "epoch": 0.4876195382683453, "grad_norm": 0.10600381147303754, "learning_rate": 6.081893179593221e-05, "loss": 0.2968, "step": 1893 }, { "epoch": 0.4878771291496281, "grad_norm": 0.1382675031186188, "learning_rate": 6.0775022948143115e-05, "loss": 0.358, "step": 1894 }, { "epoch": 0.4881347200309109, "grad_norm": 0.18137556768938917, "learning_rate": 6.0731105384283214e-05, "loss": 0.4209, "step": 1895 }, { "epoch": 0.4881347200309109, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.788108957569408, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4661754369735718, "eval_runtime": 17.0425, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 1895 }, { "epoch": 0.4883923109121937, "grad_norm": 0.13771159897426713, "learning_rate": 6.0687179139878106e-05, "loss": 0.3947, "step": 1896 }, { "epoch": 0.4886499017934765, "grad_norm": 0.1365985958729311, "learning_rate": 6.064324425046029e-05, "loss": 0.3813, "step": 1897 }, { "epoch": 0.4889074926747593, "grad_norm": 0.18836759015704257, "learning_rate": 6.059930075156941e-05, "loss": 0.4904, "step": 1898 }, { "epoch": 0.4891650835560421, "grad_norm": 0.18865752544500874, "learning_rate": 6.055534867875193e-05, "loss": 0.4033, "step": 1899 }, { "epoch": 0.4894226744373249, "grad_norm": 0.15807404428530847, "learning_rate": 6.051138806756136e-05, "loss": 0.3856, "step": 1900 }, { "epoch": 0.4894226744373249, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.7881089575694081, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.458984375, "eval_runtime": 16.8432, "eval_samples_per_second": 2.612, "eval_steps_per_second": 0.178, "step": 1900 }, { "epoch": 0.4896802653186077, "grad_norm": 0.16498572593371158, "learning_rate": 6.046741895355802e-05, "loss": 0.3298, "step": 1901 }, { "epoch": 0.4899378561998905, "grad_norm": 0.16496002269331, "learning_rate": 6.0423441372309185e-05, "loss": 0.3355, "step": 1902 }, { "epoch": 0.49019544708117335, "grad_norm": 0.1353754987800334, "learning_rate": 6.037945535938896e-05, "loss": 0.3683, "step": 1903 }, { "epoch": 0.49045303796245615, "grad_norm": 0.2546450671093939, "learning_rate": 6.033546095037824e-05, "loss": 0.3935, "step": 1904 }, { "epoch": 0.49071062884373895, "grad_norm": 0.192423048731162, "learning_rate": 6.0291458180864745e-05, "loss": 0.4125, "step": 1905 }, { "epoch": 0.49071062884373895, "eval_PRM Accuracy": 0.7547169811320755, "eval_PRM F1": 0.8452380952380952, "eval_PRM F1 AUC": 0.6233630172865374, "eval_PRM F1 AUC (fixed)": 0.8022524882137245, "eval_PRM F1 Neg": 0.4090909090909091, "eval_PRM NPV": 0.42857142857142855, "eval_PRM Precision": 0.8352941176470589, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4691939055919647, "eval_runtime": 17.5332, "eval_samples_per_second": 2.51, "eval_steps_per_second": 0.171, "step": 1905 }, { "epoch": 0.49096821972502175, "grad_norm": 0.15294667916102211, "learning_rate": 6.0247447086442975e-05, "loss": 0.386, "step": 1906 }, { "epoch": 0.49122581060630455, "grad_norm": 0.13710552338120335, "learning_rate": 6.0203427702714085e-05, "loss": 0.3593, "step": 1907 }, { "epoch": 0.49148340148758735, "grad_norm": 0.1145330933636216, "learning_rate": 6.015940006528602e-05, "loss": 0.3039, "step": 1908 }, { "epoch": 0.49174099236887014, "grad_norm": 0.16101169209821084, "learning_rate": 6.011536420977336e-05, "loss": 0.4458, "step": 1909 }, { "epoch": 0.49199858325015294, "grad_norm": 0.13725289928583728, "learning_rate": 6.0071320171797326e-05, "loss": 0.3665, "step": 1910 }, { "epoch": 0.49199858325015294, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8114195914091147, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4485973119735718, "eval_runtime": 17.4418, "eval_samples_per_second": 2.523, "eval_steps_per_second": 0.172, "step": 1910 }, { "epoch": 0.49225617413143574, "grad_norm": 0.12761197608676197, "learning_rate": 6.00272679869858e-05, "loss": 0.3322, "step": 1911 }, { "epoch": 0.49251376501271854, "grad_norm": 0.13594699011191508, "learning_rate": 5.998320769097321e-05, "loss": 0.4131, "step": 1912 }, { "epoch": 0.49277135589400134, "grad_norm": 0.14825317977677996, "learning_rate": 5.993913931940058e-05, "loss": 0.3784, "step": 1913 }, { "epoch": 0.49302894677528414, "grad_norm": 0.1467928278028728, "learning_rate": 5.9895062907915424e-05, "loss": 0.428, "step": 1914 }, { "epoch": 0.49328653765656694, "grad_norm": 0.21914650981144246, "learning_rate": 5.9850978492171794e-05, "loss": 0.4496, "step": 1915 }, { "epoch": 0.49328653765656694, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 AUC (fixed)": 0.8143006809848088, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4365234375, "eval_runtime": 17.7023, "eval_samples_per_second": 2.486, "eval_steps_per_second": 0.169, "step": 1915 }, { "epoch": 0.49354412853784974, "grad_norm": 0.12123771016240374, "learning_rate": 5.9806886107830194e-05, "loss": 0.2823, "step": 1916 }, { "epoch": 0.4938017194191326, "grad_norm": 0.15649592707057203, "learning_rate": 5.976278579055762e-05, "loss": 0.3649, "step": 1917 }, { "epoch": 0.4940593103004154, "grad_norm": 0.13459266337832734, "learning_rate": 5.971867757602742e-05, "loss": 0.3433, "step": 1918 }, { "epoch": 0.4943169011816982, "grad_norm": 0.15280221083736026, "learning_rate": 5.967456149991938e-05, "loss": 0.4225, "step": 1919 }, { "epoch": 0.494574492062981, "grad_norm": 0.16801780504792357, "learning_rate": 5.963043759791962e-05, "loss": 0.4129, "step": 1920 }, { "epoch": 0.494574492062981, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 AUC (fixed)": 0.8171817705605029, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.43838778138160706, "eval_runtime": 17.5347, "eval_samples_per_second": 2.509, "eval_steps_per_second": 0.171, "step": 1920 }, { "epoch": 0.4948320829442638, "grad_norm": 0.15563907511648944, "learning_rate": 5.958630590572061e-05, "loss": 0.3958, "step": 1921 }, { "epoch": 0.4950896738255466, "grad_norm": 0.161858188045907, "learning_rate": 5.954216645902109e-05, "loss": 0.3563, "step": 1922 }, { "epoch": 0.4953472647068294, "grad_norm": 0.20912967805389057, "learning_rate": 5.94980192935261e-05, "loss": 0.4026, "step": 1923 }, { "epoch": 0.4956048555881122, "grad_norm": 0.15930626634598105, "learning_rate": 5.9453864444946914e-05, "loss": 0.4682, "step": 1924 }, { "epoch": 0.495862446469395, "grad_norm": 0.13931203069182932, "learning_rate": 5.940970194900104e-05, "loss": 0.359, "step": 1925 }, { "epoch": 0.495862446469395, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.8255631220534312, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4365234375, "eval_runtime": 17.5563, "eval_samples_per_second": 2.506, "eval_steps_per_second": 0.171, "step": 1925 }, { "epoch": 0.4961200373506778, "grad_norm": 0.1416943075377075, "learning_rate": 5.9365531841412136e-05, "loss": 0.3485, "step": 1926 }, { "epoch": 0.4963776282319606, "grad_norm": 0.28506554313722937, "learning_rate": 5.932135415791003e-05, "loss": 0.5544, "step": 1927 }, { "epoch": 0.4966352191132434, "grad_norm": 0.16545301078309305, "learning_rate": 5.927716893423071e-05, "loss": 0.3788, "step": 1928 }, { "epoch": 0.4968928099945262, "grad_norm": 0.18988998641449575, "learning_rate": 5.923297620611623e-05, "loss": 0.4567, "step": 1929 }, { "epoch": 0.497150400875809, "grad_norm": 0.20856083305897258, "learning_rate": 5.9188776009314705e-05, "loss": 0.4678, "step": 1930 }, { "epoch": 0.497150400875809, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 AUC (fixed)": 0.822420115243583, "eval_PRM F1 Neg": 0.45, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4501953125, "eval_runtime": 16.9478, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 1930 }, { "epoch": 0.49740799175709177, "grad_norm": 0.1308991500439859, "learning_rate": 5.914456837958032e-05, "loss": 0.393, "step": 1931 }, { "epoch": 0.4976655826383746, "grad_norm": 0.12028420107283791, "learning_rate": 5.9100353352673266e-05, "loss": 0.2775, "step": 1932 }, { "epoch": 0.4979231735196574, "grad_norm": 0.1460604813485323, "learning_rate": 5.905613096435971e-05, "loss": 0.3026, "step": 1933 }, { "epoch": 0.4981807644009402, "grad_norm": 0.170967236562453, "learning_rate": 5.9011901250411785e-05, "loss": 0.3929, "step": 1934 }, { "epoch": 0.498438355282223, "grad_norm": 0.22162553086457643, "learning_rate": 5.8967664246607526e-05, "loss": 0.3777, "step": 1935 }, { "epoch": 0.498438355282223, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.820062860136197, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.44034090638160706, "eval_runtime": 17.0145, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 1935 }, { "epoch": 0.4986959461635058, "grad_norm": 0.11180571869366931, "learning_rate": 5.892341998873089e-05, "loss": 0.3183, "step": 1936 }, { "epoch": 0.4989535370447886, "grad_norm": 0.16338673236488335, "learning_rate": 5.887916851257167e-05, "loss": 0.4321, "step": 1937 }, { "epoch": 0.4992111279260714, "grad_norm": 0.13180596103435183, "learning_rate": 5.8834909853925565e-05, "loss": 0.3605, "step": 1938 }, { "epoch": 0.4994687188073542, "grad_norm": 0.14767783669678966, "learning_rate": 5.8790644048594e-05, "loss": 0.4043, "step": 1939 }, { "epoch": 0.499726309688637, "grad_norm": 0.18269521671133876, "learning_rate": 5.874637113238426e-05, "loss": 0.4947, "step": 1940 }, { "epoch": 0.499726309688637, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8554216867469879, "eval_PRM F1 AUC": 0.6668412781561027, "eval_PRM F1 AUC (fixed)": 0.822943949711891, "eval_PRM F1 Neg": 0.4782608695652174, "eval_PRM NPV": 0.4782608695652174, "eval_PRM Precision": 0.8554216867469879, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42862215638160706, "eval_runtime": 17.1451, "eval_samples_per_second": 2.566, "eval_steps_per_second": 0.175, "step": 1940 }, { "epoch": 0.4999839005699198, "grad_norm": 0.12780521010355875, "learning_rate": 5.8702091141109296e-05, "loss": 0.3328, "step": 1941 }, { "epoch": 0.5002414914512027, "grad_norm": 0.16293512861501297, "learning_rate": 5.865780411058785e-05, "loss": 0.4396, "step": 1942 }, { "epoch": 0.5004990823324854, "grad_norm": 0.187124685628023, "learning_rate": 5.861351007664434e-05, "loss": 0.408, "step": 1943 }, { "epoch": 0.5007566732137683, "grad_norm": 0.13968885089567415, "learning_rate": 5.856920907510886e-05, "loss": 0.349, "step": 1944 }, { "epoch": 0.501014264095051, "grad_norm": 0.12969934987202722, "learning_rate": 5.852490114181709e-05, "loss": 0.307, "step": 1945 }, { "epoch": 0.501014264095051, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8245154531168152, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.43625709414482117, "eval_runtime": 17.7387, "eval_samples_per_second": 2.48, "eval_steps_per_second": 0.169, "step": 1945 }, { "epoch": 0.5012718549763339, "grad_norm": 0.11683053442116902, "learning_rate": 5.848058631261038e-05, "loss": 0.3215, "step": 1946 }, { "epoch": 0.5015294458576166, "grad_norm": 0.19077931962464129, "learning_rate": 5.8436264623335635e-05, "loss": 0.3159, "step": 1947 }, { "epoch": 0.5017870367388995, "grad_norm": 0.140771208365144, "learning_rate": 5.8391936109845304e-05, "loss": 0.3791, "step": 1948 }, { "epoch": 0.5020446276201822, "grad_norm": 0.12208501363727582, "learning_rate": 5.8347600807997336e-05, "loss": 0.3323, "step": 1949 }, { "epoch": 0.5023022185014651, "grad_norm": 0.2896596869767316, "learning_rate": 5.83032587536552e-05, "loss": 0.5041, "step": 1950 }, { "epoch": 0.5023022185014651, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8357778941854375, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4896129369735718, "eval_runtime": 16.6496, "eval_samples_per_second": 2.643, "eval_steps_per_second": 0.18, "step": 1950 }, { "epoch": 0.5025598093827478, "grad_norm": 0.3013914876754927, "learning_rate": 5.825890998268784e-05, "loss": 0.5287, "step": 1951 }, { "epoch": 0.5028174002640307, "grad_norm": 0.1413255877889976, "learning_rate": 5.82145545309696e-05, "loss": 0.3779, "step": 1952 }, { "epoch": 0.5030749911453135, "grad_norm": 0.146203035699714, "learning_rate": 5.8170192434380246e-05, "loss": 0.3789, "step": 1953 }, { "epoch": 0.5033325820265963, "grad_norm": 0.15748991732232986, "learning_rate": 5.812582372880491e-05, "loss": 0.3972, "step": 1954 }, { "epoch": 0.5035901729078791, "grad_norm": 0.13917280006553007, "learning_rate": 5.808144845013408e-05, "loss": 0.3149, "step": 1955 }, { "epoch": 0.5035901729078791, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8281822943949713, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4453125, "eval_runtime": 17.6844, "eval_samples_per_second": 2.488, "eval_steps_per_second": 0.17, "step": 1955 }, { "epoch": 0.5038477637891619, "grad_norm": 0.15012143889938592, "learning_rate": 5.803706663426355e-05, "loss": 0.3278, "step": 1956 }, { "epoch": 0.5041053546704447, "grad_norm": 0.12867356737210414, "learning_rate": 5.799267831709442e-05, "loss": 0.3751, "step": 1957 }, { "epoch": 0.5043629455517274, "grad_norm": 0.13125135700394105, "learning_rate": 5.794828353453301e-05, "loss": 0.3842, "step": 1958 }, { "epoch": 0.5046205364330103, "grad_norm": 0.15309055758164059, "learning_rate": 5.790388232249093e-05, "loss": 0.4175, "step": 1959 }, { "epoch": 0.504878127314293, "grad_norm": 0.129610758070974, "learning_rate": 5.785947471688495e-05, "loss": 0.3596, "step": 1960 }, { "epoch": 0.504878127314293, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8674698795180723, "eval_PRM F1 AUC": 0.6946045049764275, "eval_PRM F1 AUC (fixed)": 0.820062860136197, "eval_PRM F1 Neg": 0.5217391304347826, "eval_PRM NPV": 0.5217391304347826, "eval_PRM Precision": 0.8674698795180723, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.42507103085517883, "eval_runtime": 16.9759, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 1960 }, { "epoch": 0.5051357181955759, "grad_norm": 0.15629740811532955, "learning_rate": 5.781506075363702e-05, "loss": 0.4322, "step": 1961 }, { "epoch": 0.5053933090768586, "grad_norm": 0.12215444800160688, "learning_rate": 5.77706404686742e-05, "loss": 0.3787, "step": 1962 }, { "epoch": 0.5056508999581415, "grad_norm": 0.13624586074228046, "learning_rate": 5.772621389792875e-05, "loss": 0.3568, "step": 1963 }, { "epoch": 0.5059084908394242, "grad_norm": 0.14674881137528345, "learning_rate": 5.7681781077337905e-05, "loss": 0.4109, "step": 1964 }, { "epoch": 0.5061660817207071, "grad_norm": 0.19306126347480176, "learning_rate": 5.7637342042844064e-05, "loss": 0.3879, "step": 1965 }, { "epoch": 0.5061660817207071, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 AUC (fixed)": 0.8234677841801991, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4174360930919647, "eval_runtime": 17.6498, "eval_samples_per_second": 2.493, "eval_steps_per_second": 0.17, "step": 1965 }, { "epoch": 0.5064236726019898, "grad_norm": 0.1719789405625014, "learning_rate": 5.759289683039458e-05, "loss": 0.4188, "step": 1966 }, { "epoch": 0.5066812634832727, "grad_norm": 0.1464825068242375, "learning_rate": 5.754844547594181e-05, "loss": 0.3648, "step": 1967 }, { "epoch": 0.5069388543645555, "grad_norm": 0.1899320668759184, "learning_rate": 5.75039880154431e-05, "loss": 0.3859, "step": 1968 }, { "epoch": 0.5071964452458383, "grad_norm": 0.12342909376743207, "learning_rate": 5.745952448486074e-05, "loss": 0.3733, "step": 1969 }, { "epoch": 0.5074540361271211, "grad_norm": 0.11259505244678272, "learning_rate": 5.7415054920161916e-05, "loss": 0.3534, "step": 1970 }, { "epoch": 0.5074540361271211, "eval_PRM Accuracy": 0.7641509433962265, "eval_PRM F1": 0.8502994011976048, "eval_PRM F1 AUC": 0.6451021477213201, "eval_PRM F1 AUC (fixed)": 0.8292299633315872, "eval_PRM F1 Neg": 0.4444444444444444, "eval_PRM NPV": 0.45454545454545453, "eval_PRM Precision": 0.8452380952380952, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4215198755264282, "eval_runtime": 17.4164, "eval_samples_per_second": 2.526, "eval_steps_per_second": 0.172, "step": 1970 }, { "epoch": 0.5077116270084039, "grad_norm": 0.21219806715524042, "learning_rate": 5.737057935731868e-05, "loss": 0.3616, "step": 1971 }, { "epoch": 0.5079692178896867, "grad_norm": 0.1421431629435897, "learning_rate": 5.732609783230797e-05, "loss": 0.3438, "step": 1972 }, { "epoch": 0.5082268087709695, "grad_norm": 0.13481355771250744, "learning_rate": 5.728161038111151e-05, "loss": 0.3484, "step": 1973 }, { "epoch": 0.5084843996522523, "grad_norm": 0.17048488533693024, "learning_rate": 5.723711703971588e-05, "loss": 0.3526, "step": 1974 }, { "epoch": 0.5087419905335351, "grad_norm": 0.1679749446042187, "learning_rate": 5.719261784411233e-05, "loss": 0.3984, "step": 1975 }, { "epoch": 0.5087419905335351, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 AUC (fixed)": 0.8376113148245153, "eval_PRM F1 Neg": 0.45, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4565873444080353, "eval_runtime": 16.5827, "eval_samples_per_second": 2.653, "eval_steps_per_second": 0.181, "step": 1975 }, { "epoch": 0.5089995814148179, "grad_norm": 0.2553390380469135, "learning_rate": 5.714811283029694e-05, "loss": 0.3878, "step": 1976 }, { "epoch": 0.5092571722961007, "grad_norm": 0.2161027084909971, "learning_rate": 5.710360203427043e-05, "loss": 0.3672, "step": 1977 }, { "epoch": 0.5095147631773835, "grad_norm": 0.1767957482547596, "learning_rate": 5.705908549203823e-05, "loss": 0.4114, "step": 1978 }, { "epoch": 0.5097723540586663, "grad_norm": 0.17507526801820886, "learning_rate": 5.701456323961042e-05, "loss": 0.3211, "step": 1979 }, { "epoch": 0.5100299449399491, "grad_norm": 0.14048278539458697, "learning_rate": 5.697003531300168e-05, "loss": 0.409, "step": 1980 }, { "epoch": 0.5100299449399491, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8297537977998952, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42356178164482117, "eval_runtime": 17.4379, "eval_samples_per_second": 2.523, "eval_steps_per_second": 0.172, "step": 1980 }, { "epoch": 0.5102875358212319, "grad_norm": 0.13573346631581343, "learning_rate": 5.692550174823129e-05, "loss": 0.3049, "step": 1981 }, { "epoch": 0.5105451267025147, "grad_norm": 0.17256451638062034, "learning_rate": 5.688096258132309e-05, "loss": 0.4616, "step": 1982 }, { "epoch": 0.5108027175837976, "grad_norm": 0.14297936717120371, "learning_rate": 5.6836417848305445e-05, "loss": 0.3963, "step": 1983 }, { "epoch": 0.5110603084650803, "grad_norm": 0.16522445090515758, "learning_rate": 5.6791867585211245e-05, "loss": 0.3736, "step": 1984 }, { "epoch": 0.5113178993463632, "grad_norm": 0.20338430664367346, "learning_rate": 5.674731182807781e-05, "loss": 0.4374, "step": 1985 }, { "epoch": 0.5113178993463632, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.821896280775275, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4228515625, "eval_runtime": 17.094, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.176, "step": 1985 }, { "epoch": 0.5115754902276459, "grad_norm": 0.12999984950500315, "learning_rate": 5.670275061294696e-05, "loss": 0.369, "step": 1986 }, { "epoch": 0.5118330811089288, "grad_norm": 0.1743338760043219, "learning_rate": 5.665818397586491e-05, "loss": 0.3906, "step": 1987 }, { "epoch": 0.5120906719902115, "grad_norm": 0.17552756964416863, "learning_rate": 5.6613611952882216e-05, "loss": 0.3259, "step": 1988 }, { "epoch": 0.5123482628714944, "grad_norm": 0.15397181421495884, "learning_rate": 5.656903458005385e-05, "loss": 0.3102, "step": 1989 }, { "epoch": 0.5126058537527771, "grad_norm": 0.15257446918957543, "learning_rate": 5.652445189343908e-05, "loss": 0.3983, "step": 1990 }, { "epoch": 0.5126058537527771, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.872093023255814, "eval_PRM F1 AUC": 0.6474594028287062, "eval_PRM F1 AUC (fixed)": 0.8323729701414353, "eval_PRM F1 Neg": 0.45, "eval_PRM NPV": 0.5294117647058824, "eval_PRM Precision": 0.8426966292134831, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4441583752632141, "eval_runtime": 17.6125, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 1990 }, { "epoch": 0.51286344463406, "grad_norm": 0.1409169791761317, "learning_rate": 5.6479863929101495e-05, "loss": 0.3922, "step": 1991 }, { "epoch": 0.5131210355153427, "grad_norm": 0.21740111372028942, "learning_rate": 5.643527072310891e-05, "loss": 0.425, "step": 1992 }, { "epoch": 0.5133786263966256, "grad_norm": 0.20517451234564513, "learning_rate": 5.639067231153345e-05, "loss": 0.4261, "step": 1993 }, { "epoch": 0.5136362172779083, "grad_norm": 0.2468330127772893, "learning_rate": 5.6346068730451396e-05, "loss": 0.4681, "step": 1994 }, { "epoch": 0.5138938081591912, "grad_norm": 0.19741523047466086, "learning_rate": 5.630146001594322e-05, "loss": 0.3992, "step": 1995 }, { "epoch": 0.5138938081591912, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8410162388685175, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4351917505264282, "eval_runtime": 17.2154, "eval_samples_per_second": 2.556, "eval_steps_per_second": 0.174, "step": 1995 }, { "epoch": 0.514151399040474, "grad_norm": 0.12890551397792285, "learning_rate": 5.625684620409353e-05, "loss": 0.3135, "step": 1996 }, { "epoch": 0.5144089899217568, "grad_norm": 0.11251994352966652, "learning_rate": 5.621222733099112e-05, "loss": 0.3119, "step": 1997 }, { "epoch": 0.5146665808030396, "grad_norm": 0.1448278326162604, "learning_rate": 5.61676034327288e-05, "loss": 0.3976, "step": 1998 }, { "epoch": 0.5149241716843224, "grad_norm": 0.1406071916187269, "learning_rate": 5.612297454540352e-05, "loss": 0.3249, "step": 1999 }, { "epoch": 0.5151817625656052, "grad_norm": 0.16046673155981866, "learning_rate": 5.607834070511619e-05, "loss": 0.3727, "step": 2000 }, { "epoch": 0.5151817625656052, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8420639078051336, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4142400622367859, "eval_runtime": 17.779, "eval_samples_per_second": 2.475, "eval_steps_per_second": 0.169, "step": 2000 }, { "epoch": 0.515439353446888, "grad_norm": 0.1576943422442954, "learning_rate": 5.6033701947971805e-05, "loss": 0.3773, "step": 2001 }, { "epoch": 0.5156969443281708, "grad_norm": 0.1874952534596437, "learning_rate": 5.5989058310079254e-05, "loss": 0.4354, "step": 2002 }, { "epoch": 0.5159545352094536, "grad_norm": 0.13372880522852698, "learning_rate": 5.594440982755146e-05, "loss": 0.3232, "step": 2003 }, { "epoch": 0.5162121260907364, "grad_norm": 0.1514057779131614, "learning_rate": 5.589975653650516e-05, "loss": 0.311, "step": 2004 }, { "epoch": 0.5164697169720192, "grad_norm": 0.20948284439508877, "learning_rate": 5.585509847306112e-05, "loss": 0.4186, "step": 2005 }, { "epoch": 0.5164697169720192, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8331587218438974, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4187677502632141, "eval_runtime": 17.0341, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 2005 }, { "epoch": 0.516727307853302, "grad_norm": 0.15092735579258332, "learning_rate": 5.581043567334383e-05, "loss": 0.394, "step": 2006 }, { "epoch": 0.5169848987345848, "grad_norm": 0.14426891302448921, "learning_rate": 5.576576817348169e-05, "loss": 0.3616, "step": 2007 }, { "epoch": 0.5172424896158676, "grad_norm": 0.19486454565642172, "learning_rate": 5.5721096009606885e-05, "loss": 0.3272, "step": 2008 }, { "epoch": 0.5175000804971503, "grad_norm": 0.19109979412742129, "learning_rate": 5.567641921785537e-05, "loss": 0.4214, "step": 2009 }, { "epoch": 0.5177576713784332, "grad_norm": 0.15701301563469852, "learning_rate": 5.5631737834366836e-05, "loss": 0.3289, "step": 2010 }, { "epoch": 0.5177576713784332, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8606060606060606, "eval_PRM F1 AUC": 0.6885804085908852, "eval_PRM F1 AUC (fixed)": 0.8389209009952854, "eval_PRM F1 Neg": 0.5106382978723404, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8658536585365854, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4164595305919647, "eval_runtime": 17.4099, "eval_samples_per_second": 2.527, "eval_steps_per_second": 0.172, "step": 2010 }, { "epoch": 0.5180152622597161, "grad_norm": 0.12605676343069108, "learning_rate": 5.5587051895284695e-05, "loss": 0.3397, "step": 2011 }, { "epoch": 0.5182728531409988, "grad_norm": 0.1824585228760495, "learning_rate": 5.554236143675605e-05, "loss": 0.3743, "step": 2012 }, { "epoch": 0.5185304440222817, "grad_norm": 0.20069764307974666, "learning_rate": 5.5497666494931654e-05, "loss": 0.4296, "step": 2013 }, { "epoch": 0.5187880349035644, "grad_norm": 0.1403249954553184, "learning_rate": 5.5452967105965904e-05, "loss": 0.3772, "step": 2014 }, { "epoch": 0.5190456257848473, "grad_norm": 0.15452067087473162, "learning_rate": 5.5408263306016736e-05, "loss": 0.4272, "step": 2015 }, { "epoch": 0.5190456257848473, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8470403352540596, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4115767180919647, "eval_runtime": 17.1613, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 2015 }, { "epoch": 0.51930321666613, "grad_norm": 0.17455468940712443, "learning_rate": 5.536355513124574e-05, "loss": 0.3338, "step": 2016 }, { "epoch": 0.5195608075474129, "grad_norm": 0.2010758514492215, "learning_rate": 5.531884261781797e-05, "loss": 0.4625, "step": 2017 }, { "epoch": 0.5198183984286956, "grad_norm": 0.16226773402413, "learning_rate": 5.527412580190203e-05, "loss": 0.3552, "step": 2018 }, { "epoch": 0.5200759893099784, "grad_norm": 0.156114481596148, "learning_rate": 5.5229404719669984e-05, "loss": 0.3447, "step": 2019 }, { "epoch": 0.5203335801912612, "grad_norm": 0.182267158691678, "learning_rate": 5.518467940729739e-05, "loss": 0.443, "step": 2020 }, { "epoch": 0.5203335801912612, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.853850183342064, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4057173430919647, "eval_runtime": 17.0622, "eval_samples_per_second": 2.579, "eval_steps_per_second": 0.176, "step": 2020 }, { "epoch": 0.520591171072544, "grad_norm": 0.1405859308577178, "learning_rate": 5.5139949900963174e-05, "loss": 0.3475, "step": 2021 }, { "epoch": 0.5208487619538268, "grad_norm": 0.12624673647873447, "learning_rate": 5.509521623684968e-05, "loss": 0.3363, "step": 2022 }, { "epoch": 0.5211063528351096, "grad_norm": 0.11565588606367397, "learning_rate": 5.5050478451142586e-05, "loss": 0.3585, "step": 2023 }, { "epoch": 0.5213639437163924, "grad_norm": 0.21176890439543344, "learning_rate": 5.5005736580030963e-05, "loss": 0.3405, "step": 2024 }, { "epoch": 0.5216215345976752, "grad_norm": 0.1317224767338869, "learning_rate": 5.4960990659707136e-05, "loss": 0.3619, "step": 2025 }, { "epoch": 0.5216215345976752, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8501833420639078, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4074041247367859, "eval_runtime": 17.0383, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 2025 }, { "epoch": 0.5218791254789581, "grad_norm": 0.11847577493241711, "learning_rate": 5.491624072636674e-05, "loss": 0.297, "step": 2026 }, { "epoch": 0.5221367163602408, "grad_norm": 0.17280346995987633, "learning_rate": 5.487148681620862e-05, "loss": 0.4082, "step": 2027 }, { "epoch": 0.5223943072415237, "grad_norm": 0.17084021311446107, "learning_rate": 5.482672896543487e-05, "loss": 0.4101, "step": 2028 }, { "epoch": 0.5226518981228064, "grad_norm": 0.13621840520116943, "learning_rate": 5.478196721025073e-05, "loss": 0.3993, "step": 2029 }, { "epoch": 0.5229094890040893, "grad_norm": 0.13117663910236727, "learning_rate": 5.4737201586864675e-05, "loss": 0.3307, "step": 2030 }, { "epoch": 0.5229094890040893, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8407543216343635, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.39719459414482117, "eval_runtime": 16.8682, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 2030 }, { "epoch": 0.523167079885372, "grad_norm": 0.1383710235225394, "learning_rate": 5.469243213148822e-05, "loss": 0.3639, "step": 2031 }, { "epoch": 0.5234246707666549, "grad_norm": 0.15304363860482864, "learning_rate": 5.464765888033602e-05, "loss": 0.3882, "step": 2032 }, { "epoch": 0.5236822616479376, "grad_norm": 0.15212229570341806, "learning_rate": 5.460288186962583e-05, "loss": 0.3878, "step": 2033 }, { "epoch": 0.5239398525292205, "grad_norm": 0.13839664274067834, "learning_rate": 5.455810113557839e-05, "loss": 0.3708, "step": 2034 }, { "epoch": 0.5241974434105032, "grad_norm": 0.17316272691860943, "learning_rate": 5.451331671441751e-05, "loss": 0.4628, "step": 2035 }, { "epoch": 0.5241974434105032, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8423258250392878, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.39151278138160706, "eval_runtime": 16.9123, "eval_samples_per_second": 2.602, "eval_steps_per_second": 0.177, "step": 2035 }, { "epoch": 0.5244550342917861, "grad_norm": 0.14489451523876312, "learning_rate": 5.446852864236991e-05, "loss": 0.3221, "step": 2036 }, { "epoch": 0.5247126251730688, "grad_norm": 0.1988766080619215, "learning_rate": 5.442373695566534e-05, "loss": 0.4659, "step": 2037 }, { "epoch": 0.5249702160543517, "grad_norm": 0.1389776176471604, "learning_rate": 5.437894169053641e-05, "loss": 0.3277, "step": 2038 }, { "epoch": 0.5252278069356345, "grad_norm": 0.17073375948781336, "learning_rate": 5.4334142883218676e-05, "loss": 0.4109, "step": 2039 }, { "epoch": 0.5254853978169173, "grad_norm": 0.15091599719834037, "learning_rate": 5.428934056995052e-05, "loss": 0.3377, "step": 2040 }, { "epoch": 0.5254853978169173, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8386589837611316, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4031427502632141, "eval_runtime": 17.5676, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 2040 }, { "epoch": 0.5257429886982001, "grad_norm": 0.1726553264575567, "learning_rate": 5.4244534786973214e-05, "loss": 0.3972, "step": 2041 }, { "epoch": 0.5260005795794829, "grad_norm": 0.12642039827318133, "learning_rate": 5.4199725570530735e-05, "loss": 0.3027, "step": 2042 }, { "epoch": 0.5262581704607657, "grad_norm": 0.15104989331276478, "learning_rate": 5.415491295686995e-05, "loss": 0.4181, "step": 2043 }, { "epoch": 0.5265157613420485, "grad_norm": 0.23276158945096306, "learning_rate": 5.411009698224041e-05, "loss": 0.4327, "step": 2044 }, { "epoch": 0.5267733522233313, "grad_norm": 0.14805946848268564, "learning_rate": 5.406527768289441e-05, "loss": 0.3166, "step": 2045 }, { "epoch": 0.5267733522233313, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8418019905709795, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4216974377632141, "eval_runtime": 17.5049, "eval_samples_per_second": 2.514, "eval_steps_per_second": 0.171, "step": 2045 }, { "epoch": 0.5270309431046141, "grad_norm": 0.13143827483675186, "learning_rate": 5.402045509508692e-05, "loss": 0.3572, "step": 2046 }, { "epoch": 0.5272885339858969, "grad_norm": 0.1575077674791195, "learning_rate": 5.3975629255075554e-05, "loss": 0.2465, "step": 2047 }, { "epoch": 0.5275461248671797, "grad_norm": 0.2740141779719599, "learning_rate": 5.3930800199120616e-05, "loss": 0.4939, "step": 2048 }, { "epoch": 0.5278037157484625, "grad_norm": 0.18515637996824869, "learning_rate": 5.388596796348494e-05, "loss": 0.4005, "step": 2049 }, { "epoch": 0.5280613066297453, "grad_norm": 0.17690785782001883, "learning_rate": 5.3841132584433986e-05, "loss": 0.3552, "step": 2050 }, { "epoch": 0.5280613066297453, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8404924044002096, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4098011255264282, "eval_runtime": 17.0428, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 2050 }, { "epoch": 0.5283188975110281, "grad_norm": 0.14716600331952415, "learning_rate": 5.379629409823571e-05, "loss": 0.3991, "step": 2051 }, { "epoch": 0.5285764883923109, "grad_norm": 0.1572104453485029, "learning_rate": 5.375145254116065e-05, "loss": 0.3503, "step": 2052 }, { "epoch": 0.5288340792735937, "grad_norm": 0.14391001387350164, "learning_rate": 5.3706607949481736e-05, "loss": 0.3557, "step": 2053 }, { "epoch": 0.5290916701548766, "grad_norm": 0.19161756424057008, "learning_rate": 5.3661760359474446e-05, "loss": 0.3301, "step": 2054 }, { "epoch": 0.5293492610361593, "grad_norm": 0.2085656851277453, "learning_rate": 5.361690980741663e-05, "loss": 0.3831, "step": 2055 }, { "epoch": 0.5293492610361593, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.85, "eval_PRM F1 AUC": 0.7139863803038241, "eval_PRM F1 AUC (fixed)": 0.8412781561026716, "eval_PRM F1 Neg": 0.5384615384615384, "eval_PRM NPV": 0.4827586206896552, "eval_PRM Precision": 0.8831168831168831, "eval_PRM Recall": 0.8192771084337349, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.4046519994735718, "eval_runtime": 17.5267, "eval_samples_per_second": 2.51, "eval_steps_per_second": 0.171, "step": 2055 }, { "epoch": 0.5296068519174422, "grad_norm": 0.15938303163199383, "learning_rate": 5.357205632958852e-05, "loss": 0.3305, "step": 2056 }, { "epoch": 0.5298644427987249, "grad_norm": 0.1691346447226298, "learning_rate": 5.352719996227273e-05, "loss": 0.3886, "step": 2057 }, { "epoch": 0.5301220336800078, "grad_norm": 0.16082307158085632, "learning_rate": 5.348234074175428e-05, "loss": 0.3472, "step": 2058 }, { "epoch": 0.5303796245612905, "grad_norm": 0.18415935209890774, "learning_rate": 5.3437478704320375e-05, "loss": 0.3332, "step": 2059 }, { "epoch": 0.5306372154425734, "grad_norm": 0.16943370945706787, "learning_rate": 5.33926138862606e-05, "loss": 0.4161, "step": 2060 }, { "epoch": 0.5306372154425734, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.6511262441068623, "eval_PRM F1 AUC (fixed)": 0.8501833420639078, "eval_PRM F1 Neg": 0.45454545454545453, "eval_PRM NPV": 0.47619047619047616, "eval_PRM Precision": 0.8470588235294118, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.40518465638160706, "eval_runtime": 17.0928, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.176, "step": 2060 }, { "epoch": 0.5308948063238561, "grad_norm": 0.14028074670246027, "learning_rate": 5.3347746323866724e-05, "loss": 0.3035, "step": 2061 }, { "epoch": 0.531152397205139, "grad_norm": 0.32292804580343487, "learning_rate": 5.330287605343279e-05, "loss": 0.4956, "step": 2062 }, { "epoch": 0.5314099880864217, "grad_norm": 0.16444934025334107, "learning_rate": 5.325800311125497e-05, "loss": 0.3578, "step": 2063 }, { "epoch": 0.5316675789677046, "grad_norm": 0.16473755647300412, "learning_rate": 5.3213127533631666e-05, "loss": 0.3578, "step": 2064 }, { "epoch": 0.5319251698489873, "grad_norm": 0.15958162419322863, "learning_rate": 5.3168249356863354e-05, "loss": 0.4014, "step": 2065 }, { "epoch": 0.5319251698489873, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.6511262441068623, "eval_PRM F1 AUC (fixed)": 0.8543740178103719, "eval_PRM F1 Neg": 0.45454545454545453, "eval_PRM NPV": 0.47619047619047616, "eval_PRM Precision": 0.8470588235294118, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.40163353085517883, "eval_runtime": 17.0134, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 2065 }, { "epoch": 0.5321827607302702, "grad_norm": 0.20458510984275777, "learning_rate": 5.3123368617252654e-05, "loss": 0.4312, "step": 2066 }, { "epoch": 0.5324403516115529, "grad_norm": 0.17054775353840954, "learning_rate": 5.3078485351104226e-05, "loss": 0.4225, "step": 2067 }, { "epoch": 0.5326979424928358, "grad_norm": 0.16286686594336625, "learning_rate": 5.3033599594724794e-05, "loss": 0.4337, "step": 2068 }, { "epoch": 0.5329555333741186, "grad_norm": 0.13733316270492532, "learning_rate": 5.298871138442307e-05, "loss": 0.3359, "step": 2069 }, { "epoch": 0.5332131242554013, "grad_norm": 0.17278877168257112, "learning_rate": 5.294382075650981e-05, "loss": 0.4483, "step": 2070 }, { "epoch": 0.5332131242554013, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8462545835515977, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4013671875, "eval_runtime": 17.0377, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 2070 }, { "epoch": 0.5334707151366842, "grad_norm": 0.1303627564951731, "learning_rate": 5.289892774729767e-05, "loss": 0.3618, "step": 2071 }, { "epoch": 0.533728306017967, "grad_norm": 0.15467466904494062, "learning_rate": 5.285403239310123e-05, "loss": 0.3879, "step": 2072 }, { "epoch": 0.5339858968992498, "grad_norm": 0.17260775514177185, "learning_rate": 5.280913473023702e-05, "loss": 0.4635, "step": 2073 }, { "epoch": 0.5342434877805325, "grad_norm": 0.15840090883749958, "learning_rate": 5.276423479502338e-05, "loss": 0.455, "step": 2074 }, { "epoch": 0.5345010786618154, "grad_norm": 0.14397270680650293, "learning_rate": 5.271933262378054e-05, "loss": 0.3334, "step": 2075 }, { "epoch": 0.5345010786618154, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8386589837611315, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.4106889069080353, "eval_runtime": 17.5082, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 2075 }, { "epoch": 0.5347586695430981, "grad_norm": 0.12572985271208612, "learning_rate": 5.267442825283048e-05, "loss": 0.3947, "step": 2076 }, { "epoch": 0.535016260424381, "grad_norm": 0.15807576156421438, "learning_rate": 5.2629521718497e-05, "loss": 0.3851, "step": 2077 }, { "epoch": 0.5352738513056637, "grad_norm": 0.13998319009380997, "learning_rate": 5.258461305710563e-05, "loss": 0.3512, "step": 2078 }, { "epoch": 0.5355314421869466, "grad_norm": 0.12643201934729273, "learning_rate": 5.253970230498367e-05, "loss": 0.3327, "step": 2079 }, { "epoch": 0.5357890330682293, "grad_norm": 0.13128534875393535, "learning_rate": 5.249478949846004e-05, "loss": 0.4037, "step": 2080 }, { "epoch": 0.5357890330682293, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8771929824561403, "eval_PRM F1 AUC": 0.6691985332634888, "eval_PRM F1 AUC (fixed)": 0.8420639078051335, "eval_PRM F1 Neg": 0.4878048780487805, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8522727272727273, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.42604759335517883, "eval_runtime": 17.7233, "eval_samples_per_second": 2.483, "eval_steps_per_second": 0.169, "step": 2080 }, { "epoch": 0.5360466239495122, "grad_norm": 0.16721180525336535, "learning_rate": 5.2449874673865365e-05, "loss": 0.3918, "step": 2081 }, { "epoch": 0.536304214830795, "grad_norm": 0.12368253443734306, "learning_rate": 5.2404957867531876e-05, "loss": 0.3693, "step": 2082 }, { "epoch": 0.5365618057120778, "grad_norm": 0.14511735553100816, "learning_rate": 5.236003911579345e-05, "loss": 0.313, "step": 2083 }, { "epoch": 0.5368193965933606, "grad_norm": 0.14055192834613478, "learning_rate": 5.231511845498548e-05, "loss": 0.349, "step": 2084 }, { "epoch": 0.5370769874746434, "grad_norm": 0.11673532612131145, "learning_rate": 5.2270195921444954e-05, "loss": 0.3176, "step": 2085 }, { "epoch": 0.5370769874746434, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8786127167630058, "eval_PRM F1 AUC": 0.6534834992142482, "eval_PRM F1 AUC (fixed)": 0.8520167627029858, "eval_PRM F1 Neg": 0.46153846153846156, "eval_PRM NPV": 0.5625, "eval_PRM Precision": 0.8444444444444444, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.391304347826087, "eval_loss": 0.4271129369735718, "eval_runtime": 16.8752, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 2085 }, { "epoch": 0.5373345783559262, "grad_norm": 0.12488802728660602, "learning_rate": 5.2225271551510345e-05, "loss": 0.3735, "step": 2086 }, { "epoch": 0.537592169237209, "grad_norm": 0.1577739570133298, "learning_rate": 5.2180345381521626e-05, "loss": 0.3625, "step": 2087 }, { "epoch": 0.5378497601184918, "grad_norm": 0.17065952863639855, "learning_rate": 5.213541744782022e-05, "loss": 0.3356, "step": 2088 }, { "epoch": 0.5381073509997746, "grad_norm": 0.20943735287421217, "learning_rate": 5.209048778674898e-05, "loss": 0.4261, "step": 2089 }, { "epoch": 0.5383649418810574, "grad_norm": 0.281969776040582, "learning_rate": 5.204555643465215e-05, "loss": 0.518, "step": 2090 }, { "epoch": 0.5383649418810574, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8837209302325582, "eval_PRM F1 AUC": 0.6752226296490309, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5882352941176471, "eval_PRM Precision": 0.8539325842696629, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4005681872367859, "eval_runtime": 16.9796, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 2090 }, { "epoch": 0.5386225327623402, "grad_norm": 0.1156186939061372, "learning_rate": 5.200062342787534e-05, "loss": 0.3143, "step": 2091 }, { "epoch": 0.538880123643623, "grad_norm": 0.15135735675938086, "learning_rate": 5.195568880276552e-05, "loss": 0.4564, "step": 2092 }, { "epoch": 0.5391377145249058, "grad_norm": 0.16978548643168587, "learning_rate": 5.191075259567093e-05, "loss": 0.4064, "step": 2093 }, { "epoch": 0.5393953054061886, "grad_norm": 0.21282430664393118, "learning_rate": 5.1865814842941154e-05, "loss": 0.4506, "step": 2094 }, { "epoch": 0.5396528962874714, "grad_norm": 0.16778315374927444, "learning_rate": 5.1820875580926944e-05, "loss": 0.4113, "step": 2095 }, { "epoch": 0.5396528962874714, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8679245283018868, "eval_PRM F1 AUC": 0.7634887375589314, "eval_PRM F1 AUC (fixed)": 0.8470403352540598, "eval_PRM F1 Neg": 0.6037735849056604, "eval_PRM NPV": 0.5333333333333333, "eval_PRM Precision": 0.9078947368421053, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6956521739130435, "eval_loss": 0.38858309388160706, "eval_runtime": 16.9531, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 2095 }, { "epoch": 0.5399104871687542, "grad_norm": 0.16713448520362614, "learning_rate": 5.1775934845980336e-05, "loss": 0.2613, "step": 2096 }, { "epoch": 0.5401680780500371, "grad_norm": 0.20617830957458205, "learning_rate": 5.173099267445451e-05, "loss": 0.4076, "step": 2097 }, { "epoch": 0.5404256689313198, "grad_norm": 0.15584144043550646, "learning_rate": 5.1686049102703883e-05, "loss": 0.3088, "step": 2098 }, { "epoch": 0.5406832598126027, "grad_norm": 0.13971603999676588, "learning_rate": 5.1641104167083897e-05, "loss": 0.3324, "step": 2099 }, { "epoch": 0.5409408506938854, "grad_norm": 0.15170984031034837, "learning_rate": 5.1596157903951205e-05, "loss": 0.3263, "step": 2100 }, { "epoch": 0.5409408506938854, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8412781561026715, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.38352271914482117, "eval_runtime": 17.1098, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 2100 }, { "epoch": 0.5411984415751683, "grad_norm": 0.1264933633203901, "learning_rate": 5.155121034966346e-05, "loss": 0.3324, "step": 2101 }, { "epoch": 0.541456032456451, "grad_norm": 0.13737548185601106, "learning_rate": 5.150626154057939e-05, "loss": 0.2788, "step": 2102 }, { "epoch": 0.5417136233377339, "grad_norm": 0.15823635750885143, "learning_rate": 5.146131151305873e-05, "loss": 0.3731, "step": 2103 }, { "epoch": 0.5419712142190166, "grad_norm": 0.1706746380591667, "learning_rate": 5.1416360303462206e-05, "loss": 0.3554, "step": 2104 }, { "epoch": 0.5422288051002995, "grad_norm": 0.11837053908751594, "learning_rate": 5.137140794815148e-05, "loss": 0.3516, "step": 2105 }, { "epoch": 0.5422288051002995, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8357778941854375, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4169921875, "eval_runtime": 16.4525, "eval_samples_per_second": 2.674, "eval_steps_per_second": 0.182, "step": 2105 }, { "epoch": 0.5424863959815822, "grad_norm": 0.16723448052502865, "learning_rate": 5.1326454483489196e-05, "loss": 0.4145, "step": 2106 }, { "epoch": 0.5427439868628651, "grad_norm": 0.20134589315950735, "learning_rate": 5.1281499945838816e-05, "loss": 0.4247, "step": 2107 }, { "epoch": 0.5430015777441478, "grad_norm": 0.20585582310824724, "learning_rate": 5.1236544371564735e-05, "loss": 0.4477, "step": 2108 }, { "epoch": 0.5432591686254307, "grad_norm": 0.14417732100778552, "learning_rate": 5.119158779703215e-05, "loss": 0.3215, "step": 2109 }, { "epoch": 0.5435167595067134, "grad_norm": 0.18355234493223777, "learning_rate": 5.11466302586071e-05, "loss": 0.4771, "step": 2110 }, { "epoch": 0.5435167595067134, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8404924044002096, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42018821835517883, "eval_runtime": 17.5956, "eval_samples_per_second": 2.501, "eval_steps_per_second": 0.17, "step": 2110 }, { "epoch": 0.5437743503879963, "grad_norm": 0.17354688880894878, "learning_rate": 5.110167179265636e-05, "loss": 0.3518, "step": 2111 }, { "epoch": 0.5440319412692791, "grad_norm": 0.1881262761253409, "learning_rate": 5.1056712435547474e-05, "loss": 0.4283, "step": 2112 }, { "epoch": 0.5442895321505619, "grad_norm": 0.22049463774032257, "learning_rate": 5.101175222364874e-05, "loss": 0.4017, "step": 2113 }, { "epoch": 0.5445471230318447, "grad_norm": 0.21867777753475734, "learning_rate": 5.096679119332909e-05, "loss": 0.4022, "step": 2114 }, { "epoch": 0.5448047139131275, "grad_norm": 0.11658058194358625, "learning_rate": 5.0921829380958174e-05, "loss": 0.311, "step": 2115 }, { "epoch": 0.5448047139131275, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8394447354635934, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.38210228085517883, "eval_runtime": 17.0375, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 2115 }, { "epoch": 0.5450623047944103, "grad_norm": 0.15349217186802172, "learning_rate": 5.0876866822906245e-05, "loss": 0.4086, "step": 2116 }, { "epoch": 0.5453198956756931, "grad_norm": 0.16851131583427995, "learning_rate": 5.0831903555544135e-05, "loss": 0.4019, "step": 2117 }, { "epoch": 0.5455774865569759, "grad_norm": 0.20822578670286693, "learning_rate": 5.078693961524329e-05, "loss": 0.3894, "step": 2118 }, { "epoch": 0.5458350774382587, "grad_norm": 0.1843641977188793, "learning_rate": 5.07419750383757e-05, "loss": 0.3926, "step": 2119 }, { "epoch": 0.5460926683195415, "grad_norm": 0.21264790823720447, "learning_rate": 5.069700986131384e-05, "loss": 0.339, "step": 2120 }, { "epoch": 0.5460926683195415, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.8404924044002096, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3820134997367859, "eval_runtime": 17.4691, "eval_samples_per_second": 2.519, "eval_steps_per_second": 0.172, "step": 2120 }, { "epoch": 0.5463502592008243, "grad_norm": 0.16334836817993717, "learning_rate": 5.0652044120430707e-05, "loss": 0.3713, "step": 2121 }, { "epoch": 0.5466078500821071, "grad_norm": 0.1623736795236759, "learning_rate": 5.060707785209972e-05, "loss": 0.3496, "step": 2122 }, { "epoch": 0.5468654409633898, "grad_norm": 0.1856282482779356, "learning_rate": 5.0562111092694744e-05, "loss": 0.3738, "step": 2123 }, { "epoch": 0.5471230318446727, "grad_norm": 0.16458214441897714, "learning_rate": 5.051714387859001e-05, "loss": 0.4095, "step": 2124 }, { "epoch": 0.5473806227259554, "grad_norm": 0.15882753369852362, "learning_rate": 5.0472176246160184e-05, "loss": 0.3166, "step": 2125 }, { "epoch": 0.5473806227259554, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8496595075955997, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.37890625, "eval_runtime": 17.4158, "eval_samples_per_second": 2.526, "eval_steps_per_second": 0.172, "step": 2125 }, { "epoch": 0.5476382136072383, "grad_norm": 0.1309588342317957, "learning_rate": 5.042720823178022e-05, "loss": 0.3712, "step": 2126 }, { "epoch": 0.5478958044885212, "grad_norm": 0.15892977107103531, "learning_rate": 5.0382239871825365e-05, "loss": 0.4008, "step": 2127 }, { "epoch": 0.5481533953698039, "grad_norm": 0.1375237916698276, "learning_rate": 5.03372712026712e-05, "loss": 0.3384, "step": 2128 }, { "epoch": 0.5484109862510868, "grad_norm": 0.2633674567019821, "learning_rate": 5.029230226069351e-05, "loss": 0.4293, "step": 2129 }, { "epoch": 0.5486685771323695, "grad_norm": 0.1312412710653147, "learning_rate": 5.024733308226833e-05, "loss": 0.3817, "step": 2130 }, { "epoch": 0.5486685771323695, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3759765625, "eval_runtime": 16.9679, "eval_samples_per_second": 2.593, "eval_steps_per_second": 0.177, "step": 2130 }, { "epoch": 0.5489261680136523, "grad_norm": 0.1328720900684053, "learning_rate": 5.020236370377186e-05, "loss": 0.3462, "step": 2131 }, { "epoch": 0.5491837588949351, "grad_norm": 0.1751367425938839, "learning_rate": 5.01573941615805e-05, "loss": 0.4523, "step": 2132 }, { "epoch": 0.549441349776218, "grad_norm": 0.11848844530055186, "learning_rate": 5.0112424492070716e-05, "loss": 0.3, "step": 2133 }, { "epoch": 0.5496989406575007, "grad_norm": 0.13458102728384466, "learning_rate": 5.006745473161917e-05, "loss": 0.3874, "step": 2134 }, { "epoch": 0.5499565315387835, "grad_norm": 0.1346350269991044, "learning_rate": 5.002248491660251e-05, "loss": 0.3357, "step": 2135 }, { "epoch": 0.5499565315387835, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.852016762702986, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3757990002632141, "eval_runtime": 17.0315, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 2135 }, { "epoch": 0.5502141224200663, "grad_norm": 0.1280585930813598, "learning_rate": 4.99775150833975e-05, "loss": 0.3617, "step": 2136 }, { "epoch": 0.5504717133013491, "grad_norm": 0.23752514813094275, "learning_rate": 4.9932545268380824e-05, "loss": 0.4613, "step": 2137 }, { "epoch": 0.5507293041826319, "grad_norm": 0.12008766716175923, "learning_rate": 4.988757550792929e-05, "loss": 0.3089, "step": 2138 }, { "epoch": 0.5509868950639147, "grad_norm": 0.174931204391963, "learning_rate": 4.984260583841953e-05, "loss": 0.4089, "step": 2139 }, { "epoch": 0.5512444859451976, "grad_norm": 0.16401091970078174, "learning_rate": 4.979763629622815e-05, "loss": 0.3493, "step": 2140 }, { "epoch": 0.5512444859451976, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8493975903614458, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3702947497367859, "eval_runtime": 17.4167, "eval_samples_per_second": 2.526, "eval_steps_per_second": 0.172, "step": 2140 }, { "epoch": 0.5515020768264803, "grad_norm": 0.1421853946676774, "learning_rate": 4.975266691773168e-05, "loss": 0.373, "step": 2141 }, { "epoch": 0.5517596677077632, "grad_norm": 0.16680146122780656, "learning_rate": 4.9707697739306494e-05, "loss": 0.3754, "step": 2142 }, { "epoch": 0.5520172585890459, "grad_norm": 0.1493812218399558, "learning_rate": 4.9662728797328815e-05, "loss": 0.3307, "step": 2143 }, { "epoch": 0.5522748494703288, "grad_norm": 0.1417776209584457, "learning_rate": 4.961776012817464e-05, "loss": 0.338, "step": 2144 }, { "epoch": 0.5525324403516115, "grad_norm": 0.19235181629224005, "learning_rate": 4.9572791768219794e-05, "loss": 0.3649, "step": 2145 }, { "epoch": 0.5525324403516115, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.856469355683604, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3668323755264282, "eval_runtime": 17.471, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 2145 }, { "epoch": 0.5527900312328944, "grad_norm": 0.18791856734878726, "learning_rate": 4.9527823753839834e-05, "loss": 0.3634, "step": 2146 }, { "epoch": 0.5530476221141771, "grad_norm": 0.1584590627816371, "learning_rate": 4.9482856121409996e-05, "loss": 0.343, "step": 2147 }, { "epoch": 0.55330521299546, "grad_norm": 0.1355920607532572, "learning_rate": 4.943788890730529e-05, "loss": 0.386, "step": 2148 }, { "epoch": 0.5535628038767427, "grad_norm": 0.14377155856871848, "learning_rate": 4.9392922147900294e-05, "loss": 0.3652, "step": 2149 }, { "epoch": 0.5538203947580256, "grad_norm": 0.14175723136724785, "learning_rate": 4.9347955879569305e-05, "loss": 0.3691, "step": 2150 }, { "epoch": 0.5538203947580256, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8585646935568361, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.37109375, "eval_runtime": 16.885, "eval_samples_per_second": 2.606, "eval_steps_per_second": 0.178, "step": 2150 }, { "epoch": 0.5540779856393083, "grad_norm": 0.23453621043292955, "learning_rate": 4.930299013868615e-05, "loss": 0.5249, "step": 2151 }, { "epoch": 0.5543355765205912, "grad_norm": 0.1344789117262499, "learning_rate": 4.92580249616243e-05, "loss": 0.3675, "step": 2152 }, { "epoch": 0.5545931674018739, "grad_norm": 0.15020191341899067, "learning_rate": 4.9213060384756716e-05, "loss": 0.3039, "step": 2153 }, { "epoch": 0.5548507582831568, "grad_norm": 0.13188450363898974, "learning_rate": 4.916809644445588e-05, "loss": 0.3587, "step": 2154 }, { "epoch": 0.5551083491644396, "grad_norm": 0.15676676363128247, "learning_rate": 4.912313317709378e-05, "loss": 0.3547, "step": 2155 }, { "epoch": 0.5551083491644396, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8630172865374542, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3636363744735718, "eval_runtime": 17.2898, "eval_samples_per_second": 2.545, "eval_steps_per_second": 0.174, "step": 2155 }, { "epoch": 0.5553659400457224, "grad_norm": 0.12183958225770586, "learning_rate": 4.9078170619041824e-05, "loss": 0.3513, "step": 2156 }, { "epoch": 0.5556235309270052, "grad_norm": 0.14353723932149423, "learning_rate": 4.9033208806670925e-05, "loss": 0.3542, "step": 2157 }, { "epoch": 0.555881121808288, "grad_norm": 0.12241634739682451, "learning_rate": 4.898824777635126e-05, "loss": 0.3816, "step": 2158 }, { "epoch": 0.5561387126895708, "grad_norm": 0.17791820413785403, "learning_rate": 4.894328756445254e-05, "loss": 0.3862, "step": 2159 }, { "epoch": 0.5563963035708536, "grad_norm": 0.18737974074821792, "learning_rate": 4.8898328207343666e-05, "loss": 0.406, "step": 2160 }, { "epoch": 0.5563963035708536, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8596123624934521, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3660333752632141, "eval_runtime": 17.3906, "eval_samples_per_second": 2.53, "eval_steps_per_second": 0.173, "step": 2160 }, { "epoch": 0.5566538944521364, "grad_norm": 0.22074640164072148, "learning_rate": 4.885336974139292e-05, "loss": 0.5398, "step": 2161 }, { "epoch": 0.5569114853334192, "grad_norm": 0.16297530028327453, "learning_rate": 4.880841220296786e-05, "loss": 0.415, "step": 2162 }, { "epoch": 0.557169076214702, "grad_norm": 0.11433109053291302, "learning_rate": 4.876345562843527e-05, "loss": 0.3514, "step": 2163 }, { "epoch": 0.5574266670959848, "grad_norm": 0.1398536676505433, "learning_rate": 4.8718500054161195e-05, "loss": 0.3723, "step": 2164 }, { "epoch": 0.5576842579772676, "grad_norm": 0.1478329378108419, "learning_rate": 4.867354551651081e-05, "loss": 0.3927, "step": 2165 }, { "epoch": 0.5576842579772676, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8491356731272918, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3755326569080353, "eval_runtime": 17.1232, "eval_samples_per_second": 2.57, "eval_steps_per_second": 0.175, "step": 2165 }, { "epoch": 0.5579418488585504, "grad_norm": 0.13688230907613783, "learning_rate": 4.862859205184853e-05, "loss": 0.356, "step": 2166 }, { "epoch": 0.5581994397398332, "grad_norm": 0.14598957880294913, "learning_rate": 4.858363969653781e-05, "loss": 0.3203, "step": 2167 }, { "epoch": 0.558457030621116, "grad_norm": 0.14978586225686757, "learning_rate": 4.853868848694128e-05, "loss": 0.3873, "step": 2168 }, { "epoch": 0.5587146215023988, "grad_norm": 0.17697588446454016, "learning_rate": 4.8493738459420625e-05, "loss": 0.3713, "step": 2169 }, { "epoch": 0.5589722123836817, "grad_norm": 0.18040210280731417, "learning_rate": 4.844878965033655e-05, "loss": 0.3624, "step": 2170 }, { "epoch": 0.5589722123836817, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8446830801466736, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3761541247367859, "eval_runtime": 17.2164, "eval_samples_per_second": 2.556, "eval_steps_per_second": 0.174, "step": 2170 }, { "epoch": 0.5592298032649644, "grad_norm": 0.1964276593543136, "learning_rate": 4.84038420960488e-05, "loss": 0.3832, "step": 2171 }, { "epoch": 0.5594873941462473, "grad_norm": 0.16389978703949507, "learning_rate": 4.83588958329161e-05, "loss": 0.4719, "step": 2172 }, { "epoch": 0.55974498502753, "grad_norm": 0.12567930008990083, "learning_rate": 4.8313950897296135e-05, "loss": 0.3569, "step": 2173 }, { "epoch": 0.5600025759088129, "grad_norm": 0.11451491285445857, "learning_rate": 4.8269007325545506e-05, "loss": 0.3477, "step": 2174 }, { "epoch": 0.5602601667900956, "grad_norm": 0.1342974107810076, "learning_rate": 4.8224065154019676e-05, "loss": 0.3394, "step": 2175 }, { "epoch": 0.5602601667900956, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 AUC (fixed)": 0.8425877422734416, "eval_PRM F1 Neg": 0.6, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3746448755264282, "eval_runtime": 17.0633, "eval_samples_per_second": 2.579, "eval_steps_per_second": 0.176, "step": 2175 }, { "epoch": 0.5605177576713785, "grad_norm": 0.19016684018239385, "learning_rate": 4.817912441907308e-05, "loss": 0.3162, "step": 2176 }, { "epoch": 0.5607753485526612, "grad_norm": 0.14054461274800253, "learning_rate": 4.813418515705885e-05, "loss": 0.3744, "step": 2177 }, { "epoch": 0.5610329394339441, "grad_norm": 0.16813177450742112, "learning_rate": 4.808924740432907e-05, "loss": 0.2878, "step": 2178 }, { "epoch": 0.5612905303152268, "grad_norm": 0.14553774665583524, "learning_rate": 4.804431119723449e-05, "loss": 0.358, "step": 2179 }, { "epoch": 0.5615481211965097, "grad_norm": 0.25533237074550735, "learning_rate": 4.799937657212467e-05, "loss": 0.5151, "step": 2180 }, { "epoch": 0.5615481211965097, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8399685699319015, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3894708752632141, "eval_runtime": 17.0529, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 2180 }, { "epoch": 0.5618057120777924, "grad_norm": 0.1297733900890675, "learning_rate": 4.7954443565347865e-05, "loss": 0.3325, "step": 2181 }, { "epoch": 0.5620633029590753, "grad_norm": 0.1673331346690515, "learning_rate": 4.7909512213251026e-05, "loss": 0.3791, "step": 2182 }, { "epoch": 0.5623208938403581, "grad_norm": 0.1343079400856452, "learning_rate": 4.7864582552179796e-05, "loss": 0.2454, "step": 2183 }, { "epoch": 0.5625784847216408, "grad_norm": 0.2087779801405549, "learning_rate": 4.781965461847838e-05, "loss": 0.3994, "step": 2184 }, { "epoch": 0.5628360756029237, "grad_norm": 0.141789777382412, "learning_rate": 4.7774728448489666e-05, "loss": 0.4016, "step": 2185 }, { "epoch": 0.5628360756029237, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8690476190476191, "eval_PRM F1 AUC": 0.678889470927187, "eval_PRM F1 AUC (fixed)": 0.8365636458878994, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.5238095238095238, "eval_PRM Precision": 0.8588235294117647, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.39089134335517883, "eval_runtime": 16.7172, "eval_samples_per_second": 2.632, "eval_steps_per_second": 0.179, "step": 2185 }, { "epoch": 0.5630936664842064, "grad_norm": 0.1965836602182714, "learning_rate": 4.7729804078555044e-05, "loss": 0.4113, "step": 2186 }, { "epoch": 0.5633512573654893, "grad_norm": 0.18292467806038407, "learning_rate": 4.768488154501454e-05, "loss": 0.3361, "step": 2187 }, { "epoch": 0.563608848246772, "grad_norm": 0.16613394402746923, "learning_rate": 4.7639960884206576e-05, "loss": 0.3961, "step": 2188 }, { "epoch": 0.5638664391280549, "grad_norm": 0.18376328117834048, "learning_rate": 4.759504213246813e-05, "loss": 0.3649, "step": 2189 }, { "epoch": 0.5641240300093376, "grad_norm": 0.15517133244551723, "learning_rate": 4.755012532613465e-05, "loss": 0.3249, "step": 2190 }, { "epoch": 0.5641240300093376, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8381351492928234, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3722478747367859, "eval_runtime": 16.9506, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 2190 }, { "epoch": 0.5643816208906205, "grad_norm": 0.12600302601372262, "learning_rate": 4.7505210501539966e-05, "loss": 0.366, "step": 2191 }, { "epoch": 0.5646392117719032, "grad_norm": 0.16316320475752782, "learning_rate": 4.746029769501634e-05, "loss": 0.3683, "step": 2192 }, { "epoch": 0.5648968026531861, "grad_norm": 0.18499636302691863, "learning_rate": 4.741538694289437e-05, "loss": 0.4064, "step": 2193 }, { "epoch": 0.5651543935344688, "grad_norm": 0.1303058154252544, "learning_rate": 4.7370478281503014e-05, "loss": 0.3632, "step": 2194 }, { "epoch": 0.5654119844157517, "grad_norm": 0.15355381606296517, "learning_rate": 4.7325571747169545e-05, "loss": 0.3509, "step": 2195 }, { "epoch": 0.5654119844157517, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8588957055214724, "eval_PRM F1 AUC": 0.7042954426401258, "eval_PRM F1 AUC (fixed)": 0.8410162388685175, "eval_PRM F1 Neg": 0.5306122448979592, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3628373444080353, "eval_runtime": 17.0342, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 2195 }, { "epoch": 0.5656695752970344, "grad_norm": 0.1760926218321264, "learning_rate": 4.728066737621947e-05, "loss": 0.4315, "step": 2196 }, { "epoch": 0.5659271661783173, "grad_norm": 0.21462043388412655, "learning_rate": 4.723576520497663e-05, "loss": 0.4928, "step": 2197 }, { "epoch": 0.5661847570596001, "grad_norm": 0.12322984749559669, "learning_rate": 4.719086526976298e-05, "loss": 0.2569, "step": 2198 }, { "epoch": 0.5664423479408829, "grad_norm": 0.12928031124907874, "learning_rate": 4.714596760689878e-05, "loss": 0.3709, "step": 2199 }, { "epoch": 0.5666999388221657, "grad_norm": 0.14365617703509492, "learning_rate": 4.710107225270236e-05, "loss": 0.3403, "step": 2200 }, { "epoch": 0.5666999388221657, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8538501833420639, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.35342684388160706, "eval_runtime": 16.8425, "eval_samples_per_second": 2.612, "eval_steps_per_second": 0.178, "step": 2200 }, { "epoch": 0.5669575297034485, "grad_norm": 0.12062531516149663, "learning_rate": 4.70561792434902e-05, "loss": 0.3082, "step": 2201 }, { "epoch": 0.5672151205847313, "grad_norm": 0.1526087638521343, "learning_rate": 4.7011288615576934e-05, "loss": 0.3406, "step": 2202 }, { "epoch": 0.5674727114660141, "grad_norm": 0.15644291328617355, "learning_rate": 4.6966400405275224e-05, "loss": 0.3636, "step": 2203 }, { "epoch": 0.5677303023472969, "grad_norm": 0.13913944417182417, "learning_rate": 4.6921514648895786e-05, "loss": 0.3085, "step": 2204 }, { "epoch": 0.5679878932285797, "grad_norm": 0.16084278441444716, "learning_rate": 4.687663138274735e-05, "loss": 0.3669, "step": 2205 }, { "epoch": 0.5679878932285797, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8627553693033002, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3511185944080353, "eval_runtime": 17.1619, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 2205 }, { "epoch": 0.5682454841098625, "grad_norm": 0.20549808343963985, "learning_rate": 4.683175064313666e-05, "loss": 0.4485, "step": 2206 }, { "epoch": 0.5685030749911453, "grad_norm": 0.12326408605710353, "learning_rate": 4.6786872466368346e-05, "loss": 0.3371, "step": 2207 }, { "epoch": 0.5687606658724281, "grad_norm": 0.1786740596929532, "learning_rate": 4.6741996888745034e-05, "loss": 0.3124, "step": 2208 }, { "epoch": 0.5690182567537109, "grad_norm": 0.15079983176315676, "learning_rate": 4.6697123946567227e-05, "loss": 0.3673, "step": 2209 }, { "epoch": 0.5692758476349937, "grad_norm": 0.19944306111265092, "learning_rate": 4.665225367613328e-05, "loss": 0.4476, "step": 2210 }, { "epoch": 0.5692758476349937, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8656364588789942, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3511185944080353, "eval_runtime": 16.9474, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 2210 }, { "epoch": 0.5695334385162765, "grad_norm": 0.14572671723711672, "learning_rate": 4.6607386113739413e-05, "loss": 0.3723, "step": 2211 }, { "epoch": 0.5697910293975593, "grad_norm": 0.15106906527292013, "learning_rate": 4.656252129567963e-05, "loss": 0.3103, "step": 2212 }, { "epoch": 0.5700486202788422, "grad_norm": 0.2634210600639788, "learning_rate": 4.6517659258245734e-05, "loss": 0.5098, "step": 2213 }, { "epoch": 0.5703062111601249, "grad_norm": 0.11451975560835995, "learning_rate": 4.647280003772728e-05, "loss": 0.3236, "step": 2214 }, { "epoch": 0.5705638020414078, "grad_norm": 0.1586227318953602, "learning_rate": 4.6427943670411495e-05, "loss": 0.3795, "step": 2215 }, { "epoch": 0.5705638020414078, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 AUC (fixed)": 0.8643268727082243, "eval_PRM F1 Neg": 0.625, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.34108665585517883, "eval_runtime": 17.7693, "eval_samples_per_second": 2.476, "eval_steps_per_second": 0.169, "step": 2215 }, { "epoch": 0.5708213929226905, "grad_norm": 0.15676782722268975, "learning_rate": 4.63830901925834e-05, "loss": 0.3931, "step": 2216 }, { "epoch": 0.5710789838039734, "grad_norm": 0.13454389321114535, "learning_rate": 4.633823964052555e-05, "loss": 0.369, "step": 2217 }, { "epoch": 0.5713365746852561, "grad_norm": 0.12218625857130747, "learning_rate": 4.629339205051827e-05, "loss": 0.3256, "step": 2218 }, { "epoch": 0.571594165566539, "grad_norm": 0.1375886521697247, "learning_rate": 4.6248547458839365e-05, "loss": 0.3486, "step": 2219 }, { "epoch": 0.5718517564478217, "grad_norm": 0.1461004670609193, "learning_rate": 4.62037059017643e-05, "loss": 0.3915, "step": 2220 }, { "epoch": 0.5718517564478217, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8834355828220859, "eval_PRM F1 AUC": 0.7598218962807753, "eval_PRM F1 AUC (fixed)": 0.859350445259298, "eval_PRM F1 Neg": 0.6122448979591837, "eval_PRM NPV": 0.5769230769230769, "eval_PRM Precision": 0.9, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.34765625, "eval_runtime": 16.9494, "eval_samples_per_second": 2.596, "eval_steps_per_second": 0.177, "step": 2220 }, { "epoch": 0.5721093473291046, "grad_norm": 0.13185660987919753, "learning_rate": 4.615886741556604e-05, "loss": 0.3213, "step": 2221 }, { "epoch": 0.5723669382103873, "grad_norm": 0.16499953154104235, "learning_rate": 4.611403203651507e-05, "loss": 0.3698, "step": 2222 }, { "epoch": 0.5726245290916702, "grad_norm": 0.1837604920686579, "learning_rate": 4.60691998008794e-05, "loss": 0.3873, "step": 2223 }, { "epoch": 0.5728821199729529, "grad_norm": 0.142755388671106, "learning_rate": 4.602437074492445e-05, "loss": 0.4132, "step": 2224 }, { "epoch": 0.5731397108542358, "grad_norm": 0.15381425681621197, "learning_rate": 4.59795449049131e-05, "loss": 0.339, "step": 2225 }, { "epoch": 0.5731397108542358, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3608842194080353, "eval_runtime": 17.1193, "eval_samples_per_second": 2.57, "eval_steps_per_second": 0.175, "step": 2225 }, { "epoch": 0.5733973017355186, "grad_norm": 0.13265249259935646, "learning_rate": 4.593472231710559e-05, "loss": 0.296, "step": 2226 }, { "epoch": 0.5736548926168014, "grad_norm": 0.10971577687365057, "learning_rate": 4.58899030177596e-05, "loss": 0.2991, "step": 2227 }, { "epoch": 0.5739124834980842, "grad_norm": 0.1346092443842548, "learning_rate": 4.584508704313006e-05, "loss": 0.3516, "step": 2228 }, { "epoch": 0.574170074379367, "grad_norm": 0.28546397698404885, "learning_rate": 4.580027442946928e-05, "loss": 0.5096, "step": 2229 }, { "epoch": 0.5744276652606498, "grad_norm": 0.2153285699974356, "learning_rate": 4.575546521302681e-05, "loss": 0.4035, "step": 2230 }, { "epoch": 0.5744276652606498, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.855945521215296, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.376953125, "eval_runtime": 16.9774, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 2230 }, { "epoch": 0.5746852561419326, "grad_norm": 0.15833971603216263, "learning_rate": 4.571065943004947e-05, "loss": 0.403, "step": 2231 }, { "epoch": 0.5749428470232154, "grad_norm": 0.16444949348925209, "learning_rate": 4.566585711678133e-05, "loss": 0.3791, "step": 2232 }, { "epoch": 0.5752004379044982, "grad_norm": 0.1459790553316448, "learning_rate": 4.56210583094636e-05, "loss": 0.3827, "step": 2233 }, { "epoch": 0.575458028785781, "grad_norm": 0.13441591004776918, "learning_rate": 4.557626304433467e-05, "loss": 0.4107, "step": 2234 }, { "epoch": 0.5757156196670637, "grad_norm": 0.15489351648664135, "learning_rate": 4.5531471357630114e-05, "loss": 0.3618, "step": 2235 }, { "epoch": 0.5757156196670637, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8530644316396019, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.37428978085517883, "eval_runtime": 17.4467, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 2235 }, { "epoch": 0.5759732105483466, "grad_norm": 0.1277990860423348, "learning_rate": 4.54866832855825e-05, "loss": 0.4014, "step": 2236 }, { "epoch": 0.5762308014296293, "grad_norm": 0.15228208517801683, "learning_rate": 4.544189886442162e-05, "loss": 0.372, "step": 2237 }, { "epoch": 0.5764883923109122, "grad_norm": 0.1254931002378707, "learning_rate": 4.5397118130374175e-05, "loss": 0.3067, "step": 2238 }, { "epoch": 0.5767459831921949, "grad_norm": 0.15408585564454477, "learning_rate": 4.535234111966399e-05, "loss": 0.4115, "step": 2239 }, { "epoch": 0.5770035740734778, "grad_norm": 0.15631776075479115, "learning_rate": 4.5307567868511795e-05, "loss": 0.4342, "step": 2240 }, { "epoch": 0.5770035740734778, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8473022524882137, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3833451569080353, "eval_runtime": 17.0431, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 2240 }, { "epoch": 0.5772611649547607, "grad_norm": 0.1204536283126352, "learning_rate": 4.5262798413135344e-05, "loss": 0.3439, "step": 2241 }, { "epoch": 0.5775187558360434, "grad_norm": 0.11277574795480862, "learning_rate": 4.5218032789749275e-05, "loss": 0.2972, "step": 2242 }, { "epoch": 0.5777763467173263, "grad_norm": 0.13040420288598253, "learning_rate": 4.517327103456515e-05, "loss": 0.3522, "step": 2243 }, { "epoch": 0.578033937598609, "grad_norm": 0.12038259999115875, "learning_rate": 4.5128513183791386e-05, "loss": 0.298, "step": 2244 }, { "epoch": 0.5782915284798918, "grad_norm": 0.12879970384020212, "learning_rate": 4.5083759273633267e-05, "loss": 0.3444, "step": 2245 }, { "epoch": 0.5782915284798918, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8473022524882137, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.38387784361839294, "eval_runtime": 16.4767, "eval_samples_per_second": 2.67, "eval_steps_per_second": 0.182, "step": 2245 }, { "epoch": 0.5785491193611746, "grad_norm": 0.1312248062851336, "learning_rate": 4.503900934029287e-05, "loss": 0.3658, "step": 2246 }, { "epoch": 0.5788067102424574, "grad_norm": 0.1264918196677566, "learning_rate": 4.4994263419969055e-05, "loss": 0.3519, "step": 2247 }, { "epoch": 0.5790643011237402, "grad_norm": 0.11470048536136435, "learning_rate": 4.4949521548857426e-05, "loss": 0.349, "step": 2248 }, { "epoch": 0.579321892005023, "grad_norm": 0.15467134731951687, "learning_rate": 4.490478376315035e-05, "loss": 0.3333, "step": 2249 }, { "epoch": 0.5795794828863058, "grad_norm": 0.1514767223007565, "learning_rate": 4.486005009903684e-05, "loss": 0.3993, "step": 2250 }, { "epoch": 0.5795794828863058, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.855945521215296, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3881392180919647, "eval_runtime": 17.398, "eval_samples_per_second": 2.529, "eval_steps_per_second": 0.172, "step": 2250 }, { "epoch": 0.5798370737675886, "grad_norm": 0.20915160984468872, "learning_rate": 4.481532059270262e-05, "loss": 0.3845, "step": 2251 }, { "epoch": 0.5800946646488714, "grad_norm": 0.16023912248270797, "learning_rate": 4.477059528033001e-05, "loss": 0.4117, "step": 2252 }, { "epoch": 0.5803522555301542, "grad_norm": 0.18700292286454162, "learning_rate": 4.472587419809798e-05, "loss": 0.4213, "step": 2253 }, { "epoch": 0.580609846411437, "grad_norm": 0.12058361241555736, "learning_rate": 4.468115738218206e-05, "loss": 0.4035, "step": 2254 }, { "epoch": 0.5808674372927198, "grad_norm": 0.15736977413293526, "learning_rate": 4.463644486875427e-05, "loss": 0.4465, "step": 2255 }, { "epoch": 0.5808674372927198, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8533263488737559, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.37180396914482117, "eval_runtime": 16.8676, "eval_samples_per_second": 2.609, "eval_steps_per_second": 0.178, "step": 2255 }, { "epoch": 0.5811250281740027, "grad_norm": 0.14231846289545302, "learning_rate": 4.459173669398328e-05, "loss": 0.3966, "step": 2256 }, { "epoch": 0.5813826190552854, "grad_norm": 0.15200014494583405, "learning_rate": 4.454703289403411e-05, "loss": 0.4429, "step": 2257 }, { "epoch": 0.5816402099365683, "grad_norm": 0.1484057973180248, "learning_rate": 4.450233350506836e-05, "loss": 0.3177, "step": 2258 }, { "epoch": 0.581897800817851, "grad_norm": 0.1454146292852184, "learning_rate": 4.4457638563243954e-05, "loss": 0.3001, "step": 2259 }, { "epoch": 0.5821553916991339, "grad_norm": 0.18622364318324686, "learning_rate": 4.4412948104715316e-05, "loss": 0.3707, "step": 2260 }, { "epoch": 0.5821553916991339, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.8467784180199056, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.37411221861839294, "eval_runtime": 17.0686, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 2260 }, { "epoch": 0.5824129825804166, "grad_norm": 0.18289434281705721, "learning_rate": 4.436826216563318e-05, "loss": 0.3948, "step": 2261 }, { "epoch": 0.5826705734616995, "grad_norm": 0.12791602046198763, "learning_rate": 4.432358078214464e-05, "loss": 0.308, "step": 2262 }, { "epoch": 0.5829281643429822, "grad_norm": 0.14830241151439877, "learning_rate": 4.4278903990393127e-05, "loss": 0.2993, "step": 2263 }, { "epoch": 0.5831857552242651, "grad_norm": 0.15756705571132135, "learning_rate": 4.423423182651831e-05, "loss": 0.4263, "step": 2264 }, { "epoch": 0.5834433461055478, "grad_norm": 0.14695797512698278, "learning_rate": 4.418956432665618e-05, "loss": 0.4075, "step": 2265 }, { "epoch": 0.5834433461055478, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8470403352540599, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3751775622367859, "eval_runtime": 17.512, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 2265 }, { "epoch": 0.5837009369868307, "grad_norm": 0.13259319305805958, "learning_rate": 4.4144901526938886e-05, "loss": 0.398, "step": 2266 }, { "epoch": 0.5839585278681134, "grad_norm": 0.1593042136574566, "learning_rate": 4.410024346349484e-05, "loss": 0.4099, "step": 2267 }, { "epoch": 0.5842161187493963, "grad_norm": 0.1451339019173708, "learning_rate": 4.405559017244857e-05, "loss": 0.3785, "step": 2268 }, { "epoch": 0.5844737096306791, "grad_norm": 0.2515281631502885, "learning_rate": 4.401094168992075e-05, "loss": 0.4094, "step": 2269 }, { "epoch": 0.5847313005119619, "grad_norm": 0.19495752680724165, "learning_rate": 4.396629805202821e-05, "loss": 0.3853, "step": 2270 }, { "epoch": 0.5847313005119619, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8446830801466737, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3761541247367859, "eval_runtime": 17.172, "eval_samples_per_second": 2.562, "eval_steps_per_second": 0.175, "step": 2270 }, { "epoch": 0.5849888913932447, "grad_norm": 0.15725677876385077, "learning_rate": 4.392165929488381e-05, "loss": 0.3737, "step": 2271 }, { "epoch": 0.5852464822745275, "grad_norm": 0.13637584450534468, "learning_rate": 4.387702545459649e-05, "loss": 0.3327, "step": 2272 }, { "epoch": 0.5855040731558103, "grad_norm": 0.1561340421962783, "learning_rate": 4.383239656727119e-05, "loss": 0.4173, "step": 2273 }, { "epoch": 0.5857616640370931, "grad_norm": 0.2638794545999978, "learning_rate": 4.378777266900889e-05, "loss": 0.5171, "step": 2274 }, { "epoch": 0.5860192549183759, "grad_norm": 0.12291816196261775, "learning_rate": 4.374315379590649e-05, "loss": 0.3587, "step": 2275 }, { "epoch": 0.5860192549183759, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8368255631220533, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.37801846861839294, "eval_runtime": 17.4753, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 2275 }, { "epoch": 0.5862768457996587, "grad_norm": 0.1803958721122535, "learning_rate": 4.36985399840568e-05, "loss": 0.4139, "step": 2276 }, { "epoch": 0.5865344366809415, "grad_norm": 0.19998996472480873, "learning_rate": 4.365393126954863e-05, "loss": 0.3019, "step": 2277 }, { "epoch": 0.5867920275622243, "grad_norm": 0.14917447809816536, "learning_rate": 4.3609327688466546e-05, "loss": 0.3539, "step": 2278 }, { "epoch": 0.5870496184435071, "grad_norm": 0.154365871065513, "learning_rate": 4.356472927689109e-05, "loss": 0.3742, "step": 2279 }, { "epoch": 0.5873072093247899, "grad_norm": 0.12829951247327792, "learning_rate": 4.352013607089852e-05, "loss": 0.365, "step": 2280 }, { "epoch": 0.5873072093247899, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8302776322682034, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3888494372367859, "eval_runtime": 17.2207, "eval_samples_per_second": 2.555, "eval_steps_per_second": 0.174, "step": 2280 }, { "epoch": 0.5875648002060727, "grad_norm": 0.16134000007480917, "learning_rate": 4.347554810656093e-05, "loss": 0.4404, "step": 2281 }, { "epoch": 0.5878223910873555, "grad_norm": 0.13756861935496567, "learning_rate": 4.343096541994617e-05, "loss": 0.3328, "step": 2282 }, { "epoch": 0.5880799819686383, "grad_norm": 0.11227877119448444, "learning_rate": 4.3386388047117796e-05, "loss": 0.2859, "step": 2283 }, { "epoch": 0.5883375728499212, "grad_norm": 0.1295742460879775, "learning_rate": 4.334181602413511e-05, "loss": 0.3618, "step": 2284 }, { "epoch": 0.5885951637312039, "grad_norm": 0.13980724148963705, "learning_rate": 4.329724938705304e-05, "loss": 0.3653, "step": 2285 }, { "epoch": 0.5885951637312039, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8300157150340493, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4008345305919647, "eval_runtime": 17.3421, "eval_samples_per_second": 2.537, "eval_steps_per_second": 0.173, "step": 2285 }, { "epoch": 0.5888527546124868, "grad_norm": 0.13831366656318222, "learning_rate": 4.32526881719222e-05, "loss": 0.3624, "step": 2286 }, { "epoch": 0.5891103454937695, "grad_norm": 0.13796271646368452, "learning_rate": 4.320813241478876e-05, "loss": 0.3287, "step": 2287 }, { "epoch": 0.5893679363750524, "grad_norm": 0.20813717625802478, "learning_rate": 4.3163582151694573e-05, "loss": 0.3713, "step": 2288 }, { "epoch": 0.5896255272563351, "grad_norm": 0.12250415747063537, "learning_rate": 4.3119037418676933e-05, "loss": 0.2924, "step": 2289 }, { "epoch": 0.589883118137618, "grad_norm": 0.19821969688382862, "learning_rate": 4.3074498251768716e-05, "loss": 0.4017, "step": 2290 }, { "epoch": 0.589883118137618, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.8433734939759038, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4139293432235718, "eval_runtime": 17.5685, "eval_samples_per_second": 2.504, "eval_steps_per_second": 0.171, "step": 2290 }, { "epoch": 0.5901407090189007, "grad_norm": 0.11948246377924135, "learning_rate": 4.302996468699833e-05, "loss": 0.2829, "step": 2291 }, { "epoch": 0.5903982999001836, "grad_norm": 0.2492267578473308, "learning_rate": 4.298543676038958e-05, "loss": 0.4189, "step": 2292 }, { "epoch": 0.5906558907814663, "grad_norm": 0.19005796072967893, "learning_rate": 4.2940914507961775e-05, "loss": 0.3656, "step": 2293 }, { "epoch": 0.5909134816627492, "grad_norm": 0.24832687920935803, "learning_rate": 4.2896397965729575e-05, "loss": 0.3959, "step": 2294 }, { "epoch": 0.5911710725440319, "grad_norm": 0.2203340009224552, "learning_rate": 4.285188716970307e-05, "loss": 0.4418, "step": 2295 }, { "epoch": 0.5911710725440319, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8397066526977477, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3896484375, "eval_runtime": 17.6247, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 2295 }, { "epoch": 0.5914286634253147, "grad_norm": 0.13878427099407956, "learning_rate": 4.280738215588769e-05, "loss": 0.3719, "step": 2296 }, { "epoch": 0.5916862543065975, "grad_norm": 0.15998587752502577, "learning_rate": 4.276288296028413e-05, "loss": 0.3582, "step": 2297 }, { "epoch": 0.5919438451878803, "grad_norm": 0.16923710750646784, "learning_rate": 4.27183896188885e-05, "loss": 0.3764, "step": 2298 }, { "epoch": 0.5922014360691632, "grad_norm": 0.13725800110456088, "learning_rate": 4.267390216769205e-05, "loss": 0.3212, "step": 2299 }, { "epoch": 0.5924590269504459, "grad_norm": 0.1443056880246243, "learning_rate": 4.262942064268134e-05, "loss": 0.3848, "step": 2300 }, { "epoch": 0.5924590269504459, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 AUC (fixed)": 0.8397066526977476, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3832564055919647, "eval_runtime": 17.5859, "eval_samples_per_second": 2.502, "eval_steps_per_second": 0.171, "step": 2300 }, { "epoch": 0.5927166178317288, "grad_norm": 0.1925039231194253, "learning_rate": 4.2584945079838096e-05, "loss": 0.3163, "step": 2301 }, { "epoch": 0.5929742087130115, "grad_norm": 0.21111701745013034, "learning_rate": 4.2540475515139264e-05, "loss": 0.4348, "step": 2302 }, { "epoch": 0.5932317995942944, "grad_norm": 0.16305082349405703, "learning_rate": 4.249601198455691e-05, "loss": 0.3986, "step": 2303 }, { "epoch": 0.5934893904755771, "grad_norm": 0.13293669947815345, "learning_rate": 4.245155452405819e-05, "loss": 0.2639, "step": 2304 }, { "epoch": 0.59374698135686, "grad_norm": 0.18048699718115427, "learning_rate": 4.2407103169605436e-05, "loss": 0.4084, "step": 2305 }, { "epoch": 0.59374698135686, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8625, "eval_PRM F1 AUC": 0.7417496071241488, "eval_PRM F1 AUC (fixed)": 0.8441592456783658, "eval_PRM F1 Neg": 0.5769230769230769, "eval_PRM NPV": 0.5172413793103449, "eval_PRM Precision": 0.8961038961038961, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.37784090638160706, "eval_runtime": 16.8174, "eval_samples_per_second": 2.616, "eval_steps_per_second": 0.178, "step": 2305 }, { "epoch": 0.5940045722381427, "grad_norm": 0.1798571551854095, "learning_rate": 4.2362657957155934e-05, "loss": 0.4594, "step": 2306 }, { "epoch": 0.5942621631194256, "grad_norm": 0.14420653302408004, "learning_rate": 4.23182189226621e-05, "loss": 0.2714, "step": 2307 }, { "epoch": 0.5945197540007083, "grad_norm": 0.1505100604261495, "learning_rate": 4.2273786102071275e-05, "loss": 0.3587, "step": 2308 }, { "epoch": 0.5947773448819912, "grad_norm": 0.14331384765206512, "learning_rate": 4.2229359531325804e-05, "loss": 0.402, "step": 2309 }, { "epoch": 0.5950349357632739, "grad_norm": 0.14206105415515183, "learning_rate": 4.2184939246363005e-05, "loss": 0.4072, "step": 2310 }, { "epoch": 0.5950349357632739, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8528025144054479, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3757990002632141, "eval_runtime": 17.7482, "eval_samples_per_second": 2.479, "eval_steps_per_second": 0.169, "step": 2310 }, { "epoch": 0.5952925266445568, "grad_norm": 0.12844389785248492, "learning_rate": 4.214052528311506e-05, "loss": 0.3422, "step": 2311 }, { "epoch": 0.5955501175258396, "grad_norm": 0.1417563698914759, "learning_rate": 4.209611767750908e-05, "loss": 0.3675, "step": 2312 }, { "epoch": 0.5958077084071224, "grad_norm": 0.18466106503914595, "learning_rate": 4.2051716465466986e-05, "loss": 0.4099, "step": 2313 }, { "epoch": 0.5960652992884052, "grad_norm": 0.21904032491039754, "learning_rate": 4.20073216829056e-05, "loss": 0.4417, "step": 2314 }, { "epoch": 0.596322890169688, "grad_norm": 0.14913382778989, "learning_rate": 4.196293336573648e-05, "loss": 0.3804, "step": 2315 }, { "epoch": 0.596322890169688, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3802379369735718, "eval_runtime": 16.9919, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 2315 }, { "epoch": 0.5965804810509708, "grad_norm": 0.13716170546344314, "learning_rate": 4.1918551549865934e-05, "loss": 0.3671, "step": 2316 }, { "epoch": 0.5968380719322536, "grad_norm": 0.13506852473226214, "learning_rate": 4.187417627119511e-05, "loss": 0.3434, "step": 2317 }, { "epoch": 0.5970956628135364, "grad_norm": 0.1313861150309788, "learning_rate": 4.182980756561976e-05, "loss": 0.36, "step": 2318 }, { "epoch": 0.5973532536948192, "grad_norm": 0.12254271130288111, "learning_rate": 4.178544546903042e-05, "loss": 0.3909, "step": 2319 }, { "epoch": 0.597610844576102, "grad_norm": 0.14060596925147895, "learning_rate": 4.1741090017312166e-05, "loss": 0.3432, "step": 2320 }, { "epoch": 0.597610844576102, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 AUC (fixed)": 0.8444211629125197, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.38503196835517883, "eval_runtime": 17.1014, "eval_samples_per_second": 2.573, "eval_steps_per_second": 0.175, "step": 2320 }, { "epoch": 0.5978684354573848, "grad_norm": 0.168004846727644, "learning_rate": 4.169674124634481e-05, "loss": 0.4644, "step": 2321 }, { "epoch": 0.5981260263386676, "grad_norm": 0.1415225286134437, "learning_rate": 4.165239919200269e-05, "loss": 0.2826, "step": 2322 }, { "epoch": 0.5983836172199504, "grad_norm": 0.13137494742688535, "learning_rate": 4.1608063890154715e-05, "loss": 0.4054, "step": 2323 }, { "epoch": 0.5986412081012332, "grad_norm": 0.1470378613652157, "learning_rate": 4.156373537666437e-05, "loss": 0.3757, "step": 2324 }, { "epoch": 0.598898798982516, "grad_norm": 0.1269355336304008, "learning_rate": 4.1519413687389615e-05, "loss": 0.3243, "step": 2325 }, { "epoch": 0.598898798982516, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 AUC (fixed)": 0.8452069146149818, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3919566869735718, "eval_runtime": 17.288, "eval_samples_per_second": 2.545, "eval_steps_per_second": 0.174, "step": 2325 }, { "epoch": 0.5991563898637988, "grad_norm": 0.14258608967689515, "learning_rate": 4.147509885818292e-05, "loss": 0.3029, "step": 2326 }, { "epoch": 0.5994139807450817, "grad_norm": 0.13317579369354718, "learning_rate": 4.143079092489114e-05, "loss": 0.3345, "step": 2327 }, { "epoch": 0.5996715716263644, "grad_norm": 0.18059828585327012, "learning_rate": 4.138648992335566e-05, "loss": 0.4281, "step": 2328 }, { "epoch": 0.5999291625076473, "grad_norm": 0.13015801332157306, "learning_rate": 4.1342195889412166e-05, "loss": 0.4118, "step": 2329 }, { "epoch": 0.60018675338893, "grad_norm": 0.21798644743809673, "learning_rate": 4.129790885889072e-05, "loss": 0.4471, "step": 2330 }, { "epoch": 0.60018675338893, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8410162388685175, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4052290618419647, "eval_runtime": 17.4006, "eval_samples_per_second": 2.529, "eval_steps_per_second": 0.172, "step": 2330 }, { "epoch": 0.6004443442702129, "grad_norm": 0.13610508936668073, "learning_rate": 4.125362886761577e-05, "loss": 0.3657, "step": 2331 }, { "epoch": 0.6007019351514956, "grad_norm": 0.15504773900939664, "learning_rate": 4.1209355951406e-05, "loss": 0.4261, "step": 2332 }, { "epoch": 0.6009595260327785, "grad_norm": 0.1446863802292206, "learning_rate": 4.1165090146074446e-05, "loss": 0.3632, "step": 2333 }, { "epoch": 0.6012171169140612, "grad_norm": 0.13063788776631363, "learning_rate": 4.112083148742833e-05, "loss": 0.3635, "step": 2334 }, { "epoch": 0.6014747077953441, "grad_norm": 0.12052295245282314, "learning_rate": 4.107658001126913e-05, "loss": 0.3628, "step": 2335 }, { "epoch": 0.6014747077953441, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8305395495023573, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4041193127632141, "eval_runtime": 17.7381, "eval_samples_per_second": 2.481, "eval_steps_per_second": 0.169, "step": 2335 }, { "epoch": 0.6017322986766268, "grad_norm": 0.14273888256518527, "learning_rate": 4.1032335753392505e-05, "loss": 0.4155, "step": 2336 }, { "epoch": 0.6019898895579097, "grad_norm": 0.19249131742072517, "learning_rate": 4.098809874958822e-05, "loss": 0.4896, "step": 2337 }, { "epoch": 0.6022474804391924, "grad_norm": 0.1203162215241167, "learning_rate": 4.09438690356403e-05, "loss": 0.4073, "step": 2338 }, { "epoch": 0.6025050713204753, "grad_norm": 0.1726093816833048, "learning_rate": 4.089964664732674e-05, "loss": 0.4277, "step": 2339 }, { "epoch": 0.602762662201758, "grad_norm": 0.1295230914383838, "learning_rate": 4.085543162041969e-05, "loss": 0.3623, "step": 2340 }, { "epoch": 0.602762662201758, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8250392875851231, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.40065696835517883, "eval_runtime": 17.0919, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.176, "step": 2340 }, { "epoch": 0.6030202530830409, "grad_norm": 0.173569420588442, "learning_rate": 4.0811223990685306e-05, "loss": 0.38, "step": 2341 }, { "epoch": 0.6032778439643237, "grad_norm": 0.13684583572111672, "learning_rate": 4.0767023793883785e-05, "loss": 0.3606, "step": 2342 }, { "epoch": 0.6035354348456065, "grad_norm": 0.14005902767896153, "learning_rate": 4.0722831065769304e-05, "loss": 0.3749, "step": 2343 }, { "epoch": 0.6037930257268893, "grad_norm": 0.12740103105685202, "learning_rate": 4.067864584208997e-05, "loss": 0.3653, "step": 2344 }, { "epoch": 0.604050616608172, "grad_norm": 0.15660047142322808, "learning_rate": 4.063446815858788e-05, "loss": 0.3316, "step": 2345 }, { "epoch": 0.604050616608172, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.821634363541121, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.40731534361839294, "eval_runtime": 17.0906, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 2345 }, { "epoch": 0.6043082074894549, "grad_norm": 0.1520180262232338, "learning_rate": 4.0590298050998964e-05, "loss": 0.3688, "step": 2346 }, { "epoch": 0.6045657983707377, "grad_norm": 0.1483852238797389, "learning_rate": 4.05461355550531e-05, "loss": 0.3624, "step": 2347 }, { "epoch": 0.6048233892520205, "grad_norm": 0.1601064996885839, "learning_rate": 4.05019807064739e-05, "loss": 0.456, "step": 2348 }, { "epoch": 0.6050809801333032, "grad_norm": 0.1775581775355606, "learning_rate": 4.045783354097893e-05, "loss": 0.3666, "step": 2349 }, { "epoch": 0.6053385710145861, "grad_norm": 0.1391482916141042, "learning_rate": 4.041369409427941e-05, "loss": 0.3885, "step": 2350 }, { "epoch": 0.6053385710145861, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.8268727082242011, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.42001065611839294, "eval_runtime": 17.0055, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 2350 }, { "epoch": 0.6055961618958688, "grad_norm": 0.16933116300541795, "learning_rate": 4.0369562402080384e-05, "loss": 0.4159, "step": 2351 }, { "epoch": 0.6058537527771517, "grad_norm": 0.16754478600512965, "learning_rate": 4.032543850008063e-05, "loss": 0.3919, "step": 2352 }, { "epoch": 0.6061113436584344, "grad_norm": 0.19447554248718874, "learning_rate": 4.028132242397258e-05, "loss": 0.4139, "step": 2353 }, { "epoch": 0.6063689345397173, "grad_norm": 0.13432879039547974, "learning_rate": 4.0237214209442394e-05, "loss": 0.365, "step": 2354 }, { "epoch": 0.6066265254210002, "grad_norm": 0.15885519743295454, "learning_rate": 4.0193113892169804e-05, "loss": 0.3813, "step": 2355 }, { "epoch": 0.6066265254210002, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8622754491017964, "eval_PRM F1 AUC": 0.6728653745416449, "eval_PRM F1 AUC (fixed)": 0.8218962807752749, "eval_PRM F1 Neg": 0.4888888888888889, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8571428571428571, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4205433130264282, "eval_runtime": 17.5093, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 2355 }, { "epoch": 0.6068841163022829, "grad_norm": 0.16671735189095732, "learning_rate": 4.0149021507828224e-05, "loss": 0.4095, "step": 2356 }, { "epoch": 0.6071417071835657, "grad_norm": 0.17378346582878013, "learning_rate": 4.01049370920846e-05, "loss": 0.3777, "step": 2357 }, { "epoch": 0.6073992980648485, "grad_norm": 0.12070700699832426, "learning_rate": 4.006086068059943e-05, "loss": 0.3213, "step": 2358 }, { "epoch": 0.6076568889461313, "grad_norm": 0.16891870723656224, "learning_rate": 4.00167923090268e-05, "loss": 0.3578, "step": 2359 }, { "epoch": 0.6079144798274141, "grad_norm": 0.1308638140610988, "learning_rate": 3.9972732013014206e-05, "loss": 0.3198, "step": 2360 }, { "epoch": 0.6079144798274141, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.820848611838659, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.4169921875, "eval_runtime": 17.5358, "eval_samples_per_second": 2.509, "eval_steps_per_second": 0.171, "step": 2360 }, { "epoch": 0.6081720707086969, "grad_norm": 0.1317729555391042, "learning_rate": 3.992867982820268e-05, "loss": 0.3508, "step": 2361 }, { "epoch": 0.6084296615899797, "grad_norm": 0.1767411732431218, "learning_rate": 3.988463579022666e-05, "loss": 0.4106, "step": 2362 }, { "epoch": 0.6086872524712625, "grad_norm": 0.18155428167496843, "learning_rate": 3.984059993471399e-05, "loss": 0.4019, "step": 2363 }, { "epoch": 0.6089448433525453, "grad_norm": 0.19324560638494176, "learning_rate": 3.9796572297285926e-05, "loss": 0.51, "step": 2364 }, { "epoch": 0.6092024342338281, "grad_norm": 0.17087083249532514, "learning_rate": 3.9752552913557036e-05, "loss": 0.367, "step": 2365 }, { "epoch": 0.6092024342338281, "eval_PRM Accuracy": 0.7735849056603774, "eval_PRM F1": 0.8536585365853658, "eval_PRM F1 AUC": 0.6825563122053432, "eval_PRM F1 AUC (fixed)": 0.817967522262965, "eval_PRM F1 Neg": 0.5, "eval_PRM NPV": 0.48, "eval_PRM Precision": 0.8641975308641975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.41432884335517883, "eval_runtime": 17.0782, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 2365 }, { "epoch": 0.6094600251151109, "grad_norm": 0.15022774199433786, "learning_rate": 3.970854181913526e-05, "loss": 0.4312, "step": 2366 }, { "epoch": 0.6097176159963937, "grad_norm": 0.14147350650677862, "learning_rate": 3.966453904962176e-05, "loss": 0.2885, "step": 2367 }, { "epoch": 0.6099752068776765, "grad_norm": 0.1900434964583597, "learning_rate": 3.962054464061106e-05, "loss": 0.4551, "step": 2368 }, { "epoch": 0.6102327977589593, "grad_norm": 0.14243337413848095, "learning_rate": 3.9576558627690826e-05, "loss": 0.3873, "step": 2369 }, { "epoch": 0.6104903886402422, "grad_norm": 0.14661969644213976, "learning_rate": 3.9532581046442e-05, "loss": 0.2973, "step": 2370 }, { "epoch": 0.6104903886402422, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.874251497005988, "eval_PRM F1 AUC": 0.7006286013619696, "eval_PRM F1 AUC (fixed)": 0.8260869565217391, "eval_PRM F1 Neg": 0.5333333333333333, "eval_PRM NPV": 0.5454545454545454, "eval_PRM Precision": 0.8690476190476191, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.40731534361839294, "eval_runtime": 17.0664, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 2370 }, { "epoch": 0.6107479795215249, "grad_norm": 0.11402039346775396, "learning_rate": 3.9488611932438666e-05, "loss": 0.3182, "step": 2371 }, { "epoch": 0.6110055704028078, "grad_norm": 0.15915651498180694, "learning_rate": 3.944465132124807e-05, "loss": 0.3995, "step": 2372 }, { "epoch": 0.6112631612840905, "grad_norm": 0.13158790616500857, "learning_rate": 3.94006992484306e-05, "loss": 0.2991, "step": 2373 }, { "epoch": 0.6115207521653734, "grad_norm": 0.11553152695883866, "learning_rate": 3.93567557495397e-05, "loss": 0.3199, "step": 2374 }, { "epoch": 0.6117783430466561, "grad_norm": 0.20815237796381744, "learning_rate": 3.931282086012191e-05, "loss": 0.4048, "step": 2375 }, { "epoch": 0.6117783430466561, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8757396449704142, "eval_PRM F1 AUC": 0.6849135673127291, "eval_PRM F1 AUC (fixed)": 0.820062860136197, "eval_PRM F1 Neg": 0.5116279069767442, "eval_PRM NPV": 0.55, "eval_PRM Precision": 0.8604651162790697, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.4189896881580353, "eval_runtime": 17.2565, "eval_samples_per_second": 2.55, "eval_steps_per_second": 0.174, "step": 2375 }, { "epoch": 0.612035933927939, "grad_norm": 0.11404295721713555, "learning_rate": 3.9268894615716804e-05, "loss": 0.2881, "step": 2376 }, { "epoch": 0.6122935248092217, "grad_norm": 0.1531556969722233, "learning_rate": 3.9224977051856904e-05, "loss": 0.446, "step": 2377 }, { "epoch": 0.6125511156905046, "grad_norm": 0.13607225651561186, "learning_rate": 3.918106820406782e-05, "loss": 0.2904, "step": 2378 }, { "epoch": 0.6128087065717873, "grad_norm": 0.1830553290422174, "learning_rate": 3.9137168107867994e-05, "loss": 0.4065, "step": 2379 }, { "epoch": 0.6130662974530702, "grad_norm": 0.1357494360307605, "learning_rate": 3.909327679876888e-05, "loss": 0.3653, "step": 2380 }, { "epoch": 0.6130662974530702, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8823529411764706, "eval_PRM F1 AUC": 0.6909376636982714, "eval_PRM F1 AUC (fixed)": 0.821634363541121, "eval_PRM F1 Neg": 0.5238095238095238, "eval_PRM NPV": 0.5789473684210527, "eval_PRM Precision": 0.8620689655172413, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.41317471861839294, "eval_runtime": 16.8684, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 2380 }, { "epoch": 0.6133238883343529, "grad_norm": 0.19432163887414694, "learning_rate": 3.9049394312274765e-05, "loss": 0.3545, "step": 2381 }, { "epoch": 0.6135814792156358, "grad_norm": 0.143143247958846, "learning_rate": 3.9005520683882854e-05, "loss": 0.3856, "step": 2382 }, { "epoch": 0.6138390700969185, "grad_norm": 0.13596461157727238, "learning_rate": 3.896165594908313e-05, "loss": 0.3579, "step": 2383 }, { "epoch": 0.6140966609782014, "grad_norm": 0.18731344597012275, "learning_rate": 3.8917800143358404e-05, "loss": 0.4522, "step": 2384 }, { "epoch": 0.6143542518594842, "grad_norm": 0.19021340220262192, "learning_rate": 3.887395330218429e-05, "loss": 0.3945, "step": 2385 }, { "epoch": 0.6143542518594842, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8205866946045051, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3953302502632141, "eval_runtime": 17.6129, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 2385 }, { "epoch": 0.614611842740767, "grad_norm": 0.1611457927631445, "learning_rate": 3.883011546102909e-05, "loss": 0.3255, "step": 2386 }, { "epoch": 0.6148694336220498, "grad_norm": 0.17976558652728208, "learning_rate": 3.878628665535392e-05, "loss": 0.3647, "step": 2387 }, { "epoch": 0.6151270245033326, "grad_norm": 0.18633645755451828, "learning_rate": 3.874246692061246e-05, "loss": 0.3515, "step": 2388 }, { "epoch": 0.6153846153846154, "grad_norm": 0.1476256519035803, "learning_rate": 3.869865629225119e-05, "loss": 0.3342, "step": 2389 }, { "epoch": 0.6156422062658982, "grad_norm": 0.13511375655045682, "learning_rate": 3.865485480570912e-05, "loss": 0.3907, "step": 2390 }, { "epoch": 0.6156422062658982, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8809523809523809, "eval_PRM F1 AUC": 0.7066526977475118, "eval_PRM F1 AUC (fixed)": 0.8190151911995809, "eval_PRM F1 Neg": 0.5454545454545454, "eval_PRM NPV": 0.5714285714285714, "eval_PRM Precision": 0.8705882352941177, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.40305396914482117, "eval_runtime": 16.8874, "eval_samples_per_second": 2.605, "eval_steps_per_second": 0.178, "step": 2390 }, { "epoch": 0.615899797147181, "grad_norm": 0.1454825346465254, "learning_rate": 3.861106249641789e-05, "loss": 0.3343, "step": 2391 }, { "epoch": 0.6161573880284638, "grad_norm": 0.15286212775344593, "learning_rate": 3.856727939980176e-05, "loss": 0.4346, "step": 2392 }, { "epoch": 0.6164149789097466, "grad_norm": 0.13970371113977845, "learning_rate": 3.852350555127748e-05, "loss": 0.3177, "step": 2393 }, { "epoch": 0.6166725697910294, "grad_norm": 0.19705685890823973, "learning_rate": 3.8479740986254365e-05, "loss": 0.356, "step": 2394 }, { "epoch": 0.6169301606723122, "grad_norm": 0.2535529334088201, "learning_rate": 3.843598574013418e-05, "loss": 0.4189, "step": 2395 }, { "epoch": 0.6169301606723122, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8276584599266632, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.412109375, "eval_runtime": 17.4744, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 2395 }, { "epoch": 0.617187751553595, "grad_norm": 0.18794186191451187, "learning_rate": 3.839223984831119e-05, "loss": 0.4021, "step": 2396 }, { "epoch": 0.6174453424348778, "grad_norm": 0.14441165243612405, "learning_rate": 3.8348503346172074e-05, "loss": 0.3452, "step": 2397 }, { "epoch": 0.6177029333161607, "grad_norm": 0.23925161516194815, "learning_rate": 3.830477626909589e-05, "loss": 0.4133, "step": 2398 }, { "epoch": 0.6179605241974434, "grad_norm": 0.17828211742232414, "learning_rate": 3.826105865245414e-05, "loss": 0.3388, "step": 2399 }, { "epoch": 0.6182181150787263, "grad_norm": 0.13630425549357833, "learning_rate": 3.82173505316106e-05, "loss": 0.3799, "step": 2400 }, { "epoch": 0.6182181150787263, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8901734104046243, "eval_PRM F1 AUC": 0.6812467260345731, "eval_PRM F1 AUC (fixed)": 0.8389209009952855, "eval_PRM F1 Neg": 0.5128205128205128, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.8555555555555555, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.43478260869565216, "eval_loss": 0.4106889069080353, "eval_runtime": 16.5579, "eval_samples_per_second": 2.657, "eval_steps_per_second": 0.181, "step": 2400 }, { "epoch": 0.618475705960009, "grad_norm": 0.13869335502670038, "learning_rate": 3.81736519419214e-05, "loss": 0.346, "step": 2401 }, { "epoch": 0.6187332968412919, "grad_norm": 0.21401245288632476, "learning_rate": 3.812996291873496e-05, "loss": 0.4715, "step": 2402 }, { "epoch": 0.6189908877225746, "grad_norm": 0.1699494837457687, "learning_rate": 3.808628349739198e-05, "loss": 0.3264, "step": 2403 }, { "epoch": 0.6192484786038575, "grad_norm": 0.12204448338944414, "learning_rate": 3.8042613713225346e-05, "loss": 0.3131, "step": 2404 }, { "epoch": 0.6195060694851402, "grad_norm": 0.1295816329473272, "learning_rate": 3.7998953601560175e-05, "loss": 0.3065, "step": 2405 }, { "epoch": 0.6195060694851402, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8888888888888888, "eval_PRM F1 AUC": 0.6969617600838135, "eval_PRM F1 AUC (fixed)": 0.8381351492928236, "eval_PRM F1 Neg": 0.5365853658536586, "eval_PRM NPV": 0.6111111111111112, "eval_PRM Precision": 0.8636363636363636, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.4782608695652174, "eval_loss": 0.3964399993419647, "eval_runtime": 17.0733, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 2405 }, { "epoch": 0.619763660366423, "grad_norm": 0.12782589842749065, "learning_rate": 3.7955303197713774e-05, "loss": 0.2942, "step": 2406 }, { "epoch": 0.6200212512477058, "grad_norm": 0.22347031911550472, "learning_rate": 3.791166253699555e-05, "loss": 0.3996, "step": 2407 }, { "epoch": 0.6202788421289887, "grad_norm": 0.15465719210193768, "learning_rate": 3.7868031654707105e-05, "loss": 0.3739, "step": 2408 }, { "epoch": 0.6205364330102714, "grad_norm": 0.15084946354307485, "learning_rate": 3.782441058614203e-05, "loss": 0.3447, "step": 2409 }, { "epoch": 0.6207940238915542, "grad_norm": 0.14473470469746796, "learning_rate": 3.778079936658611e-05, "loss": 0.3595, "step": 2410 }, { "epoch": 0.6207940238915542, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 AUC (fixed)": 0.8273965426925091, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3949751555919647, "eval_runtime": 17.4771, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 2410 }, { "epoch": 0.621051614772837, "grad_norm": 0.19841184109055246, "learning_rate": 3.773719803131702e-05, "loss": 0.2876, "step": 2411 }, { "epoch": 0.6213092056541198, "grad_norm": 0.18140941867294844, "learning_rate": 3.769360661560453e-05, "loss": 0.3564, "step": 2412 }, { "epoch": 0.6215667965354027, "grad_norm": 0.14336788233772046, "learning_rate": 3.765002515471035e-05, "loss": 0.38, "step": 2413 }, { "epoch": 0.6218243874166854, "grad_norm": 0.16433034958269993, "learning_rate": 3.760645368388817e-05, "loss": 0.4335, "step": 2414 }, { "epoch": 0.6220819782979683, "grad_norm": 0.130249698037053, "learning_rate": 3.7562892238383576e-05, "loss": 0.3519, "step": 2415 }, { "epoch": 0.6220819782979683, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 AUC (fixed)": 0.8349921424829754, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.38991478085517883, "eval_runtime": 16.4684, "eval_samples_per_second": 2.672, "eval_steps_per_second": 0.182, "step": 2415 }, { "epoch": 0.622339569179251, "grad_norm": 0.1691572313466575, "learning_rate": 3.7519340853434044e-05, "loss": 0.385, "step": 2416 }, { "epoch": 0.6225971600605339, "grad_norm": 0.3209029787796321, "learning_rate": 3.747579956426888e-05, "loss": 0.483, "step": 2417 }, { "epoch": 0.6228547509418166, "grad_norm": 0.14144139932379493, "learning_rate": 3.7432268406109326e-05, "loss": 0.3275, "step": 2418 }, { "epoch": 0.6231123418230995, "grad_norm": 0.17592595116774362, "learning_rate": 3.73887474141683e-05, "loss": 0.355, "step": 2419 }, { "epoch": 0.6233699327043822, "grad_norm": 0.1516450321416382, "learning_rate": 3.734523662365059e-05, "loss": 0.417, "step": 2420 }, { "epoch": 0.6233699327043822, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9036144578313253, "eval_PRM F1 AUC": 0.7778941854374019, "eval_PRM F1 AUC (fixed)": 0.8376113148245155, "eval_PRM F1 Neg": 0.6521739130434783, "eval_PRM NPV": 0.6521739130434783, "eval_PRM Precision": 0.9036144578313253, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.37863990664482117, "eval_runtime": 17.5193, "eval_samples_per_second": 2.512, "eval_steps_per_second": 0.171, "step": 2420 }, { "epoch": 0.6236275235856651, "grad_norm": 0.19136966587799933, "learning_rate": 3.730173606975268e-05, "loss": 0.4759, "step": 2421 }, { "epoch": 0.6238851144669478, "grad_norm": 0.16603655661634564, "learning_rate": 3.725824578766281e-05, "loss": 0.355, "step": 2422 }, { "epoch": 0.6241427053482307, "grad_norm": 0.2053708825957282, "learning_rate": 3.721476581256089e-05, "loss": 0.3731, "step": 2423 }, { "epoch": 0.6244002962295134, "grad_norm": 0.18248176347253492, "learning_rate": 3.7171296179618476e-05, "loss": 0.34, "step": 2424 }, { "epoch": 0.6246578871107963, "grad_norm": 0.12733024912347352, "learning_rate": 3.712783692399881e-05, "loss": 0.3072, "step": 2425 }, { "epoch": 0.6246578871107963, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 AUC (fixed)": 0.8404924044002094, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3765092194080353, "eval_runtime": 17.0684, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 2425 }, { "epoch": 0.624915477992079, "grad_norm": 0.1621235773141948, "learning_rate": 3.708438808085668e-05, "loss": 0.2946, "step": 2426 }, { "epoch": 0.6251730688733619, "grad_norm": 0.15820404950724934, "learning_rate": 3.704094968533852e-05, "loss": 0.3633, "step": 2427 }, { "epoch": 0.6254306597546447, "grad_norm": 0.15525345620753025, "learning_rate": 3.69975217725822e-05, "loss": 0.3775, "step": 2428 }, { "epoch": 0.6256882506359275, "grad_norm": 0.13987459511490624, "learning_rate": 3.695410437771727e-05, "loss": 0.313, "step": 2429 }, { "epoch": 0.6259458415172103, "grad_norm": 0.16656774734893298, "learning_rate": 3.691069753586462e-05, "loss": 0.3671, "step": 2430 }, { "epoch": 0.6259458415172103, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.8459926663174437, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3775745630264282, "eval_runtime": 17.0016, "eval_samples_per_second": 2.588, "eval_steps_per_second": 0.176, "step": 2430 }, { "epoch": 0.6262034323984931, "grad_norm": 0.12236490588156322, "learning_rate": 3.686730128213668e-05, "loss": 0.2818, "step": 2431 }, { "epoch": 0.6264610232797759, "grad_norm": 0.1527398652229691, "learning_rate": 3.682391565163732e-05, "loss": 0.3281, "step": 2432 }, { "epoch": 0.6267186141610587, "grad_norm": 0.15293359843564117, "learning_rate": 3.6780540679461784e-05, "loss": 0.3706, "step": 2433 }, { "epoch": 0.6269762050423415, "grad_norm": 0.16229893172953397, "learning_rate": 3.673717640069672e-05, "loss": 0.3909, "step": 2434 }, { "epoch": 0.6272337959236243, "grad_norm": 0.14385377128288312, "learning_rate": 3.669382285042011e-05, "loss": 0.2975, "step": 2435 }, { "epoch": 0.6272337959236243, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.8483499214248297, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3722034692764282, "eval_runtime": 16.9658, "eval_samples_per_second": 2.593, "eval_steps_per_second": 0.177, "step": 2435 }, { "epoch": 0.6274913868049071, "grad_norm": 0.14195669348417514, "learning_rate": 3.6650480063701265e-05, "loss": 0.3913, "step": 2436 }, { "epoch": 0.6277489776861899, "grad_norm": 0.1711043094421518, "learning_rate": 3.66071480756008e-05, "loss": 0.4659, "step": 2437 }, { "epoch": 0.6280065685674727, "grad_norm": 0.15588465134278923, "learning_rate": 3.6563826921170544e-05, "loss": 0.3509, "step": 2438 }, { "epoch": 0.6282641594487555, "grad_norm": 0.18307559032814893, "learning_rate": 3.652051663545366e-05, "loss": 0.4066, "step": 2439 }, { "epoch": 0.6285217503300383, "grad_norm": 0.16824615853320427, "learning_rate": 3.64772172534844e-05, "loss": 0.2902, "step": 2440 }, { "epoch": 0.6285217503300383, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.8504452592980618, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3701171875, "eval_runtime": 17.5261, "eval_samples_per_second": 2.511, "eval_steps_per_second": 0.171, "step": 2440 }, { "epoch": 0.6287793412113212, "grad_norm": 0.15941201118061468, "learning_rate": 3.643392881028829e-05, "loss": 0.384, "step": 2441 }, { "epoch": 0.6290369320926039, "grad_norm": 0.1481415780534842, "learning_rate": 3.639065134088196e-05, "loss": 0.3438, "step": 2442 }, { "epoch": 0.6292945229738868, "grad_norm": 0.13971340614909494, "learning_rate": 3.63473848802732e-05, "loss": 0.3288, "step": 2443 }, { "epoch": 0.6295521138551695, "grad_norm": 0.19468720322757044, "learning_rate": 3.630412946346084e-05, "loss": 0.4081, "step": 2444 }, { "epoch": 0.6298097047364524, "grad_norm": 0.14912771442970982, "learning_rate": 3.6260885125434815e-05, "loss": 0.3622, "step": 2445 }, { "epoch": 0.6298097047364524, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 AUC (fixed)": 0.8493975903614458, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3699840307235718, "eval_runtime": 16.9876, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 2445 }, { "epoch": 0.6300672956177351, "grad_norm": 0.19585779447466803, "learning_rate": 3.621765190117612e-05, "loss": 0.4418, "step": 2446 }, { "epoch": 0.630324886499018, "grad_norm": 0.15398334378027992, "learning_rate": 3.6174429825656685e-05, "loss": 0.2998, "step": 2447 }, { "epoch": 0.6305824773803007, "grad_norm": 0.18073986802135503, "learning_rate": 3.613121893383952e-05, "loss": 0.4453, "step": 2448 }, { "epoch": 0.6308400682615836, "grad_norm": 0.21775943023545297, "learning_rate": 3.6088019260678465e-05, "loss": 0.4535, "step": 2449 }, { "epoch": 0.6310976591428663, "grad_norm": 0.19220132536823256, "learning_rate": 3.6044830841118434e-05, "loss": 0.285, "step": 2450 }, { "epoch": 0.6310976591428663, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.855683603981142, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3622603118419647, "eval_runtime": 17.0728, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 2450 }, { "epoch": 0.6313552500241492, "grad_norm": 0.12850460632582075, "learning_rate": 3.600165371009511e-05, "loss": 0.2786, "step": 2451 }, { "epoch": 0.6316128409054319, "grad_norm": 0.17613917177631971, "learning_rate": 3.59584879025351e-05, "loss": 0.4074, "step": 2452 }, { "epoch": 0.6318704317867148, "grad_norm": 0.14661266019960154, "learning_rate": 3.591533345335587e-05, "loss": 0.3353, "step": 2453 }, { "epoch": 0.6321280226679975, "grad_norm": 0.13134303722339521, "learning_rate": 3.587219039746564e-05, "loss": 0.3593, "step": 2454 }, { "epoch": 0.6323856135492804, "grad_norm": 0.18462412448019225, "learning_rate": 3.5829058769763475e-05, "loss": 0.3275, "step": 2455 }, { "epoch": 0.6323856135492804, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 AUC (fixed)": 0.858040859088528, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.36581143736839294, "eval_runtime": 16.937, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 2455 }, { "epoch": 0.6326432044305632, "grad_norm": 0.17257292064812652, "learning_rate": 3.5785938605139145e-05, "loss": 0.3864, "step": 2456 }, { "epoch": 0.632900795311846, "grad_norm": 0.1569296924716655, "learning_rate": 3.57428299384732e-05, "loss": 0.4272, "step": 2457 }, { "epoch": 0.6331583861931288, "grad_norm": 0.13782728055888355, "learning_rate": 3.569973280463684e-05, "loss": 0.333, "step": 2458 }, { "epoch": 0.6334159770744116, "grad_norm": 0.2277672956516817, "learning_rate": 3.565664723849195e-05, "loss": 0.439, "step": 2459 }, { "epoch": 0.6336735679556944, "grad_norm": 0.16675031645959432, "learning_rate": 3.561357327489108e-05, "loss": 0.2939, "step": 2460 }, { "epoch": 0.6336735679556944, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8941176470588236, "eval_PRM F1 AUC": 0.7187008905185961, "eval_PRM F1 AUC (fixed)": 0.8546359350445258, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.631578947368421, "eval_PRM Precision": 0.8735632183908046, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.3665216565132141, "eval_runtime": 17.0327, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 2460 }, { "epoch": 0.6339311588369771, "grad_norm": 0.12459223290713027, "learning_rate": 3.557051094867735e-05, "loss": 0.2948, "step": 2461 }, { "epoch": 0.63418874971826, "grad_norm": 0.1423469842293259, "learning_rate": 3.552746029468452e-05, "loss": 0.3972, "step": 2462 }, { "epoch": 0.6344463405995427, "grad_norm": 0.1843782731483223, "learning_rate": 3.5484421347736874e-05, "loss": 0.3366, "step": 2463 }, { "epoch": 0.6347039314808256, "grad_norm": 0.15991191460921128, "learning_rate": 3.5441394142649245e-05, "loss": 0.3603, "step": 2464 }, { "epoch": 0.6349615223621083, "grad_norm": 0.16679660401059462, "learning_rate": 3.5398378714226946e-05, "loss": 0.3868, "step": 2465 }, { "epoch": 0.6349615223621083, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.9005847953216374, "eval_PRM F1 AUC": 0.7247249869041383, "eval_PRM F1 AUC (fixed)": 0.8588266107909901, "eval_PRM F1 Neg": 0.5853658536585366, "eval_PRM NPV": 0.6666666666666666, "eval_PRM Precision": 0.875, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5217391304347826, "eval_loss": 0.36843040585517883, "eval_runtime": 16.8694, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 2465 }, { "epoch": 0.6352191132433912, "grad_norm": 0.18915726926721044, "learning_rate": 3.535537509726575e-05, "loss": 0.3844, "step": 2466 }, { "epoch": 0.6354767041246739, "grad_norm": 0.1617886697675632, "learning_rate": 3.531238332655197e-05, "loss": 0.294, "step": 2467 }, { "epoch": 0.6357342950059568, "grad_norm": 0.1838773212150472, "learning_rate": 3.5269403436862175e-05, "loss": 0.3225, "step": 2468 }, { "epoch": 0.6359918858872395, "grad_norm": 0.20907038325245178, "learning_rate": 3.5226435462963504e-05, "loss": 0.314, "step": 2469 }, { "epoch": 0.6362494767685224, "grad_norm": 0.24405684396483357, "learning_rate": 3.518347943961331e-05, "loss": 0.4034, "step": 2470 }, { "epoch": 0.6362494767685224, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.858302776322682, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.36319246888160706, "eval_runtime": 17.5333, "eval_samples_per_second": 2.51, "eval_steps_per_second": 0.171, "step": 2470 }, { "epoch": 0.6365070676498052, "grad_norm": 0.18978304088865044, "learning_rate": 3.5140535401559336e-05, "loss": 0.4053, "step": 2471 }, { "epoch": 0.636764658531088, "grad_norm": 0.12154912178567832, "learning_rate": 3.509760338353967e-05, "loss": 0.3001, "step": 2472 }, { "epoch": 0.6370222494123708, "grad_norm": 0.14639788033094533, "learning_rate": 3.5054683420282605e-05, "loss": 0.3305, "step": 2473 }, { "epoch": 0.6372798402936536, "grad_norm": 0.17426631388467265, "learning_rate": 3.5011775546506736e-05, "loss": 0.4327, "step": 2474 }, { "epoch": 0.6375374311749364, "grad_norm": 0.18550190630188318, "learning_rate": 3.496887979692084e-05, "loss": 0.4209, "step": 2475 }, { "epoch": 0.6375374311749364, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8501833420639079, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3565784692764282, "eval_runtime": 16.9846, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 2475 }, { "epoch": 0.6377950220562192, "grad_norm": 0.19721703746705196, "learning_rate": 3.492599620622392e-05, "loss": 0.3477, "step": 2476 }, { "epoch": 0.638052612937502, "grad_norm": 0.1553088976127993, "learning_rate": 3.488312480910514e-05, "loss": 0.2938, "step": 2477 }, { "epoch": 0.6383102038187848, "grad_norm": 0.1360575047069072, "learning_rate": 3.484026564024373e-05, "loss": 0.3407, "step": 2478 }, { "epoch": 0.6385677947000676, "grad_norm": 0.21361931804260326, "learning_rate": 3.479741873430917e-05, "loss": 0.4115, "step": 2479 }, { "epoch": 0.6388253855813504, "grad_norm": 0.15468757231204278, "learning_rate": 3.4754584125960864e-05, "loss": 0.3112, "step": 2480 }, { "epoch": 0.6388253855813504, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8467784180199057, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.36305931210517883, "eval_runtime": 17.1046, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 2480 }, { "epoch": 0.6390829764626332, "grad_norm": 0.1495308777069929, "learning_rate": 3.471176184984839e-05, "loss": 0.3673, "step": 2481 }, { "epoch": 0.639340567343916, "grad_norm": 0.14968331179907596, "learning_rate": 3.466895194061128e-05, "loss": 0.3066, "step": 2482 }, { "epoch": 0.6395981582251988, "grad_norm": 0.22761623239442078, "learning_rate": 3.462615443287909e-05, "loss": 0.3957, "step": 2483 }, { "epoch": 0.6398557491064817, "grad_norm": 0.14780407170317722, "learning_rate": 3.458336936127134e-05, "loss": 0.3565, "step": 2484 }, { "epoch": 0.6401133399877644, "grad_norm": 0.16277120545258716, "learning_rate": 3.4540596760397484e-05, "loss": 0.3883, "step": 2485 }, { "epoch": 0.6401133399877644, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.8452069146149817, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.37033912539482117, "eval_runtime": 16.8255, "eval_samples_per_second": 2.615, "eval_steps_per_second": 0.178, "step": 2485 }, { "epoch": 0.6403709308690473, "grad_norm": 0.16935247016016258, "learning_rate": 3.449783666485691e-05, "loss": 0.4021, "step": 2486 }, { "epoch": 0.64062852175033, "grad_norm": 0.14878556083839845, "learning_rate": 3.4455089109238835e-05, "loss": 0.3479, "step": 2487 }, { "epoch": 0.6408861126316129, "grad_norm": 0.22207223552251215, "learning_rate": 3.4412354128122424e-05, "loss": 0.4185, "step": 2488 }, { "epoch": 0.6411437035128956, "grad_norm": 0.12561016373143336, "learning_rate": 3.436963175607656e-05, "loss": 0.3105, "step": 2489 }, { "epoch": 0.6414012943941785, "grad_norm": 0.1504741636653908, "learning_rate": 3.4326922027660036e-05, "loss": 0.3924, "step": 2490 }, { "epoch": 0.6414012943941785, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8431115767417496, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3628373444080353, "eval_runtime": 17.2019, "eval_samples_per_second": 2.558, "eval_steps_per_second": 0.174, "step": 2490 }, { "epoch": 0.6416588852754612, "grad_norm": 0.12600048006648018, "learning_rate": 3.428422497742133e-05, "loss": 0.3471, "step": 2491 }, { "epoch": 0.6419164761567441, "grad_norm": 0.14653266088375858, "learning_rate": 3.42415406398987e-05, "loss": 0.3411, "step": 2492 }, { "epoch": 0.6421740670380268, "grad_norm": 0.14251994876680993, "learning_rate": 3.419886904962014e-05, "loss": 0.3597, "step": 2493 }, { "epoch": 0.6424316579193097, "grad_norm": 0.16747605739930146, "learning_rate": 3.4156210241103284e-05, "loss": 0.3475, "step": 2494 }, { "epoch": 0.6426892488005924, "grad_norm": 0.13704030627396535, "learning_rate": 3.411356424885549e-05, "loss": 0.3667, "step": 2495 }, { "epoch": 0.6426892488005924, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 AUC (fixed)": 0.8365636458878994, "eval_PRM F1 Neg": 0.625, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.36026278138160706, "eval_runtime": 16.9453, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 2495 }, { "epoch": 0.6429468396818753, "grad_norm": 0.3215333205805997, "learning_rate": 3.4070931107373675e-05, "loss": 0.3883, "step": 2496 }, { "epoch": 0.643204430563158, "grad_norm": 0.14689143727399998, "learning_rate": 3.402831085114444e-05, "loss": 0.3536, "step": 2497 }, { "epoch": 0.6434620214444409, "grad_norm": 0.22675565527247427, "learning_rate": 3.398570351464391e-05, "loss": 0.5071, "step": 2498 }, { "epoch": 0.6437196123257237, "grad_norm": 0.1408923021693267, "learning_rate": 3.394310913233774e-05, "loss": 0.303, "step": 2499 }, { "epoch": 0.6439772032070065, "grad_norm": 0.15506363825547645, "learning_rate": 3.390052773868116e-05, "loss": 0.3007, "step": 2500 }, { "epoch": 0.6439772032070065, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 AUC (fixed)": 0.8365636458878996, "eval_PRM F1 Neg": 0.625, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3553355932235718, "eval_runtime": 16.5546, "eval_samples_per_second": 2.658, "eval_steps_per_second": 0.181, "step": 2500 }, { "epoch": 0.6442347940882893, "grad_norm": 0.14873657646250013, "learning_rate": 3.3857959368118874e-05, "loss": 0.3583, "step": 2501 }, { "epoch": 0.6444923849695721, "grad_norm": 0.16040972779397752, "learning_rate": 3.3815404055085045e-05, "loss": 0.3418, "step": 2502 }, { "epoch": 0.6447499758508549, "grad_norm": 0.19628354525783215, "learning_rate": 3.377286183400328e-05, "loss": 0.3715, "step": 2503 }, { "epoch": 0.6450075667321377, "grad_norm": 0.23333807996267833, "learning_rate": 3.373033273928659e-05, "loss": 0.4204, "step": 2504 }, { "epoch": 0.6452651576134205, "grad_norm": 0.15238236387599147, "learning_rate": 3.368781680533737e-05, "loss": 0.323, "step": 2505 }, { "epoch": 0.6452651576134205, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8462545835515978, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3501420319080353, "eval_runtime": 16.7055, "eval_samples_per_second": 2.634, "eval_steps_per_second": 0.18, "step": 2505 }, { "epoch": 0.6455227484947033, "grad_norm": 0.154791537795474, "learning_rate": 3.364531406654736e-05, "loss": 0.3445, "step": 2506 }, { "epoch": 0.6457803393759861, "grad_norm": 0.13869050511999345, "learning_rate": 3.3602824557297666e-05, "loss": 0.2986, "step": 2507 }, { "epoch": 0.6460379302572689, "grad_norm": 0.10900705151009309, "learning_rate": 3.356034831195861e-05, "loss": 0.2838, "step": 2508 }, { "epoch": 0.6462955211385517, "grad_norm": 0.16012915495858335, "learning_rate": 3.35178853648899e-05, "loss": 0.3429, "step": 2509 }, { "epoch": 0.6465531120198345, "grad_norm": 0.188822535609594, "learning_rate": 3.3475435750440356e-05, "loss": 0.414, "step": 2510 }, { "epoch": 0.6465531120198345, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8567312729177581, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3461470305919647, "eval_runtime": 17.6969, "eval_samples_per_second": 2.486, "eval_steps_per_second": 0.17, "step": 2510 }, { "epoch": 0.6468107029011173, "grad_norm": 0.1709800133075916, "learning_rate": 3.3432999502948154e-05, "loss": 0.3722, "step": 2511 }, { "epoch": 0.6470682937824, "grad_norm": 0.14942482644257157, "learning_rate": 3.339057665674054e-05, "loss": 0.381, "step": 2512 }, { "epoch": 0.6473258846636829, "grad_norm": 0.17726803328848934, "learning_rate": 3.334816724613394e-05, "loss": 0.3147, "step": 2513 }, { "epoch": 0.6475834755449658, "grad_norm": 0.22306420205756, "learning_rate": 3.330577130543399e-05, "loss": 0.4232, "step": 2514 }, { "epoch": 0.6478410664262485, "grad_norm": 0.13931705972939903, "learning_rate": 3.326338886893534e-05, "loss": 0.309, "step": 2515 }, { "epoch": 0.6478410664262485, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8588266107909901, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3401544690132141, "eval_runtime": 16.8532, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 2515 }, { "epoch": 0.6480986573075314, "grad_norm": 0.20530377006264572, "learning_rate": 3.3221019970921766e-05, "loss": 0.3751, "step": 2516 }, { "epoch": 0.6483562481888141, "grad_norm": 0.17330808956810748, "learning_rate": 3.3178664645666066e-05, "loss": 0.4153, "step": 2517 }, { "epoch": 0.648613839070097, "grad_norm": 0.12881910684658696, "learning_rate": 3.3136322927430086e-05, "loss": 0.3523, "step": 2518 }, { "epoch": 0.6488714299513797, "grad_norm": 0.1374858295452381, "learning_rate": 3.309399485046466e-05, "loss": 0.3593, "step": 2519 }, { "epoch": 0.6491290208326626, "grad_norm": 0.20584361316619515, "learning_rate": 3.3051680449009535e-05, "loss": 0.4538, "step": 2520 }, { "epoch": 0.6491290208326626, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8567312729177581, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34543678164482117, "eval_runtime": 16.8519, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 2520 }, { "epoch": 0.6493866117139453, "grad_norm": 0.14377796745919497, "learning_rate": 3.300937975729347e-05, "loss": 0.3428, "step": 2521 }, { "epoch": 0.6496442025952281, "grad_norm": 0.1522137015431133, "learning_rate": 3.2967092809534083e-05, "loss": 0.3596, "step": 2522 }, { "epoch": 0.6499017934765109, "grad_norm": 0.18118934661681027, "learning_rate": 3.2924819639937924e-05, "loss": 0.427, "step": 2523 }, { "epoch": 0.6501593843577937, "grad_norm": 0.17093884238375687, "learning_rate": 3.2882560282700336e-05, "loss": 0.3756, "step": 2524 }, { "epoch": 0.6504169752390765, "grad_norm": 0.14721751872523076, "learning_rate": 3.284031477200553e-05, "loss": 0.3446, "step": 2525 }, { "epoch": 0.6504169752390765, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8512310110005239, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34872159361839294, "eval_runtime": 16.9321, "eval_samples_per_second": 2.599, "eval_steps_per_second": 0.177, "step": 2525 }, { "epoch": 0.6506745661203593, "grad_norm": 0.14190700115035357, "learning_rate": 3.2798083142026514e-05, "loss": 0.3009, "step": 2526 }, { "epoch": 0.6509321570016421, "grad_norm": 0.16798833482760195, "learning_rate": 3.275586542692504e-05, "loss": 0.3929, "step": 2527 }, { "epoch": 0.6511897478829249, "grad_norm": 0.13038401286059076, "learning_rate": 3.271366166085166e-05, "loss": 0.3491, "step": 2528 }, { "epoch": 0.6514473387642078, "grad_norm": 0.15305136825663915, "learning_rate": 3.267147187794556e-05, "loss": 0.3568, "step": 2529 }, { "epoch": 0.6517049296454905, "grad_norm": 0.1311699769335781, "learning_rate": 3.262929611233471e-05, "loss": 0.2919, "step": 2530 }, { "epoch": 0.6517049296454905, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8470403352540599, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3564453125, "eval_runtime": 17.7648, "eval_samples_per_second": 2.477, "eval_steps_per_second": 0.169, "step": 2530 }, { "epoch": 0.6519625205267734, "grad_norm": 0.18555112501180562, "learning_rate": 3.258713439813566e-05, "loss": 0.4333, "step": 2531 }, { "epoch": 0.6522201114080561, "grad_norm": 0.1432515596280174, "learning_rate": 3.2544986769453616e-05, "loss": 0.3027, "step": 2532 }, { "epoch": 0.652477702289339, "grad_norm": 0.16666607778718331, "learning_rate": 3.2502853260382436e-05, "loss": 0.3986, "step": 2533 }, { "epoch": 0.6527352931706217, "grad_norm": 0.1805640643644997, "learning_rate": 3.246073390500449e-05, "loss": 0.3662, "step": 2534 }, { "epoch": 0.6529928840519046, "grad_norm": 0.15817752408897212, "learning_rate": 3.241862873739075e-05, "loss": 0.3749, "step": 2535 }, { "epoch": 0.6529928840519046, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 AUC (fixed)": 0.8504452592980618, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3546253442764282, "eval_runtime": 17.0846, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 2535 }, { "epoch": 0.6532504749331873, "grad_norm": 0.2069291485258539, "learning_rate": 3.237653779160067e-05, "loss": 0.4628, "step": 2536 }, { "epoch": 0.6535080658144702, "grad_norm": 0.17594609060190622, "learning_rate": 3.2334461101682246e-05, "loss": 0.4072, "step": 2537 }, { "epoch": 0.6537656566957529, "grad_norm": 0.1454335036500637, "learning_rate": 3.229239870167191e-05, "loss": 0.3352, "step": 2538 }, { "epoch": 0.6540232475770358, "grad_norm": 0.1874278194677057, "learning_rate": 3.225035062559452e-05, "loss": 0.3919, "step": 2539 }, { "epoch": 0.6542808384583185, "grad_norm": 0.16750406533288847, "learning_rate": 3.220831690746339e-05, "loss": 0.41, "step": 2540 }, { "epoch": 0.6542808384583185, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 AUC (fixed)": 0.8454688318491357, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3556019067764282, "eval_runtime": 17.665, "eval_samples_per_second": 2.491, "eval_steps_per_second": 0.17, "step": 2540 }, { "epoch": 0.6545384293396014, "grad_norm": 0.16608541292512252, "learning_rate": 3.216629758128018e-05, "loss": 0.3982, "step": 2541 }, { "epoch": 0.6547960202208842, "grad_norm": 0.1763015395163615, "learning_rate": 3.212429268103495e-05, "loss": 0.4252, "step": 2542 }, { "epoch": 0.655053611102167, "grad_norm": 0.12489844211720086, "learning_rate": 3.208230224070605e-05, "loss": 0.2988, "step": 2543 }, { "epoch": 0.6553112019834498, "grad_norm": 0.17351401694461402, "learning_rate": 3.204032629426016e-05, "loss": 0.3988, "step": 2544 }, { "epoch": 0.6555687928647326, "grad_norm": 0.1337855883003999, "learning_rate": 3.199836487565222e-05, "loss": 0.3521, "step": 2545 }, { "epoch": 0.6555687928647326, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 AUC (fixed)": 0.8412781561026715, "eval_PRM F1 Neg": 0.625, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.35946378111839294, "eval_runtime": 16.9641, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 2545 }, { "epoch": 0.6558263837460154, "grad_norm": 0.18725366477704852, "learning_rate": 3.195641801882541e-05, "loss": 0.3138, "step": 2546 }, { "epoch": 0.6560839746272982, "grad_norm": 0.24688665103473245, "learning_rate": 3.191448575771119e-05, "loss": 0.4933, "step": 2547 }, { "epoch": 0.656341565508581, "grad_norm": 0.14498573625614256, "learning_rate": 3.1872568126229095e-05, "loss": 0.3223, "step": 2548 }, { "epoch": 0.6565991563898638, "grad_norm": 0.13504588754413635, "learning_rate": 3.1830665158286976e-05, "loss": 0.3042, "step": 2549 }, { "epoch": 0.6568567472711466, "grad_norm": 0.122929927826042, "learning_rate": 3.1788776887780684e-05, "loss": 0.3023, "step": 2550 }, { "epoch": 0.6568567472711466, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.896969696969697, "eval_PRM F1 AUC": 0.7718700890518595, "eval_PRM F1 AUC (fixed)": 0.8452069146149817, "eval_PRM F1 Neg": 0.6382978723404256, "eval_PRM NPV": 0.625, "eval_PRM Precision": 0.9024390243902439, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3597301244735718, "eval_runtime": 17.1128, "eval_samples_per_second": 2.571, "eval_steps_per_second": 0.175, "step": 2550 }, { "epoch": 0.6571143381524294, "grad_norm": 0.12923353371719942, "learning_rate": 3.17469033485943e-05, "loss": 0.3137, "step": 2551 }, { "epoch": 0.6573719290337122, "grad_norm": 0.16529377522823094, "learning_rate": 3.170504457459989e-05, "loss": 0.3606, "step": 2552 }, { "epoch": 0.657629519914995, "grad_norm": 0.12628829466835872, "learning_rate": 3.166320059965762e-05, "loss": 0.3095, "step": 2553 }, { "epoch": 0.6578871107962778, "grad_norm": 0.16930794155717083, "learning_rate": 3.16213714576157e-05, "loss": 0.3127, "step": 2554 }, { "epoch": 0.6581447016775606, "grad_norm": 0.11479473280686057, "learning_rate": 3.15795571823103e-05, "loss": 0.2792, "step": 2555 }, { "epoch": 0.6581447016775606, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8525405971712938, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3607066869735718, "eval_runtime": 17.3594, "eval_samples_per_second": 2.535, "eval_steps_per_second": 0.173, "step": 2555 }, { "epoch": 0.6584022925588434, "grad_norm": 0.1387933607014311, "learning_rate": 3.1537757807565614e-05, "loss": 0.2783, "step": 2556 }, { "epoch": 0.6586598834401263, "grad_norm": 0.1477684610839945, "learning_rate": 3.1495973367193734e-05, "loss": 0.3637, "step": 2557 }, { "epoch": 0.658917474321409, "grad_norm": 0.15011071090661027, "learning_rate": 3.1454203894994713e-05, "loss": 0.2746, "step": 2558 }, { "epoch": 0.6591750652026919, "grad_norm": 0.14828228800010632, "learning_rate": 3.1412449424756474e-05, "loss": 0.3308, "step": 2559 }, { "epoch": 0.6594326560839746, "grad_norm": 0.20438333584587137, "learning_rate": 3.1370709990254786e-05, "loss": 0.3942, "step": 2560 }, { "epoch": 0.6594326560839746, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 AUC (fixed)": 0.8598742797276061, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3662553131580353, "eval_runtime": 17.0899, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 2560 }, { "epoch": 0.6596902469652575, "grad_norm": 0.2516696310753756, "learning_rate": 3.1328985625253304e-05, "loss": 0.4709, "step": 2561 }, { "epoch": 0.6599478378465402, "grad_norm": 0.16598887701829515, "learning_rate": 3.1287276363503446e-05, "loss": 0.3714, "step": 2562 }, { "epoch": 0.6602054287278231, "grad_norm": 0.1591790676833675, "learning_rate": 3.1245582238744444e-05, "loss": 0.3606, "step": 2563 }, { "epoch": 0.6604630196091058, "grad_norm": 0.14624376218522936, "learning_rate": 3.120390328470326e-05, "loss": 0.3444, "step": 2564 }, { "epoch": 0.6607206104903887, "grad_norm": 0.17024500235389717, "learning_rate": 3.116223953509463e-05, "loss": 0.3374, "step": 2565 }, { "epoch": 0.6607206104903887, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8619696176008382, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3558238744735718, "eval_runtime": 17.573, "eval_samples_per_second": 2.504, "eval_steps_per_second": 0.171, "step": 2565 }, { "epoch": 0.6609782013716714, "grad_norm": 0.16071851788388838, "learning_rate": 3.112059102362093e-05, "loss": 0.4286, "step": 2566 }, { "epoch": 0.6612357922529543, "grad_norm": 0.17033435391975124, "learning_rate": 3.107895778397224e-05, "loss": 0.4324, "step": 2567 }, { "epoch": 0.661493383134237, "grad_norm": 0.16323632109513192, "learning_rate": 3.1037339849826315e-05, "loss": 0.3228, "step": 2568 }, { "epoch": 0.6617509740155199, "grad_norm": 0.2536498211462177, "learning_rate": 3.099573725484844e-05, "loss": 0.4613, "step": 2569 }, { "epoch": 0.6620085648968026, "grad_norm": 0.16031947266740823, "learning_rate": 3.095415003269163e-05, "loss": 0.3737, "step": 2570 }, { "epoch": 0.6620085648968026, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3516956567764282, "eval_runtime": 17.0658, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 2570 }, { "epoch": 0.6622661557780855, "grad_norm": 0.12609206435852544, "learning_rate": 3.0912578216996315e-05, "loss": 0.2846, "step": 2571 }, { "epoch": 0.6625237466593683, "grad_norm": 0.16046671530905887, "learning_rate": 3.087102184139059e-05, "loss": 0.3817, "step": 2572 }, { "epoch": 0.662781337540651, "grad_norm": 0.17389660168352186, "learning_rate": 3.082948093948997e-05, "loss": 0.4318, "step": 2573 }, { "epoch": 0.6630389284219339, "grad_norm": 0.14324737030946294, "learning_rate": 3.078795554489748e-05, "loss": 0.3111, "step": 2574 }, { "epoch": 0.6632965193032166, "grad_norm": 0.14173912099647726, "learning_rate": 3.074644569120364e-05, "loss": 0.3851, "step": 2575 }, { "epoch": 0.6632965193032166, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.856993190151912, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35391512513160706, "eval_runtime": 17.0289, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 2575 }, { "epoch": 0.6635541101844995, "grad_norm": 0.11450529030492015, "learning_rate": 3.070495141198634e-05, "loss": 0.3292, "step": 2576 }, { "epoch": 0.6638117010657822, "grad_norm": 0.16428345459596733, "learning_rate": 3.066347274081091e-05, "loss": 0.403, "step": 2577 }, { "epoch": 0.6640692919470651, "grad_norm": 0.12045040511375114, "learning_rate": 3.0622009711230036e-05, "loss": 0.3525, "step": 2578 }, { "epoch": 0.6643268828283478, "grad_norm": 0.12680063256725685, "learning_rate": 3.058056235678378e-05, "loss": 0.3788, "step": 2579 }, { "epoch": 0.6645844737096307, "grad_norm": 0.16746684595194214, "learning_rate": 3.053913071099947e-05, "loss": 0.3487, "step": 2580 }, { "epoch": 0.6645844737096307, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.851754845468832, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3593306243419647, "eval_runtime": 17.14, "eval_samples_per_second": 2.567, "eval_steps_per_second": 0.175, "step": 2580 }, { "epoch": 0.6648420645909134, "grad_norm": 0.14915604575310126, "learning_rate": 3.0497714807391774e-05, "loss": 0.4035, "step": 2581 }, { "epoch": 0.6650996554721963, "grad_norm": 0.2030432434088284, "learning_rate": 3.0456314679462627e-05, "loss": 0.4354, "step": 2582 }, { "epoch": 0.665357246353479, "grad_norm": 0.16173799671708103, "learning_rate": 3.041493036070115e-05, "loss": 0.4492, "step": 2583 }, { "epoch": 0.6656148372347619, "grad_norm": 0.13206398818964307, "learning_rate": 3.0373561884583744e-05, "loss": 0.3664, "step": 2584 }, { "epoch": 0.6658724281160447, "grad_norm": 0.15272377410733054, "learning_rate": 3.0332209284573958e-05, "loss": 0.3629, "step": 2585 }, { "epoch": 0.6658724281160447, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8473022524882138, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36257103085517883, "eval_runtime": 16.9612, "eval_samples_per_second": 2.594, "eval_steps_per_second": 0.177, "step": 2585 }, { "epoch": 0.6661300189973275, "grad_norm": 0.13067819540064435, "learning_rate": 3.0290872594122487e-05, "loss": 0.3481, "step": 2586 }, { "epoch": 0.6663876098786103, "grad_norm": 0.1511483043515646, "learning_rate": 3.0249551846667207e-05, "loss": 0.3417, "step": 2587 }, { "epoch": 0.6666452007598931, "grad_norm": 0.15426699334791533, "learning_rate": 3.020824707563301e-05, "loss": 0.3745, "step": 2588 }, { "epoch": 0.6669027916411759, "grad_norm": 0.13848777860046718, "learning_rate": 3.0166958314431985e-05, "loss": 0.3631, "step": 2589 }, { "epoch": 0.6671603825224587, "grad_norm": 0.19336063860804856, "learning_rate": 3.0125685596463137e-05, "loss": 0.3885, "step": 2590 }, { "epoch": 0.6671603825224587, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8488737558931377, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3624378442764282, "eval_runtime": 17.2346, "eval_samples_per_second": 2.553, "eval_steps_per_second": 0.174, "step": 2590 }, { "epoch": 0.6674179734037415, "grad_norm": 0.14882306434604864, "learning_rate": 3.0084428955112626e-05, "loss": 0.4, "step": 2591 }, { "epoch": 0.6676755642850243, "grad_norm": 0.15076421723970607, "learning_rate": 3.0043188423753498e-05, "loss": 0.3672, "step": 2592 }, { "epoch": 0.6679331551663071, "grad_norm": 0.15032960970703027, "learning_rate": 3.000196403574581e-05, "loss": 0.4062, "step": 2593 }, { "epoch": 0.6681907460475899, "grad_norm": 0.13129512333552704, "learning_rate": 2.996075582443658e-05, "loss": 0.345, "step": 2594 }, { "epoch": 0.6684483369288727, "grad_norm": 0.2087041615741322, "learning_rate": 2.9919563823159713e-05, "loss": 0.3311, "step": 2595 }, { "epoch": 0.6684483369288727, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.854374017810372, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3663884997367859, "eval_runtime": 16.993, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 2595 }, { "epoch": 0.6687059278101555, "grad_norm": 0.1439844716504298, "learning_rate": 2.9878388065236017e-05, "loss": 0.3744, "step": 2596 }, { "epoch": 0.6689635186914383, "grad_norm": 0.12077440029401869, "learning_rate": 2.9837228583973143e-05, "loss": 0.3422, "step": 2597 }, { "epoch": 0.6692211095727211, "grad_norm": 0.13144361481789127, "learning_rate": 2.97960854126656e-05, "loss": 0.2947, "step": 2598 }, { "epoch": 0.6694787004540039, "grad_norm": 0.15236813351012043, "learning_rate": 2.9754958584594694e-05, "loss": 0.3451, "step": 2599 }, { "epoch": 0.6697362913352868, "grad_norm": 0.13679736408617219, "learning_rate": 2.971384813302847e-05, "loss": 0.2935, "step": 2600 }, { "epoch": 0.6697362913352868, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.8624934520691461, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3698064684867859, "eval_runtime": 17.0757, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 2600 }, { "epoch": 0.6699938822165695, "grad_norm": 0.14424842156304019, "learning_rate": 2.9672754091221805e-05, "loss": 0.3358, "step": 2601 }, { "epoch": 0.6702514730978524, "grad_norm": 0.271654280797804, "learning_rate": 2.9631676492416228e-05, "loss": 0.3578, "step": 2602 }, { "epoch": 0.6705090639791351, "grad_norm": 0.16214664750967217, "learning_rate": 2.9590615369840025e-05, "loss": 0.3556, "step": 2603 }, { "epoch": 0.670766654860418, "grad_norm": 0.1341168484593591, "learning_rate": 2.9549570756708105e-05, "loss": 0.3674, "step": 2604 }, { "epoch": 0.6710242457417007, "grad_norm": 0.14645915108003033, "learning_rate": 2.9508542686222067e-05, "loss": 0.3712, "step": 2605 }, { "epoch": 0.6710242457417007, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8664222105814563, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3648792505264282, "eval_runtime": 17.011, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 2605 }, { "epoch": 0.6712818366229836, "grad_norm": 0.18243098306205288, "learning_rate": 2.9467531191570098e-05, "loss": 0.4229, "step": 2606 }, { "epoch": 0.6715394275042663, "grad_norm": 0.16135374167770358, "learning_rate": 2.9426536305926968e-05, "loss": 0.4295, "step": 2607 }, { "epoch": 0.6717970183855492, "grad_norm": 0.15824305201161903, "learning_rate": 2.938555806245406e-05, "loss": 0.3339, "step": 2608 }, { "epoch": 0.6720546092668319, "grad_norm": 0.1285985863255223, "learning_rate": 2.934459649429922e-05, "loss": 0.3539, "step": 2609 }, { "epoch": 0.6723122001481148, "grad_norm": 0.14343018905641086, "learning_rate": 2.9303651634596906e-05, "loss": 0.3753, "step": 2610 }, { "epoch": 0.6723122001481148, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8528025144054479, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3631036877632141, "eval_runtime": 17.0075, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 2610 }, { "epoch": 0.6725697910293975, "grad_norm": 0.1289836886527462, "learning_rate": 2.9262723516467938e-05, "loss": 0.3051, "step": 2611 }, { "epoch": 0.6728273819106804, "grad_norm": 0.17466695118132106, "learning_rate": 2.9221812173019725e-05, "loss": 0.435, "step": 2612 }, { "epoch": 0.6730849727919631, "grad_norm": 0.16372684068951407, "learning_rate": 2.9180917637345994e-05, "loss": 0.3557, "step": 2613 }, { "epoch": 0.673342563673246, "grad_norm": 0.18436446474435458, "learning_rate": 2.9140039942526932e-05, "loss": 0.4669, "step": 2614 }, { "epoch": 0.6736001545545288, "grad_norm": 0.18459854773941667, "learning_rate": 2.9099179121629117e-05, "loss": 0.3882, "step": 2615 }, { "epoch": 0.6736001545545288, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8436354112100576, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3697620630264282, "eval_runtime": 17.1329, "eval_samples_per_second": 2.568, "eval_steps_per_second": 0.175, "step": 2615 }, { "epoch": 0.6738577454358116, "grad_norm": 0.17466422864277772, "learning_rate": 2.9058335207705406e-05, "loss": 0.3659, "step": 2616 }, { "epoch": 0.6741153363170944, "grad_norm": 0.235969171921171, "learning_rate": 2.901750823379506e-05, "loss": 0.3938, "step": 2617 }, { "epoch": 0.6743729271983772, "grad_norm": 0.1705277553156338, "learning_rate": 2.8976698232923592e-05, "loss": 0.3951, "step": 2618 }, { "epoch": 0.67463051807966, "grad_norm": 0.15408788625297992, "learning_rate": 2.8935905238102834e-05, "loss": 0.3954, "step": 2619 }, { "epoch": 0.6748881089609428, "grad_norm": 0.13469875580433766, "learning_rate": 2.889512928233078e-05, "loss": 0.3426, "step": 2620 }, { "epoch": 0.6748881089609428, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8336825563122053, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3745560944080353, "eval_runtime": 17.4474, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 2620 }, { "epoch": 0.6751456998422256, "grad_norm": 0.11833188829156593, "learning_rate": 2.8854370398591696e-05, "loss": 0.3412, "step": 2621 }, { "epoch": 0.6754032907235084, "grad_norm": 0.139442085857202, "learning_rate": 2.881362861985606e-05, "loss": 0.3481, "step": 2622 }, { "epoch": 0.6756608816047912, "grad_norm": 0.14973091363678256, "learning_rate": 2.877290397908043e-05, "loss": 0.4451, "step": 2623 }, { "epoch": 0.675918472486074, "grad_norm": 0.13551257135595993, "learning_rate": 2.87321965092076e-05, "loss": 0.37, "step": 2624 }, { "epoch": 0.6761760633673568, "grad_norm": 0.1608691455557866, "learning_rate": 2.8691506243166365e-05, "loss": 0.3478, "step": 2625 }, { "epoch": 0.6761760633673568, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8336825563122053, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.37930575013160706, "eval_runtime": 17.7761, "eval_samples_per_second": 2.475, "eval_steps_per_second": 0.169, "step": 2625 }, { "epoch": 0.6764336542486395, "grad_norm": 0.25653898986144474, "learning_rate": 2.8650833213871754e-05, "loss": 0.4363, "step": 2626 }, { "epoch": 0.6766912451299224, "grad_norm": 0.14824584340574268, "learning_rate": 2.8610177454224718e-05, "loss": 0.3604, "step": 2627 }, { "epoch": 0.6769488360112053, "grad_norm": 0.13973305765078076, "learning_rate": 2.856953899711226e-05, "loss": 0.3751, "step": 2628 }, { "epoch": 0.677206426892488, "grad_norm": 0.13738295217547944, "learning_rate": 2.8528917875407433e-05, "loss": 0.2925, "step": 2629 }, { "epoch": 0.6774640177737709, "grad_norm": 0.18460469582575612, "learning_rate": 2.848831412196925e-05, "loss": 0.2771, "step": 2630 }, { "epoch": 0.6774640177737709, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8315872184389732, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3798828125, "eval_runtime": 16.881, "eval_samples_per_second": 2.606, "eval_steps_per_second": 0.178, "step": 2630 }, { "epoch": 0.6777216086550536, "grad_norm": 0.14662183229158146, "learning_rate": 2.8447727769642697e-05, "loss": 0.2824, "step": 2631 }, { "epoch": 0.6779791995363365, "grad_norm": 0.1560827145014329, "learning_rate": 2.8407158851258598e-05, "loss": 0.3876, "step": 2632 }, { "epoch": 0.6782367904176192, "grad_norm": 0.1566681964080817, "learning_rate": 2.8366607399633773e-05, "loss": 0.3411, "step": 2633 }, { "epoch": 0.678494381298902, "grad_norm": 0.14392669910857436, "learning_rate": 2.8326073447570877e-05, "loss": 0.3229, "step": 2634 }, { "epoch": 0.6787519721801848, "grad_norm": 0.15826679514916564, "learning_rate": 2.828555702785838e-05, "loss": 0.3544, "step": 2635 }, { "epoch": 0.6787519721801848, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8368255631220535, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.37668678164482117, "eval_runtime": 17.1599, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 2635 }, { "epoch": 0.6790095630614676, "grad_norm": 0.1599950181363227, "learning_rate": 2.8245058173270622e-05, "loss": 0.3794, "step": 2636 }, { "epoch": 0.6792671539427504, "grad_norm": 0.12302097922258666, "learning_rate": 2.8204576916567683e-05, "loss": 0.3474, "step": 2637 }, { "epoch": 0.6795247448240332, "grad_norm": 0.14502002261600558, "learning_rate": 2.816411329049544e-05, "loss": 0.3901, "step": 2638 }, { "epoch": 0.679782335705316, "grad_norm": 0.17181379234799013, "learning_rate": 2.812366732778553e-05, "loss": 0.446, "step": 2639 }, { "epoch": 0.6800399265865988, "grad_norm": 0.10429743608354924, "learning_rate": 2.8083239061155232e-05, "loss": 0.2877, "step": 2640 }, { "epoch": 0.6800399265865988, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8376113148245155, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3638139069080353, "eval_runtime": 16.8599, "eval_samples_per_second": 2.61, "eval_steps_per_second": 0.178, "step": 2640 }, { "epoch": 0.6802975174678816, "grad_norm": 0.18565690935970933, "learning_rate": 2.804282852330756e-05, "loss": 0.3837, "step": 2641 }, { "epoch": 0.6805551083491644, "grad_norm": 0.1518437366251305, "learning_rate": 2.8002435746931194e-05, "loss": 0.3514, "step": 2642 }, { "epoch": 0.6808126992304473, "grad_norm": 0.18587792426939584, "learning_rate": 2.796206076470044e-05, "loss": 0.4258, "step": 2643 }, { "epoch": 0.68107029011173, "grad_norm": 0.13405425666410486, "learning_rate": 2.792170360927517e-05, "loss": 0.2691, "step": 2644 }, { "epoch": 0.6813278809930129, "grad_norm": 0.10515530517518289, "learning_rate": 2.7881364313300894e-05, "loss": 0.3167, "step": 2645 }, { "epoch": 0.6813278809930129, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8486118386589837, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35830965638160706, "eval_runtime": 17.227, "eval_samples_per_second": 2.554, "eval_steps_per_second": 0.174, "step": 2645 }, { "epoch": 0.6815854718742956, "grad_norm": 0.11524372373749776, "learning_rate": 2.784104290940862e-05, "loss": 0.3228, "step": 2646 }, { "epoch": 0.6818430627555785, "grad_norm": 0.15840319147870083, "learning_rate": 2.780073943021493e-05, "loss": 0.3861, "step": 2647 }, { "epoch": 0.6821006536368612, "grad_norm": 0.14653782775636837, "learning_rate": 2.7760453908321894e-05, "loss": 0.3372, "step": 2648 }, { "epoch": 0.6823582445181441, "grad_norm": 0.2162995700522589, "learning_rate": 2.7720186376317024e-05, "loss": 0.4424, "step": 2649 }, { "epoch": 0.6826158353994268, "grad_norm": 0.1404277759035153, "learning_rate": 2.7679936866773315e-05, "loss": 0.3406, "step": 2650 }, { "epoch": 0.6826158353994268, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8528025144054479, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35067471861839294, "eval_runtime": 17.4879, "eval_samples_per_second": 2.516, "eval_steps_per_second": 0.172, "step": 2650 }, { "epoch": 0.6828734262807097, "grad_norm": 0.14616004490769807, "learning_rate": 2.7639705412249183e-05, "loss": 0.3348, "step": 2651 }, { "epoch": 0.6831310171619924, "grad_norm": 0.20226492109006747, "learning_rate": 2.759949204528844e-05, "loss": 0.4407, "step": 2652 }, { "epoch": 0.6833886080432753, "grad_norm": 0.19134254631359318, "learning_rate": 2.7559296798420237e-05, "loss": 0.4001, "step": 2653 }, { "epoch": 0.683646198924558, "grad_norm": 0.152317104100875, "learning_rate": 2.7519119704159052e-05, "loss": 0.403, "step": 2654 }, { "epoch": 0.6839037898058409, "grad_norm": 0.15170475473427295, "learning_rate": 2.7478960795004788e-05, "loss": 0.3308, "step": 2655 }, { "epoch": 0.6839037898058409, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.855159769512834, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34659090638160706, "eval_runtime": 17.5469, "eval_samples_per_second": 2.508, "eval_steps_per_second": 0.171, "step": 2655 }, { "epoch": 0.6841613806871236, "grad_norm": 0.17995207857884746, "learning_rate": 2.743882010344251e-05, "loss": 0.3558, "step": 2656 }, { "epoch": 0.6844189715684065, "grad_norm": 0.12577112267556753, "learning_rate": 2.739869766194263e-05, "loss": 0.3235, "step": 2657 }, { "epoch": 0.6846765624496893, "grad_norm": 0.13602194909859155, "learning_rate": 2.7358593502960727e-05, "loss": 0.3663, "step": 2658 }, { "epoch": 0.6849341533309721, "grad_norm": 0.14515515627148598, "learning_rate": 2.7318507658937665e-05, "loss": 0.2859, "step": 2659 }, { "epoch": 0.6851917442122549, "grad_norm": 0.13895407389483255, "learning_rate": 2.7278440162299467e-05, "loss": 0.3585, "step": 2660 }, { "epoch": 0.6851917442122549, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.854635935044526, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3507190942764282, "eval_runtime": 16.9443, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 2660 }, { "epoch": 0.6854493350935377, "grad_norm": 0.17412406091282298, "learning_rate": 2.7238391045457272e-05, "loss": 0.3436, "step": 2661 }, { "epoch": 0.6857069259748205, "grad_norm": 0.1607797193978022, "learning_rate": 2.7198360340807404e-05, "loss": 0.3526, "step": 2662 }, { "epoch": 0.6859645168561033, "grad_norm": 0.22489188732297646, "learning_rate": 2.715834808073127e-05, "loss": 0.377, "step": 2663 }, { "epoch": 0.6862221077373861, "grad_norm": 0.142881788056936, "learning_rate": 2.7118354297595396e-05, "loss": 0.3452, "step": 2664 }, { "epoch": 0.6864796986186689, "grad_norm": 0.1412582378828825, "learning_rate": 2.7078379023751265e-05, "loss": 0.3499, "step": 2665 }, { "epoch": 0.6864796986186689, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8514929282346779, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35205078125, "eval_runtime": 17.1288, "eval_samples_per_second": 2.569, "eval_steps_per_second": 0.175, "step": 2665 }, { "epoch": 0.6867372894999517, "grad_norm": 0.13549520792037545, "learning_rate": 2.7038422291535505e-05, "loss": 0.3031, "step": 2666 }, { "epoch": 0.6869948803812345, "grad_norm": 0.12068220882639444, "learning_rate": 2.6998484133269652e-05, "loss": 0.3199, "step": 2667 }, { "epoch": 0.6872524712625173, "grad_norm": 0.17229188940030932, "learning_rate": 2.6958564581260264e-05, "loss": 0.3949, "step": 2668 }, { "epoch": 0.6875100621438001, "grad_norm": 0.16154767035065437, "learning_rate": 2.691866366779887e-05, "loss": 0.3745, "step": 2669 }, { "epoch": 0.6877676530250829, "grad_norm": 0.12551094272328808, "learning_rate": 2.6878781425161858e-05, "loss": 0.29, "step": 2670 }, { "epoch": 0.6877676530250829, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.853850183342064, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35524681210517883, "eval_runtime": 17.4355, "eval_samples_per_second": 2.524, "eval_steps_per_second": 0.172, "step": 2670 }, { "epoch": 0.6880252439063658, "grad_norm": 0.19720322634325504, "learning_rate": 2.683891788561055e-05, "loss": 0.4223, "step": 2671 }, { "epoch": 0.6882828347876485, "grad_norm": 0.15366709765352818, "learning_rate": 2.6799073081391147e-05, "loss": 0.3688, "step": 2672 }, { "epoch": 0.6885404256689314, "grad_norm": 0.1882979421870251, "learning_rate": 2.675924704473469e-05, "loss": 0.3844, "step": 2673 }, { "epoch": 0.6887980165502141, "grad_norm": 0.16691711318261465, "learning_rate": 2.6719439807857033e-05, "loss": 0.3684, "step": 2674 }, { "epoch": 0.689055607431497, "grad_norm": 0.15179654874853052, "learning_rate": 2.6679651402958768e-05, "loss": 0.3344, "step": 2675 }, { "epoch": 0.689055607431497, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8522786799371399, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3511185944080353, "eval_runtime": 17.0406, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 2675 }, { "epoch": 0.6893131983127797, "grad_norm": 0.1382970160096718, "learning_rate": 2.6639881862225385e-05, "loss": 0.3712, "step": 2676 }, { "epoch": 0.6895707891940626, "grad_norm": 0.1568546250266237, "learning_rate": 2.6600131217826985e-05, "loss": 0.418, "step": 2677 }, { "epoch": 0.6898283800753453, "grad_norm": 0.1286400446233427, "learning_rate": 2.6560399501918465e-05, "loss": 0.3097, "step": 2678 }, { "epoch": 0.6900859709566282, "grad_norm": 0.1658972291537468, "learning_rate": 2.6520686746639357e-05, "loss": 0.337, "step": 2679 }, { "epoch": 0.6903435618379109, "grad_norm": 0.1245252072082894, "learning_rate": 2.6480992984113877e-05, "loss": 0.3095, "step": 2680 }, { "epoch": 0.6903435618379109, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3512073755264282, "eval_runtime": 17.3116, "eval_samples_per_second": 2.542, "eval_steps_per_second": 0.173, "step": 2680 }, { "epoch": 0.6906011527191938, "grad_norm": 0.1515250169641165, "learning_rate": 2.644131824645092e-05, "loss": 0.3129, "step": 2681 }, { "epoch": 0.6908587436004765, "grad_norm": 0.16763732918130125, "learning_rate": 2.640166256574389e-05, "loss": 0.3398, "step": 2682 }, { "epoch": 0.6911163344817594, "grad_norm": 0.1382463052875121, "learning_rate": 2.6362025974070902e-05, "loss": 0.3468, "step": 2683 }, { "epoch": 0.6913739253630421, "grad_norm": 0.1953974501965342, "learning_rate": 2.6322408503494482e-05, "loss": 0.3896, "step": 2684 }, { "epoch": 0.691631516244325, "grad_norm": 0.1260736126806096, "learning_rate": 2.6282810186061862e-05, "loss": 0.2979, "step": 2685 }, { "epoch": 0.691631516244325, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8541121005762178, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34854403138160706, "eval_runtime": 17.6506, "eval_samples_per_second": 2.493, "eval_steps_per_second": 0.17, "step": 2685 }, { "epoch": 0.6918891071256078, "grad_norm": 0.2205195541459199, "learning_rate": 2.624323105380463e-05, "loss": 0.4454, "step": 2686 }, { "epoch": 0.6921466980068905, "grad_norm": 0.1661657499937164, "learning_rate": 2.6203671138738944e-05, "loss": 0.4094, "step": 2687 }, { "epoch": 0.6924042888881734, "grad_norm": 0.1811939366544613, "learning_rate": 2.616413047286536e-05, "loss": 0.3772, "step": 2688 }, { "epoch": 0.6926618797694561, "grad_norm": 0.18520135079202824, "learning_rate": 2.6124609088168905e-05, "loss": 0.3781, "step": 2689 }, { "epoch": 0.692919470650739, "grad_norm": 0.15492756717661885, "learning_rate": 2.6085107016619015e-05, "loss": 0.3544, "step": 2690 }, { "epoch": 0.692919470650739, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8522786799371399, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34854403138160706, "eval_runtime": 17.0113, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 2690 }, { "epoch": 0.6931770615320217, "grad_norm": 0.22411801493006525, "learning_rate": 2.604562429016944e-05, "loss": 0.4038, "step": 2691 }, { "epoch": 0.6934346524133046, "grad_norm": 0.1420288648821109, "learning_rate": 2.600616094075835e-05, "loss": 0.3692, "step": 2692 }, { "epoch": 0.6936922432945873, "grad_norm": 0.1423341400071091, "learning_rate": 2.5966717000308228e-05, "loss": 0.3552, "step": 2693 }, { "epoch": 0.6939498341758702, "grad_norm": 0.14850724416073355, "learning_rate": 2.5927292500725807e-05, "loss": 0.389, "step": 2694 }, { "epoch": 0.6942074250571529, "grad_norm": 0.13737435005751336, "learning_rate": 2.5887887473902182e-05, "loss": 0.3552, "step": 2695 }, { "epoch": 0.6942074250571529, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8551597695128339, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35329368710517883, "eval_runtime": 17.2152, "eval_samples_per_second": 2.556, "eval_steps_per_second": 0.174, "step": 2695 }, { "epoch": 0.6944650159384358, "grad_norm": 0.15195358397270992, "learning_rate": 2.584850195171259e-05, "loss": 0.4059, "step": 2696 }, { "epoch": 0.6947226068197185, "grad_norm": 0.13920732343492914, "learning_rate": 2.5809135966016562e-05, "loss": 0.3382, "step": 2697 }, { "epoch": 0.6949801977010014, "grad_norm": 0.1516401245351728, "learning_rate": 2.576978954865783e-05, "loss": 0.3832, "step": 2698 }, { "epoch": 0.6952377885822841, "grad_norm": 0.16267808720085594, "learning_rate": 2.5730462731464273e-05, "loss": 0.3678, "step": 2699 }, { "epoch": 0.695495379463567, "grad_norm": 0.1539062210313814, "learning_rate": 2.569115554624789e-05, "loss": 0.3503, "step": 2700 }, { "epoch": 0.695495379463567, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.854112100576218, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3552911877632141, "eval_runtime": 17.454, "eval_samples_per_second": 2.521, "eval_steps_per_second": 0.172, "step": 2700 }, { "epoch": 0.6957529703448498, "grad_norm": 0.13893228245162673, "learning_rate": 2.5651868024804848e-05, "loss": 0.3741, "step": 2701 }, { "epoch": 0.6960105612261326, "grad_norm": 0.13438617071079145, "learning_rate": 2.5612600198915404e-05, "loss": 0.3658, "step": 2702 }, { "epoch": 0.6962681521074154, "grad_norm": 0.15143362391177137, "learning_rate": 2.557335210034383e-05, "loss": 0.3986, "step": 2703 }, { "epoch": 0.6965257429886982, "grad_norm": 0.135959890874589, "learning_rate": 2.553412376083851e-05, "loss": 0.3645, "step": 2704 }, { "epoch": 0.696783333869981, "grad_norm": 0.2628741371875413, "learning_rate": 2.5494915212131765e-05, "loss": 0.4327, "step": 2705 }, { "epoch": 0.696783333869981, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8446830801466737, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35684481263160706, "eval_runtime": 17.2321, "eval_samples_per_second": 2.553, "eval_steps_per_second": 0.174, "step": 2705 }, { "epoch": 0.6970409247512638, "grad_norm": 0.17023455064399243, "learning_rate": 2.5455726485940012e-05, "loss": 0.3763, "step": 2706 }, { "epoch": 0.6972985156325466, "grad_norm": 0.1696502975632842, "learning_rate": 2.541655761396355e-05, "loss": 0.4026, "step": 2707 }, { "epoch": 0.6975561065138294, "grad_norm": 0.19135637232683286, "learning_rate": 2.537740862788662e-05, "loss": 0.36, "step": 2708 }, { "epoch": 0.6978136973951122, "grad_norm": 0.1941420190978459, "learning_rate": 2.5338279559377408e-05, "loss": 0.4501, "step": 2709 }, { "epoch": 0.698071288276395, "grad_norm": 0.18007504455414605, "learning_rate": 2.5299170440087993e-05, "loss": 0.3291, "step": 2710 }, { "epoch": 0.698071288276395, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8459926663174437, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35666725039482117, "eval_runtime": 17.4532, "eval_samples_per_second": 2.521, "eval_steps_per_second": 0.172, "step": 2710 }, { "epoch": 0.6983288791576778, "grad_norm": 0.14401464521530855, "learning_rate": 2.526008130165432e-05, "loss": 0.4013, "step": 2711 }, { "epoch": 0.6985864700389606, "grad_norm": 0.13094302556714996, "learning_rate": 2.522101217569611e-05, "loss": 0.3185, "step": 2712 }, { "epoch": 0.6988440609202434, "grad_norm": 0.17431301504577795, "learning_rate": 2.5181963093816962e-05, "loss": 0.4072, "step": 2713 }, { "epoch": 0.6991016518015263, "grad_norm": 0.1319443611792694, "learning_rate": 2.514293408760426e-05, "loss": 0.3078, "step": 2714 }, { "epoch": 0.699359242682809, "grad_norm": 0.16947826226563384, "learning_rate": 2.5103925188629084e-05, "loss": 0.4262, "step": 2715 }, { "epoch": 0.699359242682809, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8438973284442116, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3564896881580353, "eval_runtime": 17.5267, "eval_samples_per_second": 2.51, "eval_steps_per_second": 0.171, "step": 2715 }, { "epoch": 0.6996168335640919, "grad_norm": 0.16059942318850942, "learning_rate": 2.506493642844634e-05, "loss": 0.3947, "step": 2716 }, { "epoch": 0.6998744244453746, "grad_norm": 0.1413370424804344, "learning_rate": 2.5025967838594548e-05, "loss": 0.309, "step": 2717 }, { "epoch": 0.7001320153266575, "grad_norm": 0.1575776946224474, "learning_rate": 2.498701945059599e-05, "loss": 0.3426, "step": 2718 }, { "epoch": 0.7003896062079402, "grad_norm": 0.12915501393757087, "learning_rate": 2.4948091295956566e-05, "loss": 0.3574, "step": 2719 }, { "epoch": 0.7006471970892231, "grad_norm": 0.11879255785567668, "learning_rate": 2.4909183406165836e-05, "loss": 0.3417, "step": 2720 }, { "epoch": 0.7006471970892231, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8410162388685175, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3572443127632141, "eval_runtime": 17.4714, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 2720 }, { "epoch": 0.7009047879705058, "grad_norm": 0.14641264953618238, "learning_rate": 2.4870295812696926e-05, "loss": 0.3337, "step": 2721 }, { "epoch": 0.7011623788517887, "grad_norm": 0.2179540498024203, "learning_rate": 2.483142854700658e-05, "loss": 0.3628, "step": 2722 }, { "epoch": 0.7014199697330714, "grad_norm": 0.14540266069521307, "learning_rate": 2.4792581640535105e-05, "loss": 0.3378, "step": 2723 }, { "epoch": 0.7016775606143543, "grad_norm": 0.16549416288759555, "learning_rate": 2.4753755124706286e-05, "loss": 0.3234, "step": 2724 }, { "epoch": 0.701935151495637, "grad_norm": 0.16311065413664966, "learning_rate": 2.4714949030927487e-05, "loss": 0.3901, "step": 2725 }, { "epoch": 0.701935151495637, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8454688318491357, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.35768821835517883, "eval_runtime": 17.0492, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 2725 }, { "epoch": 0.7021927423769199, "grad_norm": 0.14000386797128103, "learning_rate": 2.467616339058945e-05, "loss": 0.329, "step": 2726 }, { "epoch": 0.7024503332582026, "grad_norm": 0.16026256337928413, "learning_rate": 2.4637398235066527e-05, "loss": 0.3949, "step": 2727 }, { "epoch": 0.7027079241394855, "grad_norm": 0.15627168101176667, "learning_rate": 2.4598653595716365e-05, "loss": 0.3861, "step": 2728 }, { "epoch": 0.7029655150207683, "grad_norm": 0.13178721726537074, "learning_rate": 2.455992950388003e-05, "loss": 0.3664, "step": 2729 }, { "epoch": 0.7032231059020511, "grad_norm": 0.14552517768960338, "learning_rate": 2.452122599088203e-05, "loss": 0.2891, "step": 2730 }, { "epoch": 0.7032231059020511, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8438973284442117, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3614612817764282, "eval_runtime": 16.9344, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 2730 }, { "epoch": 0.7034806967833339, "grad_norm": 0.14414489002933717, "learning_rate": 2.4482543088030185e-05, "loss": 0.4093, "step": 2731 }, { "epoch": 0.7037382876646167, "grad_norm": 0.17593344705568692, "learning_rate": 2.4443880826615665e-05, "loss": 0.4037, "step": 2732 }, { "epoch": 0.7039958785458995, "grad_norm": 0.1223001057903308, "learning_rate": 2.44052392379129e-05, "loss": 0.3561, "step": 2733 }, { "epoch": 0.7042534694271823, "grad_norm": 0.17008409291662235, "learning_rate": 2.4366618353179644e-05, "loss": 0.3795, "step": 2734 }, { "epoch": 0.7045110603084651, "grad_norm": 0.16434909190618796, "learning_rate": 2.43280182036569e-05, "loss": 0.3797, "step": 2735 }, { "epoch": 0.7045110603084651, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8415400733368257, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3566228747367859, "eval_runtime": 17.0532, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 2735 }, { "epoch": 0.7047686511897479, "grad_norm": 0.13000640637875388, "learning_rate": 2.4289438820568845e-05, "loss": 0.3139, "step": 2736 }, { "epoch": 0.7050262420710307, "grad_norm": 0.15029391695982908, "learning_rate": 2.425088023512293e-05, "loss": 0.2792, "step": 2737 }, { "epoch": 0.7052838329523134, "grad_norm": 0.22057161618053767, "learning_rate": 2.421234247850972e-05, "loss": 0.3896, "step": 2738 }, { "epoch": 0.7055414238335963, "grad_norm": 0.18522255265204693, "learning_rate": 2.4173825581902975e-05, "loss": 0.3746, "step": 2739 }, { "epoch": 0.705799014714879, "grad_norm": 0.1937399712988186, "learning_rate": 2.4135329576459563e-05, "loss": 0.3207, "step": 2740 }, { "epoch": 0.705799014714879, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8407543216343635, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35768821835517883, "eval_runtime": 17.2614, "eval_samples_per_second": 2.549, "eval_steps_per_second": 0.174, "step": 2740 }, { "epoch": 0.7060566055961619, "grad_norm": 0.15836049317458623, "learning_rate": 2.4096854493319477e-05, "loss": 0.379, "step": 2741 }, { "epoch": 0.7063141964774446, "grad_norm": 0.2390188072952708, "learning_rate": 2.4058400363605728e-05, "loss": 0.453, "step": 2742 }, { "epoch": 0.7065717873587275, "grad_norm": 0.17286721909595393, "learning_rate": 2.4019967218424427e-05, "loss": 0.3891, "step": 2743 }, { "epoch": 0.7068293782400104, "grad_norm": 0.15192179987331367, "learning_rate": 2.398155508886472e-05, "loss": 0.3095, "step": 2744 }, { "epoch": 0.7070869691212931, "grad_norm": 0.16477307850149672, "learning_rate": 2.3943164005998697e-05, "loss": 0.384, "step": 2745 }, { "epoch": 0.7070869691212931, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8394447354635935, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36208274960517883, "eval_runtime": 17.5058, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 2745 }, { "epoch": 0.707344560002576, "grad_norm": 0.16623502164431952, "learning_rate": 2.3904794000881486e-05, "loss": 0.4262, "step": 2746 }, { "epoch": 0.7076021508838587, "grad_norm": 0.17309520719170254, "learning_rate": 2.3866445104551098e-05, "loss": 0.3891, "step": 2747 }, { "epoch": 0.7078597417651415, "grad_norm": 0.14559163997947372, "learning_rate": 2.3828117348028528e-05, "loss": 0.3471, "step": 2748 }, { "epoch": 0.7081173326464243, "grad_norm": 0.11142923579850252, "learning_rate": 2.3789810762317667e-05, "loss": 0.2911, "step": 2749 }, { "epoch": 0.7083749235277071, "grad_norm": 0.13960134559798204, "learning_rate": 2.375152537840522e-05, "loss": 0.3982, "step": 2750 }, { "epoch": 0.7083749235277071, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8446830801466737, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35799893736839294, "eval_runtime": 17.8042, "eval_samples_per_second": 2.471, "eval_steps_per_second": 0.168, "step": 2750 }, { "epoch": 0.7086325144089899, "grad_norm": 0.1454365178210285, "learning_rate": 2.3713261227260812e-05, "loss": 0.3578, "step": 2751 }, { "epoch": 0.7088901052902727, "grad_norm": 0.13251829233355425, "learning_rate": 2.3675018339836858e-05, "loss": 0.3375, "step": 2752 }, { "epoch": 0.7091476961715555, "grad_norm": 0.2148654472903786, "learning_rate": 2.3636796747068595e-05, "loss": 0.4192, "step": 2753 }, { "epoch": 0.7094052870528383, "grad_norm": 0.14156333761022905, "learning_rate": 2.3598596479874008e-05, "loss": 0.3641, "step": 2754 }, { "epoch": 0.7096628779341211, "grad_norm": 0.14510469467718043, "learning_rate": 2.3560417569153796e-05, "loss": 0.3197, "step": 2755 }, { "epoch": 0.7096628779341211, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8493975903614458, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34792259335517883, "eval_runtime": 17.5069, "eval_samples_per_second": 2.513, "eval_steps_per_second": 0.171, "step": 2755 }, { "epoch": 0.7099204688154039, "grad_norm": 0.14240734386176662, "learning_rate": 2.352226004579151e-05, "loss": 0.4157, "step": 2756 }, { "epoch": 0.7101780596966868, "grad_norm": 0.1502415215795503, "learning_rate": 2.3484123940653253e-05, "loss": 0.361, "step": 2757 }, { "epoch": 0.7104356505779695, "grad_norm": 0.14913094528465853, "learning_rate": 2.3446009284587915e-05, "loss": 0.3628, "step": 2758 }, { "epoch": 0.7106932414592524, "grad_norm": 0.1393740635701928, "learning_rate": 2.3407916108426946e-05, "loss": 0.3102, "step": 2759 }, { "epoch": 0.7109508323405351, "grad_norm": 0.15461891812931783, "learning_rate": 2.3369844442984484e-05, "loss": 0.3578, "step": 2760 }, { "epoch": 0.7109508323405351, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8473022524882137, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34561434388160706, "eval_runtime": 16.6556, "eval_samples_per_second": 2.642, "eval_steps_per_second": 0.18, "step": 2760 }, { "epoch": 0.711208423221818, "grad_norm": 0.1620128221439273, "learning_rate": 2.333179431905726e-05, "loss": 0.3858, "step": 2761 }, { "epoch": 0.7114660141031007, "grad_norm": 0.12484716096081154, "learning_rate": 2.3293765767424537e-05, "loss": 0.3949, "step": 2762 }, { "epoch": 0.7117236049843836, "grad_norm": 0.12417823636822578, "learning_rate": 2.325575881884819e-05, "loss": 0.3016, "step": 2763 }, { "epoch": 0.7119811958656663, "grad_norm": 0.1603996671736155, "learning_rate": 2.321777350407252e-05, "loss": 0.339, "step": 2764 }, { "epoch": 0.7122387867469492, "grad_norm": 0.1635755859000412, "learning_rate": 2.317980985382448e-05, "loss": 0.4179, "step": 2765 }, { "epoch": 0.7122387867469492, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.85358826610791, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3414417505264282, "eval_runtime": 17.0303, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 2765 }, { "epoch": 0.7124963776282319, "grad_norm": 0.1578545422391313, "learning_rate": 2.3141867898813358e-05, "loss": 0.34, "step": 2766 }, { "epoch": 0.7127539685095148, "grad_norm": 0.19707829642740438, "learning_rate": 2.310394766973097e-05, "loss": 0.4205, "step": 2767 }, { "epoch": 0.7130115593907975, "grad_norm": 0.16862116596731477, "learning_rate": 2.306604919725151e-05, "loss": 0.4188, "step": 2768 }, { "epoch": 0.7132691502720804, "grad_norm": 0.1173747837754076, "learning_rate": 2.3028172512031604e-05, "loss": 0.3259, "step": 2769 }, { "epoch": 0.7135267411533631, "grad_norm": 0.13781967857656147, "learning_rate": 2.2990317644710274e-05, "loss": 0.3662, "step": 2770 }, { "epoch": 0.7135267411533631, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34255149960517883, "eval_runtime": 17.0691, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 2770 }, { "epoch": 0.713784332034646, "grad_norm": 0.12840077547265583, "learning_rate": 2.2952484625908827e-05, "loss": 0.3207, "step": 2771 }, { "epoch": 0.7140419229159288, "grad_norm": 0.13723383099874353, "learning_rate": 2.2914673486230954e-05, "loss": 0.4079, "step": 2772 }, { "epoch": 0.7142995137972116, "grad_norm": 0.14335730554159018, "learning_rate": 2.287688425626262e-05, "loss": 0.3296, "step": 2773 }, { "epoch": 0.7145571046784944, "grad_norm": 0.14139486566500542, "learning_rate": 2.2839116966572105e-05, "loss": 0.2804, "step": 2774 }, { "epoch": 0.7148146955597772, "grad_norm": 0.16000352992328196, "learning_rate": 2.280137164770989e-05, "loss": 0.364, "step": 2775 }, { "epoch": 0.7148146955597772, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.85489785227868, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.34237393736839294, "eval_runtime": 16.8733, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 2775 }, { "epoch": 0.71507228644106, "grad_norm": 0.1426100036868392, "learning_rate": 2.276364833020868e-05, "loss": 0.3776, "step": 2776 }, { "epoch": 0.7153298773223428, "grad_norm": 0.15906307930400226, "learning_rate": 2.272594704458344e-05, "loss": 0.3864, "step": 2777 }, { "epoch": 0.7155874682036256, "grad_norm": 0.17996034084740364, "learning_rate": 2.2688267821331278e-05, "loss": 0.4076, "step": 2778 }, { "epoch": 0.7158450590849084, "grad_norm": 0.1897824054477158, "learning_rate": 2.2650610690931467e-05, "loss": 0.4065, "step": 2779 }, { "epoch": 0.7161026499661912, "grad_norm": 0.13218113662802577, "learning_rate": 2.2612975683845372e-05, "loss": 0.2961, "step": 2780 }, { "epoch": 0.7161026499661912, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8522786799371398, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3450372815132141, "eval_runtime": 17.694, "eval_samples_per_second": 2.487, "eval_steps_per_second": 0.17, "step": 2780 }, { "epoch": 0.716360240847474, "grad_norm": 0.1569939201335511, "learning_rate": 2.2575362830516506e-05, "loss": 0.3165, "step": 2781 }, { "epoch": 0.7166178317287568, "grad_norm": 0.18097788321208738, "learning_rate": 2.253777216137047e-05, "loss": 0.4363, "step": 2782 }, { "epoch": 0.7168754226100396, "grad_norm": 0.13620805598169097, "learning_rate": 2.2500203706814856e-05, "loss": 0.3661, "step": 2783 }, { "epoch": 0.7171330134913224, "grad_norm": 0.10753286752324899, "learning_rate": 2.246265749723936e-05, "loss": 0.2783, "step": 2784 }, { "epoch": 0.7173906043726052, "grad_norm": 0.1300316161236073, "learning_rate": 2.2425133563015594e-05, "loss": 0.2907, "step": 2785 }, { "epoch": 0.7173906043726052, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.854112100576218, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3551136255264282, "eval_runtime": 17.4436, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 2785 }, { "epoch": 0.717648195253888, "grad_norm": 0.1701872693075267, "learning_rate": 2.238763193449729e-05, "loss": 0.4144, "step": 2786 }, { "epoch": 0.7179057861351709, "grad_norm": 0.1760300746742691, "learning_rate": 2.2350152642019983e-05, "loss": 0.3941, "step": 2787 }, { "epoch": 0.7181633770164536, "grad_norm": 0.14581543549786966, "learning_rate": 2.2312695715901266e-05, "loss": 0.3625, "step": 2788 }, { "epoch": 0.7184209678977365, "grad_norm": 0.24930305966943844, "learning_rate": 2.2275261186440537e-05, "loss": 0.4298, "step": 2789 }, { "epoch": 0.7186785587790192, "grad_norm": 0.18957999994987207, "learning_rate": 2.2237849083919142e-05, "loss": 0.3462, "step": 2790 }, { "epoch": 0.7186785587790192, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.851754845468832, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3500532805919647, "eval_runtime": 17.4986, "eval_samples_per_second": 2.514, "eval_steps_per_second": 0.171, "step": 2790 }, { "epoch": 0.7189361496603021, "grad_norm": 0.15553216172084486, "learning_rate": 2.2200459438600297e-05, "loss": 0.3787, "step": 2791 }, { "epoch": 0.7191937405415848, "grad_norm": 0.1609548296303529, "learning_rate": 2.216309228072897e-05, "loss": 0.3803, "step": 2792 }, { "epoch": 0.7194513314228677, "grad_norm": 0.21372436553220225, "learning_rate": 2.2125747640532023e-05, "loss": 0.3382, "step": 2793 }, { "epoch": 0.7197089223041504, "grad_norm": 0.13384594375374534, "learning_rate": 2.2088425548218065e-05, "loss": 0.2806, "step": 2794 }, { "epoch": 0.7199665131854333, "grad_norm": 0.14277732385378297, "learning_rate": 2.2051126033977494e-05, "loss": 0.34, "step": 2795 }, { "epoch": 0.7199665131854333, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8496595075955997, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3463689684867859, "eval_runtime": 16.9121, "eval_samples_per_second": 2.602, "eval_steps_per_second": 0.177, "step": 2795 }, { "epoch": 0.720224104066716, "grad_norm": 0.1341500531756553, "learning_rate": 2.20138491279824e-05, "loss": 0.3279, "step": 2796 }, { "epoch": 0.7204816949479989, "grad_norm": 0.16899171892652634, "learning_rate": 2.1976594860386597e-05, "loss": 0.3483, "step": 2797 }, { "epoch": 0.7207392858292816, "grad_norm": 0.14477035937310337, "learning_rate": 2.1939363261325606e-05, "loss": 0.2884, "step": 2798 }, { "epoch": 0.7209968767105644, "grad_norm": 0.13349709589620268, "learning_rate": 2.190215436091661e-05, "loss": 0.3415, "step": 2799 }, { "epoch": 0.7212544675918473, "grad_norm": 0.25768602565818954, "learning_rate": 2.1864968189258434e-05, "loss": 0.4377, "step": 2800 }, { "epoch": 0.7212544675918473, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8483499214248299, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3491654694080353, "eval_runtime": 17.1243, "eval_samples_per_second": 2.569, "eval_steps_per_second": 0.175, "step": 2800 }, { "epoch": 0.72151205847313, "grad_norm": 0.18235096954259772, "learning_rate": 2.1827804776431476e-05, "loss": 0.3697, "step": 2801 }, { "epoch": 0.7217696493544129, "grad_norm": 0.22471544209079214, "learning_rate": 2.1790664152497768e-05, "loss": 0.3636, "step": 2802 }, { "epoch": 0.7220272402356956, "grad_norm": 0.17327612172954443, "learning_rate": 2.1753546347500918e-05, "loss": 0.3078, "step": 2803 }, { "epoch": 0.7222848311169785, "grad_norm": 0.24146631371380453, "learning_rate": 2.1716451391466008e-05, "loss": 0.4625, "step": 2804 }, { "epoch": 0.7225424219982612, "grad_norm": 0.13098403629381128, "learning_rate": 2.167937931439972e-05, "loss": 0.3208, "step": 2805 }, { "epoch": 0.7225424219982612, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8480880041906758, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34938743710517883, "eval_runtime": 17.1567, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 2805 }, { "epoch": 0.7228000128795441, "grad_norm": 0.1753570422091817, "learning_rate": 2.1642330146290142e-05, "loss": 0.4, "step": 2806 }, { "epoch": 0.7230576037608268, "grad_norm": 0.132697904686546, "learning_rate": 2.160530391710694e-05, "loss": 0.3107, "step": 2807 }, { "epoch": 0.7233151946421097, "grad_norm": 0.12347173853975807, "learning_rate": 2.1568300656801126e-05, "loss": 0.2349, "step": 2808 }, { "epoch": 0.7235727855233924, "grad_norm": 0.17619796384247116, "learning_rate": 2.153132039530516e-05, "loss": 0.2991, "step": 2809 }, { "epoch": 0.7238303764046753, "grad_norm": 0.19431505394055815, "learning_rate": 2.1494363162532915e-05, "loss": 0.376, "step": 2810 }, { "epoch": 0.7238303764046753, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8504452592980618, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3519176244735718, "eval_runtime": 17.0949, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 2810 }, { "epoch": 0.724087967285958, "grad_norm": 0.1456938494015266, "learning_rate": 2.1457428988379635e-05, "loss": 0.3923, "step": 2811 }, { "epoch": 0.7243455581672409, "grad_norm": 0.28893525407443255, "learning_rate": 2.1420517902721914e-05, "loss": 0.4272, "step": 2812 }, { "epoch": 0.7246031490485236, "grad_norm": 0.16875241353218418, "learning_rate": 2.1383629935417633e-05, "loss": 0.3865, "step": 2813 }, { "epoch": 0.7248607399298065, "grad_norm": 0.16407317749283473, "learning_rate": 2.1346765116306007e-05, "loss": 0.405, "step": 2814 }, { "epoch": 0.7251183308110893, "grad_norm": 0.1699188422149344, "learning_rate": 2.1309923475207537e-05, "loss": 0.3776, "step": 2815 }, { "epoch": 0.7251183308110893, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8457307490832897, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35196200013160706, "eval_runtime": 16.9334, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 2815 }, { "epoch": 0.7253759216923721, "grad_norm": 0.20051875201203073, "learning_rate": 2.127310504192393e-05, "loss": 0.3865, "step": 2816 }, { "epoch": 0.7256335125736549, "grad_norm": 0.16568167623786675, "learning_rate": 2.1236309846238166e-05, "loss": 0.3963, "step": 2817 }, { "epoch": 0.7258911034549377, "grad_norm": 0.19477369321158514, "learning_rate": 2.1199537917914386e-05, "loss": 0.4678, "step": 2818 }, { "epoch": 0.7261486943362205, "grad_norm": 0.2569997922112408, "learning_rate": 2.116278928669794e-05, "loss": 0.2914, "step": 2819 }, { "epoch": 0.7264062852175033, "grad_norm": 0.16061324251902118, "learning_rate": 2.112606398231532e-05, "loss": 0.3937, "step": 2820 }, { "epoch": 0.7264062852175033, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8486118386589837, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35342684388160706, "eval_runtime": 16.9883, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 2820 }, { "epoch": 0.7266638760987861, "grad_norm": 0.17647205144652872, "learning_rate": 2.1089362034474174e-05, "loss": 0.3539, "step": 2821 }, { "epoch": 0.7269214669800689, "grad_norm": 0.17270817125147134, "learning_rate": 2.1052683472863206e-05, "loss": 0.3466, "step": 2822 }, { "epoch": 0.7271790578613517, "grad_norm": 0.13480061391904238, "learning_rate": 2.101602832715224e-05, "loss": 0.2718, "step": 2823 }, { "epoch": 0.7274366487426345, "grad_norm": 0.20601105689222124, "learning_rate": 2.0979396626992172e-05, "loss": 0.4099, "step": 2824 }, { "epoch": 0.7276942396239173, "grad_norm": 0.13614223332667116, "learning_rate": 2.0942788402014867e-05, "loss": 0.2952, "step": 2825 }, { "epoch": 0.7276942396239173, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8412781561026716, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35378196835517883, "eval_runtime": 16.9682, "eval_samples_per_second": 2.593, "eval_steps_per_second": 0.177, "step": 2825 }, { "epoch": 0.7279518305052001, "grad_norm": 0.21917858956071629, "learning_rate": 2.090620368183329e-05, "loss": 0.4518, "step": 2826 }, { "epoch": 0.7282094213864829, "grad_norm": 0.15729039477419035, "learning_rate": 2.0869642496041287e-05, "loss": 0.3691, "step": 2827 }, { "epoch": 0.7284670122677657, "grad_norm": 0.1579740569695876, "learning_rate": 2.08331048742138e-05, "loss": 0.4156, "step": 2828 }, { "epoch": 0.7287246031490485, "grad_norm": 0.2746904571365112, "learning_rate": 2.07965908459066e-05, "loss": 0.4188, "step": 2829 }, { "epoch": 0.7289821940303314, "grad_norm": 0.1393606165959669, "learning_rate": 2.0760100440656387e-05, "loss": 0.3145, "step": 2830 }, { "epoch": 0.7289821940303314, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8491356731272917, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3520951569080353, "eval_runtime": 16.8114, "eval_samples_per_second": 2.617, "eval_steps_per_second": 0.178, "step": 2830 }, { "epoch": 0.7292397849116141, "grad_norm": 0.12932326109029305, "learning_rate": 2.0723633687980796e-05, "loss": 0.3047, "step": 2831 }, { "epoch": 0.729497375792897, "grad_norm": 0.1498285785627019, "learning_rate": 2.068719061737831e-05, "loss": 0.3614, "step": 2832 }, { "epoch": 0.7297549666741797, "grad_norm": 0.20868169377215004, "learning_rate": 2.065077125832826e-05, "loss": 0.3363, "step": 2833 }, { "epoch": 0.7300125575554626, "grad_norm": 0.14402969023476137, "learning_rate": 2.061437564029076e-05, "loss": 0.3519, "step": 2834 }, { "epoch": 0.7302701484367453, "grad_norm": 0.15265662731074459, "learning_rate": 2.0578003792706768e-05, "loss": 0.2935, "step": 2835 }, { "epoch": 0.7302701484367453, "eval_PRM Accuracy": 0.7830188679245284, "eval_PRM F1": 0.8571428571428571, "eval_PRM F1 AUC": 0.7200104766893662, "eval_PRM F1 AUC (fixed)": 0.8488737558931377, "eval_PRM F1 Neg": 0.5490196078431373, "eval_PRM NPV": 0.5, "eval_PRM Precision": 0.8846153846153846, "eval_PRM Recall": 0.8313253012048193, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3531605005264282, "eval_runtime": 17.5934, "eval_samples_per_second": 2.501, "eval_steps_per_second": 0.171, "step": 2835 }, { "epoch": 0.7305277393180282, "grad_norm": 0.24287864454517327, "learning_rate": 2.0541655744998e-05, "loss": 0.4744, "step": 2836 }, { "epoch": 0.7307853301993109, "grad_norm": 0.15874048526571136, "learning_rate": 2.0505331526566895e-05, "loss": 0.3077, "step": 2837 }, { "epoch": 0.7310429210805938, "grad_norm": 0.1463427369358526, "learning_rate": 2.0469031166796655e-05, "loss": 0.3317, "step": 2838 }, { "epoch": 0.7313005119618765, "grad_norm": 0.18444488811203785, "learning_rate": 2.0432754695051136e-05, "loss": 0.3929, "step": 2839 }, { "epoch": 0.7315581028431594, "grad_norm": 0.20367463774789532, "learning_rate": 2.0396502140674912e-05, "loss": 0.4534, "step": 2840 }, { "epoch": 0.7315581028431594, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8501833420639078, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3519176244735718, "eval_runtime": 16.8662, "eval_samples_per_second": 2.609, "eval_steps_per_second": 0.178, "step": 2840 }, { "epoch": 0.7318156937244421, "grad_norm": 0.1991717128847312, "learning_rate": 2.0360273532993197e-05, "loss": 0.3871, "step": 2841 }, { "epoch": 0.732073284605725, "grad_norm": 0.20576862098770296, "learning_rate": 2.0324068901311845e-05, "loss": 0.3311, "step": 2842 }, { "epoch": 0.7323308754870078, "grad_norm": 0.16023628152659833, "learning_rate": 2.028788827491729e-05, "loss": 0.3438, "step": 2843 }, { "epoch": 0.7325884663682906, "grad_norm": 0.16413587615962985, "learning_rate": 2.0251731683076513e-05, "loss": 0.2958, "step": 2844 }, { "epoch": 0.7328460572495734, "grad_norm": 0.1841223663022876, "learning_rate": 2.021559915503719e-05, "loss": 0.3785, "step": 2845 }, { "epoch": 0.7328460572495734, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8525405971712938, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.34912109375, "eval_runtime": 17.3349, "eval_samples_per_second": 2.538, "eval_steps_per_second": 0.173, "step": 2845 }, { "epoch": 0.7331036481308562, "grad_norm": 0.12811717473489762, "learning_rate": 2.0179490720027372e-05, "loss": 0.3372, "step": 2846 }, { "epoch": 0.733361239012139, "grad_norm": 0.1688778809301542, "learning_rate": 2.014340640725574e-05, "loss": 0.3721, "step": 2847 }, { "epoch": 0.7336188298934218, "grad_norm": 0.1388623977493131, "learning_rate": 2.0107346245911363e-05, "loss": 0.3548, "step": 2848 }, { "epoch": 0.7338764207747046, "grad_norm": 0.17128413866710143, "learning_rate": 2.007131026516385e-05, "loss": 0.3845, "step": 2849 }, { "epoch": 0.7341340116559874, "grad_norm": 0.20677829508976778, "learning_rate": 2.0035298494163242e-05, "loss": 0.5202, "step": 2850 }, { "epoch": 0.7341340116559874, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.856469355683604, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3509410619735718, "eval_runtime": 16.7754, "eval_samples_per_second": 2.623, "eval_steps_per_second": 0.179, "step": 2850 }, { "epoch": 0.7343916025372702, "grad_norm": 0.1708544325194527, "learning_rate": 1.9999310962039934e-05, "loss": 0.2936, "step": 2851 }, { "epoch": 0.734649193418553, "grad_norm": 0.1266410946760741, "learning_rate": 1.996334769790479e-05, "loss": 0.3464, "step": 2852 }, { "epoch": 0.7349067842998358, "grad_norm": 0.2469503024356025, "learning_rate": 1.992740873084899e-05, "loss": 0.4851, "step": 2853 }, { "epoch": 0.7351643751811185, "grad_norm": 0.13580119361733087, "learning_rate": 1.989149408994412e-05, "loss": 0.3464, "step": 2854 }, { "epoch": 0.7354219660624014, "grad_norm": 0.16299674356087096, "learning_rate": 1.9855603804241996e-05, "loss": 0.3548, "step": 2855 }, { "epoch": 0.7354219660624014, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.85620743844945, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3465021252632141, "eval_runtime": 18.0216, "eval_samples_per_second": 2.442, "eval_steps_per_second": 0.166, "step": 2855 }, { "epoch": 0.7356795569436841, "grad_norm": 0.15873327356315253, "learning_rate": 1.9819737902774827e-05, "loss": 0.4211, "step": 2856 }, { "epoch": 0.735937147824967, "grad_norm": 0.15839506512733864, "learning_rate": 1.9783896414555025e-05, "loss": 0.3314, "step": 2857 }, { "epoch": 0.7361947387062499, "grad_norm": 0.1452327507498212, "learning_rate": 1.9748079368575295e-05, "loss": 0.3955, "step": 2858 }, { "epoch": 0.7364523295875326, "grad_norm": 0.15903516455174, "learning_rate": 1.971228679380858e-05, "loss": 0.3542, "step": 2859 }, { "epoch": 0.7367099204688154, "grad_norm": 0.17939374114155127, "learning_rate": 1.9676518719207977e-05, "loss": 0.4656, "step": 2860 }, { "epoch": 0.7367099204688154, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 AUC (fixed)": 0.855945521215296, "eval_PRM F1 Neg": 0.6, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3450816869735718, "eval_runtime": 17.0479, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 2860 }, { "epoch": 0.7369675113500982, "grad_norm": 0.15200576468787627, "learning_rate": 1.964077517370681e-05, "loss": 0.3171, "step": 2861 }, { "epoch": 0.737225102231381, "grad_norm": 0.21334655667634317, "learning_rate": 1.9605056186218556e-05, "loss": 0.4409, "step": 2862 }, { "epoch": 0.7374826931126638, "grad_norm": 0.14205795400710666, "learning_rate": 1.9569361785636797e-05, "loss": 0.3282, "step": 2863 }, { "epoch": 0.7377402839939466, "grad_norm": 0.20040320969796976, "learning_rate": 1.953369200083527e-05, "loss": 0.3636, "step": 2864 }, { "epoch": 0.7379978748752294, "grad_norm": 0.11111142214894738, "learning_rate": 1.949804686066772e-05, "loss": 0.2554, "step": 2865 }, { "epoch": 0.7379978748752294, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.8520167627029859, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3450372815132141, "eval_runtime": 17.6178, "eval_samples_per_second": 2.497, "eval_steps_per_second": 0.17, "step": 2865 }, { "epoch": 0.7382554657565122, "grad_norm": 0.18847941333564858, "learning_rate": 1.946242639396809e-05, "loss": 0.3828, "step": 2866 }, { "epoch": 0.738513056637795, "grad_norm": 0.18877652381601745, "learning_rate": 1.9426830629550242e-05, "loss": 0.4274, "step": 2867 }, { "epoch": 0.7387706475190778, "grad_norm": 0.16026963134003505, "learning_rate": 1.939125959620812e-05, "loss": 0.3781, "step": 2868 }, { "epoch": 0.7390282384003606, "grad_norm": 0.18082191678975715, "learning_rate": 1.935571332271562e-05, "loss": 0.3381, "step": 2869 }, { "epoch": 0.7392858292816434, "grad_norm": 0.15372085179022296, "learning_rate": 1.9320191837826645e-05, "loss": 0.4042, "step": 2870 }, { "epoch": 0.7392858292816434, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 AUC (fixed)": 0.8504452592980618, "eval_PRM F1 Neg": 0.6, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3495649993419647, "eval_runtime": 16.936, "eval_samples_per_second": 2.598, "eval_steps_per_second": 0.177, "step": 2870 }, { "epoch": 0.7395434201629262, "grad_norm": 0.14695245780883914, "learning_rate": 1.9284695170275054e-05, "loss": 0.3517, "step": 2871 }, { "epoch": 0.739801011044209, "grad_norm": 0.12643757593323876, "learning_rate": 1.9249223348774576e-05, "loss": 0.3489, "step": 2872 }, { "epoch": 0.7400586019254919, "grad_norm": 0.19796817841926875, "learning_rate": 1.921377640201889e-05, "loss": 0.4138, "step": 2873 }, { "epoch": 0.7403161928067746, "grad_norm": 0.1298000475881407, "learning_rate": 1.917835435868155e-05, "loss": 0.3158, "step": 2874 }, { "epoch": 0.7405737836880575, "grad_norm": 0.13516710204554838, "learning_rate": 1.914295724741596e-05, "loss": 0.3638, "step": 2875 }, { "epoch": 0.7405737836880575, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8514929282346779, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3528497815132141, "eval_runtime": 17.5638, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 2875 }, { "epoch": 0.7408313745693402, "grad_norm": 0.17167873035919043, "learning_rate": 1.9107585096855347e-05, "loss": 0.3429, "step": 2876 }, { "epoch": 0.7410889654506231, "grad_norm": 0.13290459640636187, "learning_rate": 1.9072237935612723e-05, "loss": 0.3138, "step": 2877 }, { "epoch": 0.7413465563319058, "grad_norm": 0.19189743311010096, "learning_rate": 1.903691579228094e-05, "loss": 0.3939, "step": 2878 }, { "epoch": 0.7416041472131887, "grad_norm": 0.16895816792952276, "learning_rate": 1.9001618695432587e-05, "loss": 0.42, "step": 2879 }, { "epoch": 0.7418617380944714, "grad_norm": 0.14064985293965904, "learning_rate": 1.896634667362e-05, "loss": 0.3335, "step": 2880 }, { "epoch": 0.7418617380944714, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8551597695128339, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3513849377632141, "eval_runtime": 17.0451, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 2880 }, { "epoch": 0.7421193289757543, "grad_norm": 0.18602414961212507, "learning_rate": 1.8931099755375203e-05, "loss": 0.3734, "step": 2881 }, { "epoch": 0.742376919857037, "grad_norm": 0.15488617309263178, "learning_rate": 1.8895877969209942e-05, "loss": 0.3407, "step": 2882 }, { "epoch": 0.7426345107383199, "grad_norm": 0.15243021960849687, "learning_rate": 1.8860681343615637e-05, "loss": 0.396, "step": 2883 }, { "epoch": 0.7428921016196026, "grad_norm": 0.1580456194150447, "learning_rate": 1.8825509907063327e-05, "loss": 0.3891, "step": 2884 }, { "epoch": 0.7431496925008855, "grad_norm": 0.14722958450716395, "learning_rate": 1.8790363688003715e-05, "loss": 0.3335, "step": 2885 }, { "epoch": 0.7431496925008855, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8658536585365854, "eval_PRM F1 AUC": 0.710319539025668, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.5416666666666666, "eval_PRM NPV": 0.52, "eval_PRM Precision": 0.8765432098765432, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.34659090638160706, "eval_runtime": 16.8948, "eval_samples_per_second": 2.604, "eval_steps_per_second": 0.178, "step": 2885 }, { "epoch": 0.7434072833821682, "grad_norm": 0.14951969006379529, "learning_rate": 1.8755242714867033e-05, "loss": 0.3679, "step": 2886 }, { "epoch": 0.7436648742634511, "grad_norm": 0.20213164773469453, "learning_rate": 1.872014701606321e-05, "loss": 0.3379, "step": 2887 }, { "epoch": 0.7439224651447339, "grad_norm": 0.15156321122722566, "learning_rate": 1.8685076619981608e-05, "loss": 0.4043, "step": 2888 }, { "epoch": 0.7441800560260167, "grad_norm": 0.1691706422290455, "learning_rate": 1.8650031554991204e-05, "loss": 0.397, "step": 2889 }, { "epoch": 0.7444376469072995, "grad_norm": 0.17246103476737243, "learning_rate": 1.861501184944043e-05, "loss": 0.4437, "step": 2890 }, { "epoch": 0.7444376469072995, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8543740178103718, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3437943756580353, "eval_runtime": 16.8841, "eval_samples_per_second": 2.606, "eval_steps_per_second": 0.178, "step": 2890 }, { "epoch": 0.7446952377885823, "grad_norm": 0.1400396128521265, "learning_rate": 1.858001753165724e-05, "loss": 0.3539, "step": 2891 }, { "epoch": 0.7449528286698651, "grad_norm": 0.17662014355854183, "learning_rate": 1.8545048629949053e-05, "loss": 0.4447, "step": 2892 }, { "epoch": 0.7452104195511479, "grad_norm": 0.1482406577038468, "learning_rate": 1.8510105172602693e-05, "loss": 0.3367, "step": 2893 }, { "epoch": 0.7454680104324307, "grad_norm": 0.12641438932045507, "learning_rate": 1.847518718788443e-05, "loss": 0.32, "step": 2894 }, { "epoch": 0.7457256013137135, "grad_norm": 0.1585391209790409, "learning_rate": 1.844029470403993e-05, "loss": 0.4044, "step": 2895 }, { "epoch": 0.7457256013137135, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8522786799371398, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3456587493419647, "eval_runtime": 17.5313, "eval_samples_per_second": 2.51, "eval_steps_per_second": 0.171, "step": 2895 }, { "epoch": 0.7459831921949963, "grad_norm": 0.16251051820303028, "learning_rate": 1.8405427749294234e-05, "loss": 0.3462, "step": 2896 }, { "epoch": 0.7462407830762791, "grad_norm": 0.17249731070989127, "learning_rate": 1.837058635185172e-05, "loss": 0.3703, "step": 2897 }, { "epoch": 0.7464983739575619, "grad_norm": 0.1519789464954743, "learning_rate": 1.8335770539896062e-05, "loss": 0.3211, "step": 2898 }, { "epoch": 0.7467559648388447, "grad_norm": 0.12250229087928584, "learning_rate": 1.8300980341590297e-05, "loss": 0.3416, "step": 2899 }, { "epoch": 0.7470135557201275, "grad_norm": 0.12434608201649983, "learning_rate": 1.8266215785076708e-05, "loss": 0.3311, "step": 2900 }, { "epoch": 0.7470135557201275, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.857778941854374, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3418412506580353, "eval_runtime": 17.0572, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 2900 }, { "epoch": 0.7472711466014104, "grad_norm": 0.1492807344471492, "learning_rate": 1.8231476898476867e-05, "loss": 0.331, "step": 2901 }, { "epoch": 0.7475287374826931, "grad_norm": 0.1413288815423703, "learning_rate": 1.8196763709891524e-05, "loss": 0.2894, "step": 2902 }, { "epoch": 0.747786328363976, "grad_norm": 0.1452211515922782, "learning_rate": 1.816207624740069e-05, "loss": 0.3075, "step": 2903 }, { "epoch": 0.7480439192452587, "grad_norm": 0.1480829176685368, "learning_rate": 1.812741453906357e-05, "loss": 0.3622, "step": 2904 }, { "epoch": 0.7483015101265416, "grad_norm": 0.15788110558347976, "learning_rate": 1.8092778612918482e-05, "loss": 0.3923, "step": 2905 }, { "epoch": 0.7483015101265416, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.85620743844945, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34512606263160706, "eval_runtime": 17.7062, "eval_samples_per_second": 2.485, "eval_steps_per_second": 0.169, "step": 2905 }, { "epoch": 0.7485591010078243, "grad_norm": 0.15126243423791813, "learning_rate": 1.8058168496982963e-05, "loss": 0.3614, "step": 2906 }, { "epoch": 0.7488166918891072, "grad_norm": 0.16507873655754893, "learning_rate": 1.8023584219253575e-05, "loss": 0.4163, "step": 2907 }, { "epoch": 0.7490742827703899, "grad_norm": 0.1488832117971817, "learning_rate": 1.798902580770611e-05, "loss": 0.3626, "step": 2908 }, { "epoch": 0.7493318736516728, "grad_norm": 0.1513545373401777, "learning_rate": 1.795449329029531e-05, "loss": 0.3941, "step": 2909 }, { "epoch": 0.7495894645329555, "grad_norm": 0.13517131173517444, "learning_rate": 1.791998669495506e-05, "loss": 0.3546, "step": 2910 }, { "epoch": 0.7495894645329555, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8590885280251441, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3465021252632141, "eval_runtime": 17.5578, "eval_samples_per_second": 2.506, "eval_steps_per_second": 0.171, "step": 2910 }, { "epoch": 0.7498470554142384, "grad_norm": 0.22523685544678199, "learning_rate": 1.78855060495982e-05, "loss": 0.4323, "step": 2911 }, { "epoch": 0.7501046462955211, "grad_norm": 0.1718645357263855, "learning_rate": 1.7851051382116646e-05, "loss": 0.4329, "step": 2912 }, { "epoch": 0.750362237176804, "grad_norm": 0.16909439145573646, "learning_rate": 1.7816622720381283e-05, "loss": 0.3165, "step": 2913 }, { "epoch": 0.7506198280580867, "grad_norm": 0.14053595469665883, "learning_rate": 1.778222009224192e-05, "loss": 0.3302, "step": 2914 }, { "epoch": 0.7508774189393695, "grad_norm": 0.1503230658218862, "learning_rate": 1.7747843525527353e-05, "loss": 0.3257, "step": 2915 }, { "epoch": 0.7508774189393695, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.854635935044526, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34787818789482117, "eval_runtime": 17.3232, "eval_samples_per_second": 2.54, "eval_steps_per_second": 0.173, "step": 2915 }, { "epoch": 0.7511350098206524, "grad_norm": 0.15720921123220546, "learning_rate": 1.7713493048045294e-05, "loss": 0.3257, "step": 2916 }, { "epoch": 0.7513926007019351, "grad_norm": 0.13069791043410423, "learning_rate": 1.767916868758231e-05, "loss": 0.3076, "step": 2917 }, { "epoch": 0.751650191583218, "grad_norm": 0.17679548430754036, "learning_rate": 1.7644870471903897e-05, "loss": 0.4254, "step": 2918 }, { "epoch": 0.7519077824645007, "grad_norm": 0.1207566534633257, "learning_rate": 1.7610598428754337e-05, "loss": 0.3105, "step": 2919 }, { "epoch": 0.7521653733457836, "grad_norm": 0.14864696819534934, "learning_rate": 1.7576352585856808e-05, "loss": 0.3577, "step": 2920 }, { "epoch": 0.7521653733457836, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.857778941854374, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.34912109375, "eval_runtime": 17.493, "eval_samples_per_second": 2.515, "eval_steps_per_second": 0.171, "step": 2920 }, { "epoch": 0.7524229642270663, "grad_norm": 0.16679396112225395, "learning_rate": 1.754213297091325e-05, "loss": 0.4314, "step": 2921 }, { "epoch": 0.7526805551083492, "grad_norm": 0.19271587669515353, "learning_rate": 1.7507939611604428e-05, "loss": 0.3953, "step": 2922 }, { "epoch": 0.7529381459896319, "grad_norm": 0.17871937531964524, "learning_rate": 1.747377253558982e-05, "loss": 0.4266, "step": 2923 }, { "epoch": 0.7531957368709148, "grad_norm": 0.13026572785919774, "learning_rate": 1.743963177050763e-05, "loss": 0.3305, "step": 2924 }, { "epoch": 0.7534533277521975, "grad_norm": 0.1453669538080503, "learning_rate": 1.7405517343974887e-05, "loss": 0.4153, "step": 2925 }, { "epoch": 0.7534533277521975, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.855683603981142, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.35000887513160706, "eval_runtime": 17.4626, "eval_samples_per_second": 2.52, "eval_steps_per_second": 0.172, "step": 2925 }, { "epoch": 0.7537109186334804, "grad_norm": 0.24307759373423093, "learning_rate": 1.7371429283587177e-05, "loss": 0.3801, "step": 2926 }, { "epoch": 0.7539685095147631, "grad_norm": 0.14212415088413297, "learning_rate": 1.733736761691887e-05, "loss": 0.3175, "step": 2927 }, { "epoch": 0.754226100396046, "grad_norm": 0.15282471754587118, "learning_rate": 1.730333237152289e-05, "loss": 0.3233, "step": 2928 }, { "epoch": 0.7544836912773287, "grad_norm": 0.13897934498451875, "learning_rate": 1.7269323574930864e-05, "loss": 0.3659, "step": 2929 }, { "epoch": 0.7547412821586116, "grad_norm": 0.1695791763278988, "learning_rate": 1.7235341254653005e-05, "loss": 0.3957, "step": 2930 }, { "epoch": 0.7547412821586116, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8564693556836039, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3519176244735718, "eval_runtime": 17.0676, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 2930 }, { "epoch": 0.7549988730398944, "grad_norm": 0.16179982830368525, "learning_rate": 1.720138543817807e-05, "loss": 0.3185, "step": 2931 }, { "epoch": 0.7552564639211772, "grad_norm": 0.23922589104682979, "learning_rate": 1.7167456152973423e-05, "loss": 0.3178, "step": 2932 }, { "epoch": 0.75551405480246, "grad_norm": 0.20969924399766007, "learning_rate": 1.7133553426484944e-05, "loss": 0.4275, "step": 2933 }, { "epoch": 0.7557716456837428, "grad_norm": 0.16089740417640336, "learning_rate": 1.7099677286137066e-05, "loss": 0.3567, "step": 2934 }, { "epoch": 0.7560292365650256, "grad_norm": 0.12886208418372316, "learning_rate": 1.7065827759332635e-05, "loss": 0.3124, "step": 2935 }, { "epoch": 0.7560292365650256, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.85751702462022, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3492986559867859, "eval_runtime": 17.5164, "eval_samples_per_second": 2.512, "eval_steps_per_second": 0.171, "step": 2935 }, { "epoch": 0.7562868274463084, "grad_norm": 0.1337285576937397, "learning_rate": 1.7032004873453067e-05, "loss": 0.3412, "step": 2936 }, { "epoch": 0.7565444183275912, "grad_norm": 0.1664150507331768, "learning_rate": 1.6998208655858137e-05, "loss": 0.4291, "step": 2937 }, { "epoch": 0.756802009208874, "grad_norm": 0.13580790660922049, "learning_rate": 1.6964439133886113e-05, "loss": 0.3988, "step": 2938 }, { "epoch": 0.7570596000901568, "grad_norm": 0.1404404085199257, "learning_rate": 1.6930696334853662e-05, "loss": 0.345, "step": 2939 }, { "epoch": 0.7573171909714396, "grad_norm": 0.15238213854304544, "learning_rate": 1.689698028605578e-05, "loss": 0.3218, "step": 2940 }, { "epoch": 0.7573171909714396, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8596123624934521, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3463689684867859, "eval_runtime": 16.9174, "eval_samples_per_second": 2.601, "eval_steps_per_second": 0.177, "step": 2940 }, { "epoch": 0.7575747818527224, "grad_norm": 0.13425930199780564, "learning_rate": 1.6863291014765892e-05, "loss": 0.3337, "step": 2941 }, { "epoch": 0.7578323727340052, "grad_norm": 0.16054514975701115, "learning_rate": 1.6829628548235714e-05, "loss": 0.3058, "step": 2942 }, { "epoch": 0.758089963615288, "grad_norm": 0.16866158814780352, "learning_rate": 1.6795992913695336e-05, "loss": 0.3933, "step": 2943 }, { "epoch": 0.7583475544965709, "grad_norm": 0.13142791020502617, "learning_rate": 1.6762384138353078e-05, "loss": 0.318, "step": 2944 }, { "epoch": 0.7586051453778536, "grad_norm": 0.15822763947870488, "learning_rate": 1.6728802249395526e-05, "loss": 0.3451, "step": 2945 }, { "epoch": 0.7586051453778536, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8632792037716082, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34716796875, "eval_runtime": 16.8788, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 2945 }, { "epoch": 0.7588627362591365, "grad_norm": 0.17066267423933648, "learning_rate": 1.6695247273987624e-05, "loss": 0.3425, "step": 2946 }, { "epoch": 0.7591203271404192, "grad_norm": 0.11733629413361088, "learning_rate": 1.666171923927242e-05, "loss": 0.2829, "step": 2947 }, { "epoch": 0.7593779180217021, "grad_norm": 0.1925757723152739, "learning_rate": 1.6628218172371256e-05, "loss": 0.3487, "step": 2948 }, { "epoch": 0.7596355089029848, "grad_norm": 0.11046305102940092, "learning_rate": 1.65947441003836e-05, "loss": 0.2704, "step": 2949 }, { "epoch": 0.7598930997842677, "grad_norm": 0.12447076120217489, "learning_rate": 1.6561297050387115e-05, "loss": 0.357, "step": 2950 }, { "epoch": 0.7598930997842677, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8593504452592979, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3507634997367859, "eval_runtime": 17.1561, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 2950 }, { "epoch": 0.7601506906655504, "grad_norm": 0.20224682982646164, "learning_rate": 1.6527877049437622e-05, "loss": 0.442, "step": 2951 }, { "epoch": 0.7604082815468333, "grad_norm": 0.14177204700939802, "learning_rate": 1.649448412456901e-05, "loss": 0.2664, "step": 2952 }, { "epoch": 0.760665872428116, "grad_norm": 0.2889674168079724, "learning_rate": 1.646111830279331e-05, "loss": 0.5855, "step": 2953 }, { "epoch": 0.7609234633093989, "grad_norm": 0.16607495086402554, "learning_rate": 1.642777961110061e-05, "loss": 0.3882, "step": 2954 }, { "epoch": 0.7611810541906816, "grad_norm": 0.18332211113271998, "learning_rate": 1.6394468076459075e-05, "loss": 0.377, "step": 2955 }, { "epoch": 0.7611810541906816, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8564693556836039, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3504527807235718, "eval_runtime": 16.9539, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 2955 }, { "epoch": 0.7614386450719645, "grad_norm": 0.13803947369702252, "learning_rate": 1.6361183725814854e-05, "loss": 0.3689, "step": 2956 }, { "epoch": 0.7616962359532472, "grad_norm": 0.14152335309676822, "learning_rate": 1.6327926586092164e-05, "loss": 0.3651, "step": 2957 }, { "epoch": 0.7619538268345301, "grad_norm": 0.14016725907975244, "learning_rate": 1.6294696684193154e-05, "loss": 0.3171, "step": 2958 }, { "epoch": 0.7622114177158129, "grad_norm": 0.1701719017758532, "learning_rate": 1.626149404699799e-05, "loss": 0.3681, "step": 2959 }, { "epoch": 0.7624690085970957, "grad_norm": 0.14654085957327564, "learning_rate": 1.6228318701364766e-05, "loss": 0.3471, "step": 2960 }, { "epoch": 0.7624690085970957, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8522786799371399, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3520951569080353, "eval_runtime": 17.1812, "eval_samples_per_second": 2.561, "eval_steps_per_second": 0.175, "step": 2960 }, { "epoch": 0.7627265994783785, "grad_norm": 0.19656535107566206, "learning_rate": 1.619517067412947e-05, "loss": 0.3658, "step": 2961 }, { "epoch": 0.7629841903596613, "grad_norm": 0.14743344260199182, "learning_rate": 1.6162049992106028e-05, "loss": 0.402, "step": 2962 }, { "epoch": 0.7632417812409441, "grad_norm": 0.15003486832519877, "learning_rate": 1.6128956682086244e-05, "loss": 0.3789, "step": 2963 }, { "epoch": 0.7634993721222268, "grad_norm": 0.1478983781365589, "learning_rate": 1.6095890770839785e-05, "loss": 0.3257, "step": 2964 }, { "epoch": 0.7637569630035097, "grad_norm": 0.16434245775381556, "learning_rate": 1.6062852285114123e-05, "loss": 0.3357, "step": 2965 }, { "epoch": 0.7637569630035097, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35653409361839294, "eval_runtime": 17.0825, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 2965 }, { "epoch": 0.7640145538847924, "grad_norm": 0.18186633279718095, "learning_rate": 1.602984125163453e-05, "loss": 0.4663, "step": 2966 }, { "epoch": 0.7642721447660753, "grad_norm": 0.16844634436853015, "learning_rate": 1.5996857697104173e-05, "loss": 0.4044, "step": 2967 }, { "epoch": 0.764529735647358, "grad_norm": 0.1545485980685033, "learning_rate": 1.5963901648203873e-05, "loss": 0.4153, "step": 2968 }, { "epoch": 0.7647873265286409, "grad_norm": 0.2063714841277203, "learning_rate": 1.5930973131592287e-05, "loss": 0.4315, "step": 2969 }, { "epoch": 0.7650449174099236, "grad_norm": 0.1705379775897913, "learning_rate": 1.5898072173905726e-05, "loss": 0.3686, "step": 2970 }, { "epoch": 0.7650449174099236, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8567312729177581, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.35684481263160706, "eval_runtime": 16.5503, "eval_samples_per_second": 2.659, "eval_steps_per_second": 0.181, "step": 2970 }, { "epoch": 0.7653025082912065, "grad_norm": 0.16356938844768326, "learning_rate": 1.586519880175827e-05, "loss": 0.3312, "step": 2971 }, { "epoch": 0.7655600991724892, "grad_norm": 0.15365701888615851, "learning_rate": 1.583235304174167e-05, "loss": 0.3351, "step": 2972 }, { "epoch": 0.7658176900537721, "grad_norm": 0.12856143044646068, "learning_rate": 1.5799534920425306e-05, "loss": 0.3165, "step": 2973 }, { "epoch": 0.766075280935055, "grad_norm": 0.16976094460049398, "learning_rate": 1.576674446435624e-05, "loss": 0.3903, "step": 2974 }, { "epoch": 0.7663328718163377, "grad_norm": 0.1349218547438422, "learning_rate": 1.573398170005915e-05, "loss": 0.3744, "step": 2975 }, { "epoch": 0.7663328718163377, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3609730005264282, "eval_runtime": 17.4479, "eval_samples_per_second": 2.522, "eval_steps_per_second": 0.172, "step": 2975 }, { "epoch": 0.7665904626976205, "grad_norm": 0.14586490633803456, "learning_rate": 1.570124665403632e-05, "loss": 0.2993, "step": 2976 }, { "epoch": 0.7668480535789033, "grad_norm": 0.17185579787156047, "learning_rate": 1.566853935276758e-05, "loss": 0.46, "step": 2977 }, { "epoch": 0.7671056444601861, "grad_norm": 0.15102550584338897, "learning_rate": 1.563585982271032e-05, "loss": 0.3124, "step": 2978 }, { "epoch": 0.7673632353414689, "grad_norm": 0.1813132581237937, "learning_rate": 1.5603208090299498e-05, "loss": 0.4488, "step": 2979 }, { "epoch": 0.7676208262227517, "grad_norm": 0.17197077484984621, "learning_rate": 1.557058418194757e-05, "loss": 0.4041, "step": 2980 }, { "epoch": 0.7676208262227517, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9058823529411765, "eval_PRM F1 AUC": 0.746464117338921, "eval_PRM F1 AUC (fixed)": 0.8538501833420639, "eval_PRM F1 Neg": 0.6190476190476191, "eval_PRM NPV": 0.6842105263157895, "eval_PRM Precision": 0.8850574712643678, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3643909692764282, "eval_runtime": 17.3241, "eval_samples_per_second": 2.54, "eval_steps_per_second": 0.173, "step": 2980 }, { "epoch": 0.7678784171040345, "grad_norm": 0.148938786911208, "learning_rate": 1.5537988124044495e-05, "loss": 0.346, "step": 2981 }, { "epoch": 0.7681360079853173, "grad_norm": 0.15400556027034898, "learning_rate": 1.5505419942957668e-05, "loss": 0.4183, "step": 2982 }, { "epoch": 0.7683935988666001, "grad_norm": 0.15300890855965438, "learning_rate": 1.5472879665031965e-05, "loss": 0.3504, "step": 2983 }, { "epoch": 0.7686511897478829, "grad_norm": 0.13426689113485515, "learning_rate": 1.544036731658971e-05, "loss": 0.3121, "step": 2984 }, { "epoch": 0.7689087806291657, "grad_norm": 0.15191938007208422, "learning_rate": 1.5407882923930565e-05, "loss": 0.3667, "step": 2985 }, { "epoch": 0.7689087806291657, "eval_PRM Accuracy": 0.8490566037735849, "eval_PRM F1": 0.9058823529411765, "eval_PRM F1 AUC": 0.746464117338921, "eval_PRM F1 AUC (fixed)": 0.8530644316396018, "eval_PRM F1 Neg": 0.6190476190476191, "eval_PRM NPV": 0.6842105263157895, "eval_PRM Precision": 0.8850574712643678, "eval_PRM Recall": 0.927710843373494, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3705610930919647, "eval_runtime": 16.981, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 2985 }, { "epoch": 0.7691663715104485, "grad_norm": 0.13208861504575023, "learning_rate": 1.537542651333167e-05, "loss": 0.3071, "step": 2986 }, { "epoch": 0.7694239623917314, "grad_norm": 0.12707672366812425, "learning_rate": 1.534299811104742e-05, "loss": 0.3703, "step": 2987 }, { "epoch": 0.7696815532730141, "grad_norm": 0.12697393465493456, "learning_rate": 1.5310597743309684e-05, "loss": 0.3754, "step": 2988 }, { "epoch": 0.769939144154297, "grad_norm": 0.12172270298945981, "learning_rate": 1.5278225436327536e-05, "loss": 0.316, "step": 2989 }, { "epoch": 0.7701967350355797, "grad_norm": 0.18743615861942842, "learning_rate": 1.5245881216287433e-05, "loss": 0.4215, "step": 2990 }, { "epoch": 0.7701967350355797, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8994082840236687, "eval_PRM F1 AUC": 0.7404400209533788, "eval_PRM F1 AUC (fixed)": 0.8486118386589837, "eval_PRM F1 Neg": 0.6046511627906976, "eval_PRM NPV": 0.65, "eval_PRM Precision": 0.8837209302325582, "eval_PRM Recall": 0.9156626506024096, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3681196868419647, "eval_runtime": 17.2366, "eval_samples_per_second": 2.553, "eval_steps_per_second": 0.174, "step": 2990 }, { "epoch": 0.7704543259168626, "grad_norm": 0.11547746948552717, "learning_rate": 1.5213565109353045e-05, "loss": 0.3056, "step": 2991 }, { "epoch": 0.7707119167981453, "grad_norm": 0.12374691774652735, "learning_rate": 1.5181277141665356e-05, "loss": 0.2785, "step": 2992 }, { "epoch": 0.7709695076794282, "grad_norm": 0.13162751974187664, "learning_rate": 1.5149017339342574e-05, "loss": 0.3711, "step": 2993 }, { "epoch": 0.7712270985607109, "grad_norm": 0.2034467324859911, "learning_rate": 1.5116785728480093e-05, "loss": 0.3958, "step": 2994 }, { "epoch": 0.7714846894419938, "grad_norm": 0.15343478310052172, "learning_rate": 1.5084582335150538e-05, "loss": 0.3587, "step": 2995 }, { "epoch": 0.7714846894419938, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8478260869565218, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3704723119735718, "eval_runtime": 16.8955, "eval_samples_per_second": 2.604, "eval_steps_per_second": 0.178, "step": 2995 }, { "epoch": 0.7717422803232765, "grad_norm": 0.1080886012047265, "learning_rate": 1.5052407185403694e-05, "loss": 0.2992, "step": 2996 }, { "epoch": 0.7719998712045594, "grad_norm": 0.12905574745651321, "learning_rate": 1.502026030526652e-05, "loss": 0.3368, "step": 2997 }, { "epoch": 0.7722574620858421, "grad_norm": 0.16972772518993512, "learning_rate": 1.4988141720743076e-05, "loss": 0.3682, "step": 2998 }, { "epoch": 0.772515052967125, "grad_norm": 0.17634437263973804, "learning_rate": 1.4956051457814523e-05, "loss": 0.3871, "step": 2999 }, { "epoch": 0.7727726438484077, "grad_norm": 0.18345313042461878, "learning_rate": 1.4923989542439159e-05, "loss": 0.4054, "step": 3000 }, { "epoch": 0.7727726438484077, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8486118386589838, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.36376953125, "eval_runtime": 17.6273, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 3000 }, { "epoch": 0.7730302347296906, "grad_norm": 0.14058774963976547, "learning_rate": 1.489195600055232e-05, "loss": 0.3141, "step": 3001 }, { "epoch": 0.7732878256109734, "grad_norm": 0.11834801102658438, "learning_rate": 1.4859950858066424e-05, "loss": 0.3114, "step": 3002 }, { "epoch": 0.7735454164922562, "grad_norm": 0.14146204912084168, "learning_rate": 1.4827974140870849e-05, "loss": 0.3947, "step": 3003 }, { "epoch": 0.773803007373539, "grad_norm": 0.14557895519871822, "learning_rate": 1.4796025874832042e-05, "loss": 0.3476, "step": 3004 }, { "epoch": 0.7740605982548218, "grad_norm": 0.16390764566271313, "learning_rate": 1.4764106085793427e-05, "loss": 0.287, "step": 3005 }, { "epoch": 0.7740605982548218, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8509690937663699, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3579545319080353, "eval_runtime": 16.7006, "eval_samples_per_second": 2.635, "eval_steps_per_second": 0.18, "step": 3005 }, { "epoch": 0.7743181891361046, "grad_norm": 0.15783892818399603, "learning_rate": 1.4732214799575356e-05, "loss": 0.3265, "step": 3006 }, { "epoch": 0.7745757800173874, "grad_norm": 0.16701388547454737, "learning_rate": 1.4700352041975168e-05, "loss": 0.3967, "step": 3007 }, { "epoch": 0.7748333708986702, "grad_norm": 0.1342244226008435, "learning_rate": 1.466851783876706e-05, "loss": 0.2996, "step": 3008 }, { "epoch": 0.775090961779953, "grad_norm": 0.15096247697832504, "learning_rate": 1.4636712215702247e-05, "loss": 0.4116, "step": 3009 }, { "epoch": 0.7753485526612358, "grad_norm": 0.15733531131676592, "learning_rate": 1.46049351985087e-05, "loss": 0.4415, "step": 3010 }, { "epoch": 0.7753485526612358, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.855945521215296, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35888671875, "eval_runtime": 17.1656, "eval_samples_per_second": 2.563, "eval_steps_per_second": 0.175, "step": 3010 }, { "epoch": 0.7756061435425186, "grad_norm": 0.16011601782689275, "learning_rate": 1.4573186812891343e-05, "loss": 0.4263, "step": 3011 }, { "epoch": 0.7758637344238014, "grad_norm": 0.1284198666376941, "learning_rate": 1.4541467084531863e-05, "loss": 0.3166, "step": 3012 }, { "epoch": 0.7761213253050842, "grad_norm": 0.1292310144891526, "learning_rate": 1.4509776039088818e-05, "loss": 0.3549, "step": 3013 }, { "epoch": 0.776378916186367, "grad_norm": 0.1549120024576305, "learning_rate": 1.447811370219757e-05, "loss": 0.3612, "step": 3014 }, { "epoch": 0.7766365070676498, "grad_norm": 0.1306904460810586, "learning_rate": 1.4446480099470206e-05, "loss": 0.3393, "step": 3015 }, { "epoch": 0.7766365070676498, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8590885280251441, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3525390625, "eval_runtime": 17.5607, "eval_samples_per_second": 2.506, "eval_steps_per_second": 0.171, "step": 3015 }, { "epoch": 0.7768940979489326, "grad_norm": 0.16467995650531836, "learning_rate": 1.4414875256495635e-05, "loss": 0.4474, "step": 3016 }, { "epoch": 0.7771516888302155, "grad_norm": 0.1247034305420687, "learning_rate": 1.4383299198839418e-05, "loss": 0.3611, "step": 3017 }, { "epoch": 0.7774092797114982, "grad_norm": 0.19180123036774666, "learning_rate": 1.435175195204394e-05, "loss": 0.3799, "step": 3018 }, { "epoch": 0.7776668705927811, "grad_norm": 0.1847733317728554, "learning_rate": 1.4320233541628197e-05, "loss": 0.4825, "step": 3019 }, { "epoch": 0.7779244614740638, "grad_norm": 0.1265021722333401, "learning_rate": 1.4288743993087867e-05, "loss": 0.2939, "step": 3020 }, { "epoch": 0.7779244614740638, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8577789418543741, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3505859375, "eval_runtime": 17.5839, "eval_samples_per_second": 2.502, "eval_steps_per_second": 0.171, "step": 3020 }, { "epoch": 0.7781820523553467, "grad_norm": 0.15997535301777288, "learning_rate": 1.4257283331895315e-05, "loss": 0.3022, "step": 3021 }, { "epoch": 0.7784396432366294, "grad_norm": 0.1544326027362218, "learning_rate": 1.4225851583499516e-05, "loss": 0.4364, "step": 3022 }, { "epoch": 0.7786972341179123, "grad_norm": 0.1213826151566587, "learning_rate": 1.4194448773326085e-05, "loss": 0.361, "step": 3023 }, { "epoch": 0.778954824999195, "grad_norm": 0.15962484723358972, "learning_rate": 1.4163074926777186e-05, "loss": 0.3715, "step": 3024 }, { "epoch": 0.7792124158804778, "grad_norm": 0.1577184412829596, "learning_rate": 1.4131730069231546e-05, "loss": 0.3616, "step": 3025 }, { "epoch": 0.7792124158804778, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.8569931901519119, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3513849377632141, "eval_runtime": 17.0796, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 3025 }, { "epoch": 0.7794700067617606, "grad_norm": 0.13538587204028882, "learning_rate": 1.4100414226044528e-05, "loss": 0.3105, "step": 3026 }, { "epoch": 0.7797275976430434, "grad_norm": 0.12051611552810815, "learning_rate": 1.4069127422547928e-05, "loss": 0.3154, "step": 3027 }, { "epoch": 0.7799851885243262, "grad_norm": 0.12716379710372344, "learning_rate": 1.4037869684050115e-05, "loss": 0.2933, "step": 3028 }, { "epoch": 0.780242779405609, "grad_norm": 0.11789709782620507, "learning_rate": 1.4006641035835888e-05, "loss": 0.2429, "step": 3029 }, { "epoch": 0.7805003702868919, "grad_norm": 0.14166167889211181, "learning_rate": 1.3975441503166575e-05, "loss": 0.3559, "step": 3030 }, { "epoch": 0.7805003702868919, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.860398114195914, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3520064055919647, "eval_runtime": 16.4473, "eval_samples_per_second": 2.675, "eval_steps_per_second": 0.182, "step": 3030 }, { "epoch": 0.7807579611681746, "grad_norm": 0.12712463415874173, "learning_rate": 1.3944271111279938e-05, "loss": 0.3194, "step": 3031 }, { "epoch": 0.7810155520494575, "grad_norm": 0.14169961581983545, "learning_rate": 1.391312988539012e-05, "loss": 0.3189, "step": 3032 }, { "epoch": 0.7812731429307402, "grad_norm": 0.14890365714154657, "learning_rate": 1.3882017850687723e-05, "loss": 0.3279, "step": 3033 }, { "epoch": 0.7815307338120231, "grad_norm": 0.1340802698123587, "learning_rate": 1.3850935032339718e-05, "loss": 0.3351, "step": 3034 }, { "epoch": 0.7817883246933058, "grad_norm": 0.21072470578371352, "learning_rate": 1.3819881455489458e-05, "loss": 0.3894, "step": 3035 }, { "epoch": 0.7817883246933058, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.861183865898376, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3512517809867859, "eval_runtime": 17.0334, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 3035 }, { "epoch": 0.7820459155745887, "grad_norm": 0.11579516212958814, "learning_rate": 1.3788857145256601e-05, "loss": 0.3099, "step": 3036 }, { "epoch": 0.7823035064558714, "grad_norm": 0.16587350270262458, "learning_rate": 1.3757862126737186e-05, "loss": 0.3777, "step": 3037 }, { "epoch": 0.7825610973371543, "grad_norm": 0.16105238268832156, "learning_rate": 1.3726896425003494e-05, "loss": 0.379, "step": 3038 }, { "epoch": 0.782818688218437, "grad_norm": 0.13665198318038102, "learning_rate": 1.3695960065104141e-05, "loss": 0.3353, "step": 3039 }, { "epoch": 0.7830762790997199, "grad_norm": 0.1518393503211405, "learning_rate": 1.3665053072064015e-05, "loss": 0.3444, "step": 3040 }, { "epoch": 0.7830762790997199, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8619696176008382, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.34494850039482117, "eval_runtime": 17.5324, "eval_samples_per_second": 2.51, "eval_steps_per_second": 0.171, "step": 3040 }, { "epoch": 0.7833338699810026, "grad_norm": 0.1378995176713397, "learning_rate": 1.3634175470884191e-05, "loss": 0.3505, "step": 3041 }, { "epoch": 0.7835914608622855, "grad_norm": 0.15155051752474802, "learning_rate": 1.3603327286542023e-05, "loss": 0.3067, "step": 3042 }, { "epoch": 0.7838490517435682, "grad_norm": 0.1423207225603477, "learning_rate": 1.3572508543991042e-05, "loss": 0.3027, "step": 3043 }, { "epoch": 0.7841066426248511, "grad_norm": 0.19797254317044372, "learning_rate": 1.354171926816099e-05, "loss": 0.4265, "step": 3044 }, { "epoch": 0.7843642335061339, "grad_norm": 0.18191445341381524, "learning_rate": 1.3510959483957747e-05, "loss": 0.408, "step": 3045 }, { "epoch": 0.7843642335061339, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8624934520691462, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3435724377632141, "eval_runtime": 17.4665, "eval_samples_per_second": 2.519, "eval_steps_per_second": 0.172, "step": 3045 }, { "epoch": 0.7846218243874167, "grad_norm": 0.13857225888396082, "learning_rate": 1.3480229216263301e-05, "loss": 0.3642, "step": 3046 }, { "epoch": 0.7848794152686995, "grad_norm": 0.15968303402814563, "learning_rate": 1.3449528489935882e-05, "loss": 0.3127, "step": 3047 }, { "epoch": 0.7851370061499823, "grad_norm": 0.17219086960992772, "learning_rate": 1.3418857329809686e-05, "loss": 0.383, "step": 3048 }, { "epoch": 0.7853945970312651, "grad_norm": 0.18186358036938544, "learning_rate": 1.33882157606951e-05, "loss": 0.3826, "step": 3049 }, { "epoch": 0.7856521879125479, "grad_norm": 0.15222456939919551, "learning_rate": 1.3357603807378494e-05, "loss": 0.3642, "step": 3050 }, { "epoch": 0.7856521879125479, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.859612362493452, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3444158434867859, "eval_runtime": 17.009, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 3050 }, { "epoch": 0.7859097787938307, "grad_norm": 0.16118023948393811, "learning_rate": 1.3327021494622327e-05, "loss": 0.3317, "step": 3051 }, { "epoch": 0.7861673696751135, "grad_norm": 0.1832818767072772, "learning_rate": 1.3296468847165094e-05, "loss": 0.352, "step": 3052 }, { "epoch": 0.7864249605563963, "grad_norm": 0.1236688381910297, "learning_rate": 1.3265945889721232e-05, "loss": 0.3155, "step": 3053 }, { "epoch": 0.7866825514376791, "grad_norm": 0.12641185997577145, "learning_rate": 1.3235452646981222e-05, "loss": 0.324, "step": 3054 }, { "epoch": 0.7869401423189619, "grad_norm": 0.1509307143906646, "learning_rate": 1.320498914361148e-05, "loss": 0.3155, "step": 3055 }, { "epoch": 0.7869401423189619, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8617077003666842, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34934303164482117, "eval_runtime": 17.1533, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 3055 }, { "epoch": 0.7871977332002447, "grad_norm": 0.1935152464744341, "learning_rate": 1.317455540425439e-05, "loss": 0.3599, "step": 3056 }, { "epoch": 0.7874553240815275, "grad_norm": 0.15161289717133192, "learning_rate": 1.314415145352821e-05, "loss": 0.3343, "step": 3057 }, { "epoch": 0.7877129149628103, "grad_norm": 0.1650799941746293, "learning_rate": 1.311377731602716e-05, "loss": 0.3511, "step": 3058 }, { "epoch": 0.7879705058440931, "grad_norm": 0.1478806408444346, "learning_rate": 1.308343301632129e-05, "loss": 0.3284, "step": 3059 }, { "epoch": 0.788228096725376, "grad_norm": 0.1537392022022734, "learning_rate": 1.3053118578956552e-05, "loss": 0.3842, "step": 3060 }, { "epoch": 0.788228096725376, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8603981141959139, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.35098543763160706, "eval_runtime": 17.015, "eval_samples_per_second": 2.586, "eval_steps_per_second": 0.176, "step": 3060 }, { "epoch": 0.7884856876066587, "grad_norm": 0.14616295653136274, "learning_rate": 1.3022834028454745e-05, "loss": 0.3689, "step": 3061 }, { "epoch": 0.7887432784879416, "grad_norm": 0.23036871894570896, "learning_rate": 1.2992579389313447e-05, "loss": 0.4226, "step": 3062 }, { "epoch": 0.7890008693692243, "grad_norm": 0.17726641686505862, "learning_rate": 1.2962354686006084e-05, "loss": 0.389, "step": 3063 }, { "epoch": 0.7892584602505072, "grad_norm": 0.23808118890056537, "learning_rate": 1.2932159942981859e-05, "loss": 0.4003, "step": 3064 }, { "epoch": 0.7895160511317899, "grad_norm": 0.1888630927913337, "learning_rate": 1.2901995184665738e-05, "loss": 0.3082, "step": 3065 }, { "epoch": 0.7895160511317899, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8727272727272727, "eval_PRM F1 AUC": 0.7163436354112102, "eval_PRM F1 AUC (fixed)": 0.8598742797276061, "eval_PRM F1 Neg": 0.5531914893617021, "eval_PRM NPV": 0.5416666666666666, "eval_PRM Precision": 0.8780487804878049, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3521839380264282, "eval_runtime": 17.1927, "eval_samples_per_second": 2.559, "eval_steps_per_second": 0.174, "step": 3065 }, { "epoch": 0.7897736420130728, "grad_norm": 0.17660808710861764, "learning_rate": 1.2871860435458415e-05, "loss": 0.3739, "step": 3066 }, { "epoch": 0.7900312328943555, "grad_norm": 0.15476291567859546, "learning_rate": 1.2841755719736297e-05, "loss": 0.3816, "step": 3067 }, { "epoch": 0.7902888237756384, "grad_norm": 0.12893535183165825, "learning_rate": 1.2811681061851577e-05, "loss": 0.309, "step": 3068 }, { "epoch": 0.7905464146569211, "grad_norm": 0.1950505850576325, "learning_rate": 1.2781636486132032e-05, "loss": 0.4174, "step": 3069 }, { "epoch": 0.790804005538204, "grad_norm": 0.14358917460470716, "learning_rate": 1.2751622016881182e-05, "loss": 0.3717, "step": 3070 }, { "epoch": 0.790804005538204, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8603981141959142, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3463689684867859, "eval_runtime": 16.9011, "eval_samples_per_second": 2.603, "eval_steps_per_second": 0.178, "step": 3070 }, { "epoch": 0.7910615964194867, "grad_norm": 0.16288921010001353, "learning_rate": 1.2721637678378135e-05, "loss": 0.3157, "step": 3071 }, { "epoch": 0.7913191873007696, "grad_norm": 0.15466066163218317, "learning_rate": 1.269168349487766e-05, "loss": 0.3487, "step": 3072 }, { "epoch": 0.7915767781820524, "grad_norm": 0.14573254860745088, "learning_rate": 1.2661759490610147e-05, "loss": 0.4106, "step": 3073 }, { "epoch": 0.7918343690633352, "grad_norm": 0.18796138932114959, "learning_rate": 1.2631865689781519e-05, "loss": 0.3582, "step": 3074 }, { "epoch": 0.792091959944618, "grad_norm": 0.15013663863658994, "learning_rate": 1.2602002116573326e-05, "loss": 0.3096, "step": 3075 }, { "epoch": 0.792091959944618, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8585646935568361, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3478338122367859, "eval_runtime": 16.555, "eval_samples_per_second": 2.658, "eval_steps_per_second": 0.181, "step": 3075 }, { "epoch": 0.7923495508259008, "grad_norm": 0.2142982096339322, "learning_rate": 1.2572168795142625e-05, "loss": 0.4224, "step": 3076 }, { "epoch": 0.7926071417071836, "grad_norm": 0.1433498928638448, "learning_rate": 1.2542365749622049e-05, "loss": 0.3584, "step": 3077 }, { "epoch": 0.7928647325884663, "grad_norm": 0.15172777066050058, "learning_rate": 1.2512593004119665e-05, "loss": 0.3374, "step": 3078 }, { "epoch": 0.7931223234697492, "grad_norm": 0.12597397781523353, "learning_rate": 1.2482850582719113e-05, "loss": 0.2746, "step": 3079 }, { "epoch": 0.793379914351032, "grad_norm": 0.14939011073252528, "learning_rate": 1.245313850947944e-05, "loss": 0.3636, "step": 3080 }, { "epoch": 0.793379914351032, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8585646935568361, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3492986559867859, "eval_runtime": 16.4209, "eval_samples_per_second": 2.68, "eval_steps_per_second": 0.183, "step": 3080 }, { "epoch": 0.7936375052323148, "grad_norm": 0.14238863183396824, "learning_rate": 1.2423456808435169e-05, "loss": 0.3904, "step": 3081 }, { "epoch": 0.7938950961135975, "grad_norm": 0.13719461645791636, "learning_rate": 1.2393805503596278e-05, "loss": 0.357, "step": 3082 }, { "epoch": 0.7941526869948804, "grad_norm": 0.12705428374549121, "learning_rate": 1.236418461894811e-05, "loss": 0.3326, "step": 3083 }, { "epoch": 0.7944102778761631, "grad_norm": 0.21843707794248127, "learning_rate": 1.2334594178451425e-05, "loss": 0.4417, "step": 3084 }, { "epoch": 0.794667868757446, "grad_norm": 0.13831670552438846, "learning_rate": 1.2305034206042377e-05, "loss": 0.3232, "step": 3085 }, { "epoch": 0.794667868757446, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.861969617600838, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.345703125, "eval_runtime": 16.9733, "eval_samples_per_second": 2.592, "eval_steps_per_second": 0.177, "step": 3085 }, { "epoch": 0.7949254596387287, "grad_norm": 0.1904254167981357, "learning_rate": 1.227550472563242e-05, "loss": 0.4004, "step": 3086 }, { "epoch": 0.7951830505200116, "grad_norm": 0.15322394134665404, "learning_rate": 1.2246005761108409e-05, "loss": 0.3587, "step": 3087 }, { "epoch": 0.7954406414012944, "grad_norm": 0.17623590960873045, "learning_rate": 1.2216537336332435e-05, "loss": 0.3887, "step": 3088 }, { "epoch": 0.7956982322825772, "grad_norm": 0.15243977087247143, "learning_rate": 1.2187099475141983e-05, "loss": 0.3331, "step": 3089 }, { "epoch": 0.79595582316386, "grad_norm": 0.1479049088221529, "learning_rate": 1.2157692201349718e-05, "loss": 0.3229, "step": 3090 }, { "epoch": 0.79595582316386, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8603981141959142, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34765625, "eval_runtime": 16.4732, "eval_samples_per_second": 2.671, "eval_steps_per_second": 0.182, "step": 3090 }, { "epoch": 0.7962134140451428, "grad_norm": 0.1718959786852763, "learning_rate": 1.2128315538743646e-05, "loss": 0.4597, "step": 3091 }, { "epoch": 0.7964710049264256, "grad_norm": 0.12891371719175318, "learning_rate": 1.2098969511086926e-05, "loss": 0.2998, "step": 3092 }, { "epoch": 0.7967285958077084, "grad_norm": 0.15974397377931412, "learning_rate": 1.2069654142118013e-05, "loss": 0.3535, "step": 3093 }, { "epoch": 0.7969861866889912, "grad_norm": 0.11747097504418012, "learning_rate": 1.2040369455550532e-05, "loss": 0.2964, "step": 3094 }, { "epoch": 0.797243777570274, "grad_norm": 0.18298648103401638, "learning_rate": 1.2011115475073265e-05, "loss": 0.3676, "step": 3095 }, { "epoch": 0.797243777570274, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8614457831325301, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3492986559867859, "eval_runtime": 17.2897, "eval_samples_per_second": 2.545, "eval_steps_per_second": 0.174, "step": 3095 }, { "epoch": 0.7975013684515568, "grad_norm": 0.1367028762879542, "learning_rate": 1.1981892224350194e-05, "loss": 0.2908, "step": 3096 }, { "epoch": 0.7977589593328396, "grad_norm": 0.12675364225506255, "learning_rate": 1.1952699727020395e-05, "loss": 0.3565, "step": 3097 }, { "epoch": 0.7980165502141224, "grad_norm": 0.1855198861913975, "learning_rate": 1.1923538006698154e-05, "loss": 0.3594, "step": 3098 }, { "epoch": 0.7982741410954052, "grad_norm": 0.13936056534185942, "learning_rate": 1.1894407086972775e-05, "loss": 0.2921, "step": 3099 }, { "epoch": 0.798531731976688, "grad_norm": 0.1448164116050819, "learning_rate": 1.1865306991408659e-05, "loss": 0.3895, "step": 3100 }, { "epoch": 0.798531731976688, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.860660031430068, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3497869372367859, "eval_runtime": 17.364, "eval_samples_per_second": 2.534, "eval_steps_per_second": 0.173, "step": 3100 }, { "epoch": 0.7987893228579708, "grad_norm": 0.20255519007189515, "learning_rate": 1.183623774354531e-05, "loss": 0.4693, "step": 3101 }, { "epoch": 0.7990469137392536, "grad_norm": 0.155068593086326, "learning_rate": 1.180719936689726e-05, "loss": 0.4073, "step": 3102 }, { "epoch": 0.7993045046205365, "grad_norm": 0.18004378834161067, "learning_rate": 1.1778191884954076e-05, "loss": 0.3511, "step": 3103 }, { "epoch": 0.7995620955018192, "grad_norm": 0.15776600521402603, "learning_rate": 1.1749215321180313e-05, "loss": 0.3631, "step": 3104 }, { "epoch": 0.7998196863831021, "grad_norm": 0.12691647050918928, "learning_rate": 1.172026969901553e-05, "loss": 0.3415, "step": 3105 }, { "epoch": 0.7998196863831021, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8580408590885279, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3508966565132141, "eval_runtime": 17.6481, "eval_samples_per_second": 2.493, "eval_steps_per_second": 0.17, "step": 3105 }, { "epoch": 0.8000772772643848, "grad_norm": 0.16244118989262288, "learning_rate": 1.1691355041874275e-05, "loss": 0.3941, "step": 3106 }, { "epoch": 0.8003348681456677, "grad_norm": 0.14491588053618326, "learning_rate": 1.1662471373146e-05, "loss": 0.3353, "step": 3107 }, { "epoch": 0.8005924590269504, "grad_norm": 0.1446244331938275, "learning_rate": 1.1633618716195155e-05, "loss": 0.2622, "step": 3108 }, { "epoch": 0.8008500499082333, "grad_norm": 0.15880758606427098, "learning_rate": 1.160479709436103e-05, "loss": 0.3635, "step": 3109 }, { "epoch": 0.801107640789516, "grad_norm": 0.15047141070557518, "learning_rate": 1.1576006530957867e-05, "loss": 0.3485, "step": 3110 }, { "epoch": 0.801107640789516, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8543740178103719, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3545365631580353, "eval_runtime": 17.2581, "eval_samples_per_second": 2.55, "eval_steps_per_second": 0.174, "step": 3110 }, { "epoch": 0.8013652316707989, "grad_norm": 0.1794244797364346, "learning_rate": 1.1547247049274768e-05, "loss": 0.4048, "step": 3111 }, { "epoch": 0.8016228225520816, "grad_norm": 0.1226769223350654, "learning_rate": 1.1518518672575701e-05, "loss": 0.3596, "step": 3112 }, { "epoch": 0.8018804134333645, "grad_norm": 0.15319819350243052, "learning_rate": 1.148982142409944e-05, "loss": 0.3525, "step": 3113 }, { "epoch": 0.8021380043146472, "grad_norm": 0.15796474914424785, "learning_rate": 1.1461155327059609e-05, "loss": 0.385, "step": 3114 }, { "epoch": 0.8023955951959301, "grad_norm": 0.13525930432507258, "learning_rate": 1.1432520404644641e-05, "loss": 0.3774, "step": 3115 }, { "epoch": 0.8023955951959301, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.85620743844945, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3538707494735718, "eval_runtime": 16.7876, "eval_samples_per_second": 2.621, "eval_steps_per_second": 0.179, "step": 3115 }, { "epoch": 0.8026531860772129, "grad_norm": 0.13699153982417012, "learning_rate": 1.1403916680017713e-05, "loss": 0.3713, "step": 3116 }, { "epoch": 0.8029107769584957, "grad_norm": 0.17228564564699694, "learning_rate": 1.1375344176316816e-05, "loss": 0.4396, "step": 3117 }, { "epoch": 0.8031683678397785, "grad_norm": 0.16730840733033545, "learning_rate": 1.1346802916654609e-05, "loss": 0.4373, "step": 3118 }, { "epoch": 0.8034259587210613, "grad_norm": 0.2062059995826555, "learning_rate": 1.1318292924118584e-05, "loss": 0.5015, "step": 3119 }, { "epoch": 0.8036835496023441, "grad_norm": 0.11172843458227011, "learning_rate": 1.128981422177086e-05, "loss": 0.2863, "step": 3120 }, { "epoch": 0.8036835496023441, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.855683603981142, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35262784361839294, "eval_runtime": 17.33, "eval_samples_per_second": 2.539, "eval_steps_per_second": 0.173, "step": 3120 }, { "epoch": 0.8039411404836269, "grad_norm": 0.15137924988501691, "learning_rate": 1.1261366832648257e-05, "loss": 0.296, "step": 3121 }, { "epoch": 0.8041987313649097, "grad_norm": 0.1755519464843511, "learning_rate": 1.1232950779762286e-05, "loss": 0.3611, "step": 3122 }, { "epoch": 0.8044563222461925, "grad_norm": 0.22491056177565918, "learning_rate": 1.12045660860991e-05, "loss": 0.4576, "step": 3123 }, { "epoch": 0.8047139131274753, "grad_norm": 0.13124327151277423, "learning_rate": 1.1176212774619499e-05, "loss": 0.349, "step": 3124 }, { "epoch": 0.804971504008758, "grad_norm": 0.14885059959293062, "learning_rate": 1.1147890868258854e-05, "loss": 0.3466, "step": 3125 }, { "epoch": 0.804971504008758, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.85751702462022, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3494318127632141, "eval_runtime": 17.6073, "eval_samples_per_second": 2.499, "eval_steps_per_second": 0.17, "step": 3125 }, { "epoch": 0.8052290948900409, "grad_norm": 0.1866581950445014, "learning_rate": 1.1119600389927182e-05, "loss": 0.4162, "step": 3126 }, { "epoch": 0.8054866857713237, "grad_norm": 0.13912614718043878, "learning_rate": 1.1091341362509067e-05, "loss": 0.3716, "step": 3127 }, { "epoch": 0.8057442766526065, "grad_norm": 0.13576898242677826, "learning_rate": 1.1063113808863613e-05, "loss": 0.3328, "step": 3128 }, { "epoch": 0.8060018675338892, "grad_norm": 0.18353598050450984, "learning_rate": 1.1034917751824524e-05, "loss": 0.3874, "step": 3129 }, { "epoch": 0.8062594584151721, "grad_norm": 0.1319409433222276, "learning_rate": 1.1006753214199966e-05, "loss": 0.316, "step": 3130 }, { "epoch": 0.8062594584151721, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.854112100576218, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34938743710517883, "eval_runtime": 16.9028, "eval_samples_per_second": 2.603, "eval_steps_per_second": 0.177, "step": 3130 }, { "epoch": 0.806517049296455, "grad_norm": 0.1417513006446542, "learning_rate": 1.0978620218772655e-05, "loss": 0.3712, "step": 3131 }, { "epoch": 0.8067746401777377, "grad_norm": 0.16732661736257973, "learning_rate": 1.0950518788299775e-05, "loss": 0.418, "step": 3132 }, { "epoch": 0.8070322310590206, "grad_norm": 0.16315483241981468, "learning_rate": 1.092244894551298e-05, "loss": 0.4392, "step": 3133 }, { "epoch": 0.8072898219403033, "grad_norm": 0.18008478786485438, "learning_rate": 1.0894410713118352e-05, "loss": 0.4422, "step": 3134 }, { "epoch": 0.8075474128215862, "grad_norm": 0.1567798123794633, "learning_rate": 1.0866404113796436e-05, "loss": 0.356, "step": 3135 }, { "epoch": 0.8075474128215862, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3501420319080353, "eval_runtime": 17.0214, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 3135 }, { "epoch": 0.8078050037028689, "grad_norm": 0.14115786198396219, "learning_rate": 1.0838429170202174e-05, "loss": 0.3338, "step": 3136 }, { "epoch": 0.8080625945841517, "grad_norm": 0.20433883781901582, "learning_rate": 1.0810485904964885e-05, "loss": 0.3626, "step": 3137 }, { "epoch": 0.8083201854654345, "grad_norm": 0.1337168961416317, "learning_rate": 1.0782574340688294e-05, "loss": 0.3373, "step": 3138 }, { "epoch": 0.8085777763467173, "grad_norm": 0.14215427979065506, "learning_rate": 1.0754694499950446e-05, "loss": 0.3176, "step": 3139 }, { "epoch": 0.8088353672280001, "grad_norm": 0.189867895600534, "learning_rate": 1.0726846405303754e-05, "loss": 0.5076, "step": 3140 }, { "epoch": 0.8088353672280001, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.8509690937663698, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.35165128111839294, "eval_runtime": 16.9871, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 3140 }, { "epoch": 0.809092958109283, "grad_norm": 0.15296995471496322, "learning_rate": 1.0699030079274958e-05, "loss": 0.3799, "step": 3141 }, { "epoch": 0.8093505489905657, "grad_norm": 0.12473336061974759, "learning_rate": 1.0671245544365055e-05, "loss": 0.3659, "step": 3142 }, { "epoch": 0.8096081398718485, "grad_norm": 0.13032999688279998, "learning_rate": 1.0643492823049372e-05, "loss": 0.3503, "step": 3143 }, { "epoch": 0.8098657307531313, "grad_norm": 0.1699417718984136, "learning_rate": 1.0615771937777474e-05, "loss": 0.3477, "step": 3144 }, { "epoch": 0.8101233216344141, "grad_norm": 0.15903429680986436, "learning_rate": 1.0588082910973206e-05, "loss": 0.3957, "step": 3145 }, { "epoch": 0.8101233216344141, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8695652173913043, "eval_PRM F1 AUC": 0.747773703509691, "eval_PRM F1 AUC (fixed)": 0.8517548454688317, "eval_PRM F1 Neg": 0.5882352941176471, "eval_PRM NPV": 0.5357142857142857, "eval_PRM Precision": 0.8974358974358975, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3560901880264282, "eval_runtime": 17.1877, "eval_samples_per_second": 2.56, "eval_steps_per_second": 0.175, "step": 3145 }, { "epoch": 0.810380912515697, "grad_norm": 0.16111186925042234, "learning_rate": 1.0560425765034605e-05, "loss": 0.3888, "step": 3146 }, { "epoch": 0.8106385033969797, "grad_norm": 0.12989359714129808, "learning_rate": 1.0532800522333902e-05, "loss": 0.3106, "step": 3147 }, { "epoch": 0.8108960942782626, "grad_norm": 0.18492630798190468, "learning_rate": 1.0505207205217604e-05, "loss": 0.3337, "step": 3148 }, { "epoch": 0.8111536851595453, "grad_norm": 0.1744833190072309, "learning_rate": 1.047764583600631e-05, "loss": 0.3269, "step": 3149 }, { "epoch": 0.8114112760408282, "grad_norm": 0.20134649912991798, "learning_rate": 1.0450116436994833e-05, "loss": 0.4545, "step": 3150 }, { "epoch": 0.8114112760408282, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8902439024390244, "eval_PRM F1 AUC": 0.7658459926663174, "eval_PRM F1 AUC (fixed)": 0.8517548454688317, "eval_PRM F1 Neg": 0.625, "eval_PRM NPV": 0.6, "eval_PRM Precision": 0.9012345679012346, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3551580309867859, "eval_runtime": 17.4766, "eval_samples_per_second": 2.518, "eval_steps_per_second": 0.172, "step": 3150 }, { "epoch": 0.8116688669221109, "grad_norm": 0.18164489180559934, "learning_rate": 1.0422619030452064e-05, "loss": 0.3894, "step": 3151 }, { "epoch": 0.8119264578033938, "grad_norm": 0.123378010825018, "learning_rate": 1.039515363862107e-05, "loss": 0.2914, "step": 3152 }, { "epoch": 0.8121840486846765, "grad_norm": 0.1366347948787281, "learning_rate": 1.0367720283719012e-05, "loss": 0.3445, "step": 3153 }, { "epoch": 0.8124416395659594, "grad_norm": 0.14385452868585336, "learning_rate": 1.0340318987937097e-05, "loss": 0.3949, "step": 3154 }, { "epoch": 0.8126992304472421, "grad_norm": 0.16585700968051362, "learning_rate": 1.0312949773440644e-05, "loss": 0.4334, "step": 3155 }, { "epoch": 0.8126992304472421, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8559455212152959, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3567560315132141, "eval_runtime": 17.3841, "eval_samples_per_second": 2.531, "eval_steps_per_second": 0.173, "step": 3155 }, { "epoch": 0.812956821328525, "grad_norm": 0.18009855187681467, "learning_rate": 1.0285612662369004e-05, "loss": 0.4135, "step": 3156 }, { "epoch": 0.8132144122098077, "grad_norm": 0.15790813627126485, "learning_rate": 1.0258307676835565e-05, "loss": 0.3662, "step": 3157 }, { "epoch": 0.8134720030910906, "grad_norm": 0.22398527724057288, "learning_rate": 1.0231034838927705e-05, "loss": 0.322, "step": 3158 }, { "epoch": 0.8137295939723734, "grad_norm": 0.1938050086703142, "learning_rate": 1.0203794170706831e-05, "loss": 0.3865, "step": 3159 }, { "epoch": 0.8139871848536562, "grad_norm": 0.12407783754503751, "learning_rate": 1.017658569420829e-05, "loss": 0.4043, "step": 3160 }, { "epoch": 0.8139871848536562, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.858302776322682, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3535600006580353, "eval_runtime": 16.7986, "eval_samples_per_second": 2.619, "eval_steps_per_second": 0.179, "step": 3160 }, { "epoch": 0.814244775734939, "grad_norm": 0.12081072034006296, "learning_rate": 1.014940943144142e-05, "loss": 0.3084, "step": 3161 }, { "epoch": 0.8145023666162218, "grad_norm": 0.1699187339002344, "learning_rate": 1.0122265404389503e-05, "loss": 0.4171, "step": 3162 }, { "epoch": 0.8147599574975046, "grad_norm": 0.18183723950406305, "learning_rate": 1.0095153635009707e-05, "loss": 0.2901, "step": 3163 }, { "epoch": 0.8150175483787874, "grad_norm": 0.1375987261153789, "learning_rate": 1.0068074145233147e-05, "loss": 0.3596, "step": 3164 }, { "epoch": 0.8152751392600702, "grad_norm": 0.14070175448365288, "learning_rate": 1.004102695696481e-05, "loss": 0.3185, "step": 3165 }, { "epoch": 0.8152751392600702, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8603981141959142, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3515625, "eval_runtime": 17.0501, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 3165 }, { "epoch": 0.815532730141353, "grad_norm": 0.1697032383303854, "learning_rate": 1.001401209208357e-05, "loss": 0.3208, "step": 3166 }, { "epoch": 0.8157903210226358, "grad_norm": 0.16952126988382185, "learning_rate": 9.987029572442119e-06, "loss": 0.3584, "step": 3167 }, { "epoch": 0.8160479119039186, "grad_norm": 0.15017925723040138, "learning_rate": 9.960079419866985e-06, "loss": 0.4175, "step": 3168 }, { "epoch": 0.8163055027852014, "grad_norm": 0.13446377710734514, "learning_rate": 9.933161656158579e-06, "loss": 0.3675, "step": 3169 }, { "epoch": 0.8165630936664842, "grad_norm": 0.18132250694224258, "learning_rate": 9.90627630309104e-06, "loss": 0.3244, "step": 3170 }, { "epoch": 0.8165630936664842, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8619696176008381, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3528497815132141, "eval_runtime": 16.8152, "eval_samples_per_second": 2.617, "eval_steps_per_second": 0.178, "step": 3170 }, { "epoch": 0.816820684547767, "grad_norm": 0.16339847616237516, "learning_rate": 9.879423382412328e-06, "loss": 0.2945, "step": 3171 }, { "epoch": 0.8170782754290498, "grad_norm": 0.11419782002990903, "learning_rate": 9.852602915844134e-06, "loss": 0.3089, "step": 3172 }, { "epoch": 0.8173358663103326, "grad_norm": 0.18400897972309438, "learning_rate": 9.82581492508194e-06, "loss": 0.3925, "step": 3173 }, { "epoch": 0.8175934571916155, "grad_norm": 0.1512950990795011, "learning_rate": 9.799059431794939e-06, "loss": 0.396, "step": 3174 }, { "epoch": 0.8178510480728982, "grad_norm": 0.1350873997772639, "learning_rate": 9.772336457626014e-06, "loss": 0.3173, "step": 3175 }, { "epoch": 0.8178510480728982, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 AUC (fixed)": 0.8664222105814562, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3508966565132141, "eval_runtime": 16.6788, "eval_samples_per_second": 2.638, "eval_steps_per_second": 0.18, "step": 3175 }, { "epoch": 0.8181086389541811, "grad_norm": 0.11788164787783686, "learning_rate": 9.745646024191784e-06, "loss": 0.2966, "step": 3176 }, { "epoch": 0.8183662298354638, "grad_norm": 0.1342480180843785, "learning_rate": 9.718988153082486e-06, "loss": 0.3782, "step": 3177 }, { "epoch": 0.8186238207167467, "grad_norm": 0.15336396210084371, "learning_rate": 9.692362865862115e-06, "loss": 0.4346, "step": 3178 }, { "epoch": 0.8188814115980294, "grad_norm": 0.1448123755114553, "learning_rate": 9.665770184068196e-06, "loss": 0.4017, "step": 3179 }, { "epoch": 0.8191390024793123, "grad_norm": 0.1416880556433745, "learning_rate": 9.639210129211967e-06, "loss": 0.3081, "step": 3180 }, { "epoch": 0.8191390024793123, "eval_PRM Accuracy": 0.839622641509434, "eval_PRM F1": 0.8982035928143712, "eval_PRM F1 AUC": 0.7561550550026193, "eval_PRM F1 AUC (fixed)": 0.8672079622839183, "eval_PRM F1 Neg": 0.6222222222222222, "eval_PRM NPV": 0.6363636363636364, "eval_PRM Precision": 0.8928571428571429, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35067471861839294, "eval_runtime": 17.6567, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 3180 }, { "epoch": 0.819396593360595, "grad_norm": 0.11894061964235332, "learning_rate": 9.612682722778204e-06, "loss": 0.2376, "step": 3181 }, { "epoch": 0.8196541842418779, "grad_norm": 0.13721099006899398, "learning_rate": 9.586187986225325e-06, "loss": 0.3583, "step": 3182 }, { "epoch": 0.8199117751231606, "grad_norm": 0.15576541354415627, "learning_rate": 9.559725940985314e-06, "loss": 0.3756, "step": 3183 }, { "epoch": 0.8201693660044435, "grad_norm": 0.19513516510858028, "learning_rate": 9.533296608463676e-06, "loss": 0.459, "step": 3184 }, { "epoch": 0.8204269568857262, "grad_norm": 0.12961128901552244, "learning_rate": 9.506900010039494e-06, "loss": 0.3916, "step": 3185 }, { "epoch": 0.8204269568857262, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8677317967522263, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3502752184867859, "eval_runtime": 17.0853, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 3185 }, { "epoch": 0.820684547767009, "grad_norm": 0.15283869491242777, "learning_rate": 9.48053616706534e-06, "loss": 0.3651, "step": 3186 }, { "epoch": 0.8209421386482918, "grad_norm": 0.1435069464764614, "learning_rate": 9.454205100867337e-06, "loss": 0.305, "step": 3187 }, { "epoch": 0.8211997295295747, "grad_norm": 0.14244665563034178, "learning_rate": 9.427906832745038e-06, "loss": 0.3396, "step": 3188 }, { "epoch": 0.8214573204108575, "grad_norm": 0.16728750954917396, "learning_rate": 9.401641383971477e-06, "loss": 0.4091, "step": 3189 }, { "epoch": 0.8217149112921402, "grad_norm": 0.20192621091368526, "learning_rate": 9.37540877579317e-06, "loss": 0.4489, "step": 3190 }, { "epoch": 0.8217149112921402, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8666841278156102, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35134056210517883, "eval_runtime": 17.0684, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 3190 }, { "epoch": 0.8219725021734231, "grad_norm": 0.12801980425683762, "learning_rate": 9.349209029430051e-06, "loss": 0.2949, "step": 3191 }, { "epoch": 0.8222300930547058, "grad_norm": 0.15978222205359233, "learning_rate": 9.32304216607548e-06, "loss": 0.3576, "step": 3192 }, { "epoch": 0.8224876839359887, "grad_norm": 0.16423040293279703, "learning_rate": 9.296908206896182e-06, "loss": 0.3091, "step": 3193 }, { "epoch": 0.8227452748172714, "grad_norm": 0.1595696241178257, "learning_rate": 9.270807173032314e-06, "loss": 0.4024, "step": 3194 }, { "epoch": 0.8230028656985543, "grad_norm": 0.16355760897009503, "learning_rate": 9.244739085597375e-06, "loss": 0.4338, "step": 3195 }, { "epoch": 0.8230028656985543, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8648507071765322, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3499200940132141, "eval_runtime": 16.8497, "eval_samples_per_second": 2.611, "eval_steps_per_second": 0.178, "step": 3195 }, { "epoch": 0.823260456579837, "grad_norm": 0.16353743835338685, "learning_rate": 9.218703965678204e-06, "loss": 0.3784, "step": 3196 }, { "epoch": 0.8235180474611199, "grad_norm": 0.17053224761398086, "learning_rate": 9.192701834334999e-06, "loss": 0.3804, "step": 3197 }, { "epoch": 0.8237756383424026, "grad_norm": 0.19982818106201172, "learning_rate": 9.166732712601228e-06, "loss": 0.3766, "step": 3198 }, { "epoch": 0.8240332292236855, "grad_norm": 0.14342544965844545, "learning_rate": 9.140796621483726e-06, "loss": 0.3612, "step": 3199 }, { "epoch": 0.8242908201049682, "grad_norm": 0.13243221494393803, "learning_rate": 9.114893581962552e-06, "loss": 0.3591, "step": 3200 }, { "epoch": 0.8242908201049682, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8638030382399161, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3496537506580353, "eval_runtime": 17.5712, "eval_samples_per_second": 2.504, "eval_steps_per_second": 0.171, "step": 3200 }, { "epoch": 0.8245484109862511, "grad_norm": 0.15511590241244955, "learning_rate": 9.089023614991033e-06, "loss": 0.3922, "step": 3201 }, { "epoch": 0.8248060018675339, "grad_norm": 0.19083610530015657, "learning_rate": 9.063186741495771e-06, "loss": 0.3469, "step": 3202 }, { "epoch": 0.8250635927488167, "grad_norm": 0.20708350599480913, "learning_rate": 9.03738298237658e-06, "loss": 0.4167, "step": 3203 }, { "epoch": 0.8253211836300995, "grad_norm": 0.1849384602200154, "learning_rate": 9.011612358506505e-06, "loss": 0.4379, "step": 3204 }, { "epoch": 0.8255787745113823, "grad_norm": 0.17365905387212774, "learning_rate": 8.985874890731748e-06, "loss": 0.3575, "step": 3205 }, { "epoch": 0.8255787745113823, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8614457831325303, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3487659692764282, "eval_runtime": 17.0978, "eval_samples_per_second": 2.573, "eval_steps_per_second": 0.175, "step": 3205 }, { "epoch": 0.8258363653926651, "grad_norm": 0.16868530415993457, "learning_rate": 8.96017059987173e-06, "loss": 0.4032, "step": 3206 }, { "epoch": 0.8260939562739479, "grad_norm": 0.15350447508423878, "learning_rate": 8.934499506719036e-06, "loss": 0.3026, "step": 3207 }, { "epoch": 0.8263515471552307, "grad_norm": 0.16050569369514797, "learning_rate": 8.90886163203935e-06, "loss": 0.3436, "step": 3208 }, { "epoch": 0.8266091380365135, "grad_norm": 0.1632798791957356, "learning_rate": 8.883256996571549e-06, "loss": 0.3671, "step": 3209 }, { "epoch": 0.8268667289177963, "grad_norm": 0.14654263592561342, "learning_rate": 8.857685621027568e-06, "loss": 0.3281, "step": 3210 }, { "epoch": 0.8268667289177963, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8624934520691462, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3517400622367859, "eval_runtime": 17.5781, "eval_samples_per_second": 2.503, "eval_steps_per_second": 0.171, "step": 3210 }, { "epoch": 0.8271243197990791, "grad_norm": 0.15643503809805195, "learning_rate": 8.83214752609246e-06, "loss": 0.3351, "step": 3211 }, { "epoch": 0.8273819106803619, "grad_norm": 0.1499880759789236, "learning_rate": 8.806642732424364e-06, "loss": 0.3811, "step": 3212 }, { "epoch": 0.8276395015616447, "grad_norm": 0.16453623680318505, "learning_rate": 8.781171260654487e-06, "loss": 0.3524, "step": 3213 }, { "epoch": 0.8278970924429275, "grad_norm": 0.1441905295854206, "learning_rate": 8.75573313138704e-06, "loss": 0.3384, "step": 3214 }, { "epoch": 0.8281546833242103, "grad_norm": 0.15291533738227753, "learning_rate": 8.730328365199309e-06, "loss": 0.2876, "step": 3215 }, { "epoch": 0.8281546833242103, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8645887899423781, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.34823331236839294, "eval_runtime": 16.8731, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 3215 }, { "epoch": 0.8284122742054931, "grad_norm": 0.1526283034776341, "learning_rate": 8.704956982641582e-06, "loss": 0.3422, "step": 3216 }, { "epoch": 0.828669865086776, "grad_norm": 0.12824227405763236, "learning_rate": 8.67961900423711e-06, "loss": 0.3258, "step": 3217 }, { "epoch": 0.8289274559680587, "grad_norm": 0.18859708864857164, "learning_rate": 8.654314450482177e-06, "loss": 0.4364, "step": 3218 }, { "epoch": 0.8291850468493416, "grad_norm": 0.14291776125128286, "learning_rate": 8.629043341845954e-06, "loss": 0.362, "step": 3219 }, { "epoch": 0.8294426377306243, "grad_norm": 0.12178353232351061, "learning_rate": 8.603805698770668e-06, "loss": 0.318, "step": 3220 }, { "epoch": 0.8294426377306243, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8661602933473022, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3502752184867859, "eval_runtime": 17.7108, "eval_samples_per_second": 2.484, "eval_steps_per_second": 0.169, "step": 3220 }, { "epoch": 0.8297002286119072, "grad_norm": 0.16525520969839252, "learning_rate": 8.578601541671367e-06, "loss": 0.4316, "step": 3221 }, { "epoch": 0.8299578194931899, "grad_norm": 0.19735557692981234, "learning_rate": 8.553430890936055e-06, "loss": 0.3822, "step": 3222 }, { "epoch": 0.8302154103744728, "grad_norm": 0.16431125779730293, "learning_rate": 8.528293766925643e-06, "loss": 0.397, "step": 3223 }, { "epoch": 0.8304730012557555, "grad_norm": 0.18940313759105748, "learning_rate": 8.503190189973914e-06, "loss": 0.3932, "step": 3224 }, { "epoch": 0.8307305921370384, "grad_norm": 0.1766486587621581, "learning_rate": 8.478120180387522e-06, "loss": 0.4043, "step": 3225 }, { "epoch": 0.8307305921370384, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8638030382399161, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35427024960517883, "eval_runtime": 16.9315, "eval_samples_per_second": 2.599, "eval_steps_per_second": 0.177, "step": 3225 }, { "epoch": 0.8309881830183211, "grad_norm": 0.1321673065049362, "learning_rate": 8.453083758445929e-06, "loss": 0.3093, "step": 3226 }, { "epoch": 0.831245773899604, "grad_norm": 0.16571976210127348, "learning_rate": 8.428080944401479e-06, "loss": 0.3449, "step": 3227 }, { "epoch": 0.8315033647808867, "grad_norm": 0.1764815295934946, "learning_rate": 8.403111758479304e-06, "loss": 0.3571, "step": 3228 }, { "epoch": 0.8317609556621696, "grad_norm": 0.13634101138649224, "learning_rate": 8.378176220877326e-06, "loss": 0.34, "step": 3229 }, { "epoch": 0.8320185465434523, "grad_norm": 0.182161798144851, "learning_rate": 8.353274351766282e-06, "loss": 0.3692, "step": 3230 }, { "epoch": 0.8320185465434523, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8622315348349922, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3614612817764282, "eval_runtime": 17.2507, "eval_samples_per_second": 2.551, "eval_steps_per_second": 0.174, "step": 3230 }, { "epoch": 0.8322761374247352, "grad_norm": 0.15826296959528402, "learning_rate": 8.328406171289621e-06, "loss": 0.3393, "step": 3231 }, { "epoch": 0.832533728306018, "grad_norm": 0.10225333810717532, "learning_rate": 8.30357169956359e-06, "loss": 0.2945, "step": 3232 }, { "epoch": 0.8327913191873008, "grad_norm": 0.22118037196993232, "learning_rate": 8.27877095667714e-06, "loss": 0.3736, "step": 3233 }, { "epoch": 0.8330489100685836, "grad_norm": 0.20154205343586643, "learning_rate": 8.254003962691975e-06, "loss": 0.4589, "step": 3234 }, { "epoch": 0.8333065009498664, "grad_norm": 0.1653200008773221, "learning_rate": 8.229270737642436e-06, "loss": 0.3701, "step": 3235 }, { "epoch": 0.8333065009498664, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.8928571428571429, "eval_PRM F1 AUC": 0.7344159245678366, "eval_PRM F1 AUC (fixed)": 0.85882661079099, "eval_PRM F1 Neg": 0.5909090909090909, "eval_PRM NPV": 0.6190476190476191, "eval_PRM Precision": 0.8823529411764706, "eval_PRM Recall": 0.9036144578313253, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.36434659361839294, "eval_runtime": 16.7554, "eval_samples_per_second": 2.626, "eval_steps_per_second": 0.179, "step": 3235 }, { "epoch": 0.8335640918311492, "grad_norm": 0.13615456699042447, "learning_rate": 8.204571301535596e-06, "loss": 0.3397, "step": 3236 }, { "epoch": 0.833821682712432, "grad_norm": 0.1535461393317119, "learning_rate": 8.179905674351206e-06, "loss": 0.3002, "step": 3237 }, { "epoch": 0.8340792735937148, "grad_norm": 0.15985385062435217, "learning_rate": 8.155273876041614e-06, "loss": 0.3746, "step": 3238 }, { "epoch": 0.8343368644749976, "grad_norm": 0.13271442629555014, "learning_rate": 8.130675926531856e-06, "loss": 0.344, "step": 3239 }, { "epoch": 0.8345944553562804, "grad_norm": 0.17761330348753104, "learning_rate": 8.106111845719538e-06, "loss": 0.3676, "step": 3240 }, { "epoch": 0.8345944553562804, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8577789418543741, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3603071868419647, "eval_runtime": 17.1595, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 3240 }, { "epoch": 0.8348520462375632, "grad_norm": 0.18452813168122292, "learning_rate": 8.081581653474945e-06, "loss": 0.4228, "step": 3241 }, { "epoch": 0.835109637118846, "grad_norm": 0.14432094368232395, "learning_rate": 8.057085369640877e-06, "loss": 0.3782, "step": 3242 }, { "epoch": 0.8353672280001287, "grad_norm": 0.18791697221273532, "learning_rate": 8.032623014032708e-06, "loss": 0.2653, "step": 3243 }, { "epoch": 0.8356248188814116, "grad_norm": 0.13870900446674556, "learning_rate": 8.008194606438418e-06, "loss": 0.4009, "step": 3244 }, { "epoch": 0.8358824097626945, "grad_norm": 0.14865322448540794, "learning_rate": 7.983800166618482e-06, "loss": 0.3506, "step": 3245 }, { "epoch": 0.8358824097626945, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.856731272917758, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36203834414482117, "eval_runtime": 17.6088, "eval_samples_per_second": 2.499, "eval_steps_per_second": 0.17, "step": 3245 }, { "epoch": 0.8361400006439772, "grad_norm": 0.16486101398095257, "learning_rate": 7.959439714305932e-06, "loss": 0.3079, "step": 3246 }, { "epoch": 0.83639759152526, "grad_norm": 0.16106189895239292, "learning_rate": 7.935113269206273e-06, "loss": 0.3249, "step": 3247 }, { "epoch": 0.8366551824065428, "grad_norm": 0.11647225143654803, "learning_rate": 7.910820850997497e-06, "loss": 0.3157, "step": 3248 }, { "epoch": 0.8369127732878257, "grad_norm": 0.11449709896017739, "learning_rate": 7.886562479330129e-06, "loss": 0.3033, "step": 3249 }, { "epoch": 0.8371703641691084, "grad_norm": 0.14521452508837873, "learning_rate": 7.862338173827088e-06, "loss": 0.362, "step": 3250 }, { "epoch": 0.8371703641691084, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.854112100576218, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.36532315611839294, "eval_runtime": 17.5366, "eval_samples_per_second": 2.509, "eval_steps_per_second": 0.171, "step": 3250 }, { "epoch": 0.8374279550503912, "grad_norm": 0.11777655819844253, "learning_rate": 7.83814795408378e-06, "loss": 0.3555, "step": 3251 }, { "epoch": 0.837685545931674, "grad_norm": 0.16135813457174544, "learning_rate": 7.813991839667995e-06, "loss": 0.4196, "step": 3252 }, { "epoch": 0.8379431368129568, "grad_norm": 0.17458238882470384, "learning_rate": 7.789869850119979e-06, "loss": 0.4, "step": 3253 }, { "epoch": 0.8382007276942396, "grad_norm": 0.20087031849085593, "learning_rate": 7.765782004952366e-06, "loss": 0.4697, "step": 3254 }, { "epoch": 0.8384583185755224, "grad_norm": 0.14022266421905447, "learning_rate": 7.741728323650133e-06, "loss": 0.3282, "step": 3255 }, { "epoch": 0.8384583185755224, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8530644316396019, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36514559388160706, "eval_runtime": 17.0843, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 3255 }, { "epoch": 0.8387159094568052, "grad_norm": 0.1213736288828905, "learning_rate": 7.71770882567066e-06, "loss": 0.3319, "step": 3256 }, { "epoch": 0.838973500338088, "grad_norm": 0.14912337959988659, "learning_rate": 7.693723530443675e-06, "loss": 0.3871, "step": 3257 }, { "epoch": 0.8392310912193708, "grad_norm": 0.1708246439180211, "learning_rate": 7.66977245737122e-06, "loss": 0.3978, "step": 3258 }, { "epoch": 0.8394886821006536, "grad_norm": 0.14251054176413233, "learning_rate": 7.645855625827658e-06, "loss": 0.4065, "step": 3259 }, { "epoch": 0.8397462729819365, "grad_norm": 0.24443152784361172, "learning_rate": 7.621973055159664e-06, "loss": 0.4167, "step": 3260 }, { "epoch": 0.8397462729819365, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8504452592980617, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36319246888160706, "eval_runtime": 17.8134, "eval_samples_per_second": 2.47, "eval_steps_per_second": 0.168, "step": 3260 }, { "epoch": 0.8400038638632192, "grad_norm": 0.14465370730815327, "learning_rate": 7.598124764686182e-06, "loss": 0.2937, "step": 3261 }, { "epoch": 0.8402614547445021, "grad_norm": 0.13652679362344977, "learning_rate": 7.574310773698445e-06, "loss": 0.3535, "step": 3262 }, { "epoch": 0.8405190456257848, "grad_norm": 0.18391641136636555, "learning_rate": 7.550531101459935e-06, "loss": 0.3748, "step": 3263 }, { "epoch": 0.8407766365070677, "grad_norm": 0.17848021726234092, "learning_rate": 7.526785767206357e-06, "loss": 0.4244, "step": 3264 }, { "epoch": 0.8410342273883504, "grad_norm": 0.1087760222856034, "learning_rate": 7.503074790145665e-06, "loss": 0.295, "step": 3265 }, { "epoch": 0.8410342273883504, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8475641697223677, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3642578125, "eval_runtime": 17.0969, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 3265 }, { "epoch": 0.8412918182696333, "grad_norm": 0.13442765343603139, "learning_rate": 7.4793981894580034e-06, "loss": 0.2538, "step": 3266 }, { "epoch": 0.841549409150916, "grad_norm": 0.11257869984721419, "learning_rate": 7.455755984295726e-06, "loss": 0.2851, "step": 3267 }, { "epoch": 0.8418070000321989, "grad_norm": 0.16575995821774783, "learning_rate": 7.432148193783345e-06, "loss": 0.4265, "step": 3268 }, { "epoch": 0.8420645909134816, "grad_norm": 0.15836730339554017, "learning_rate": 7.408574837017523e-06, "loss": 0.3479, "step": 3269 }, { "epoch": 0.8423221817947645, "grad_norm": 0.12730145492582412, "learning_rate": 7.385035933067108e-06, "loss": 0.3269, "step": 3270 }, { "epoch": 0.8423221817947645, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8530644316396019, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3617720305919647, "eval_runtime": 16.6159, "eval_samples_per_second": 2.648, "eval_steps_per_second": 0.181, "step": 3270 }, { "epoch": 0.8425797726760472, "grad_norm": 0.154307948275335, "learning_rate": 7.361531500973051e-06, "loss": 0.3578, "step": 3271 }, { "epoch": 0.8428373635573301, "grad_norm": 0.1464846068024724, "learning_rate": 7.3380615597484325e-06, "loss": 0.3528, "step": 3272 }, { "epoch": 0.8430949544386128, "grad_norm": 0.19502147010261306, "learning_rate": 7.3146261283784104e-06, "loss": 0.3955, "step": 3273 }, { "epoch": 0.8433525453198957, "grad_norm": 0.17313455437775152, "learning_rate": 7.291225225820247e-06, "loss": 0.3093, "step": 3274 }, { "epoch": 0.8436101362011785, "grad_norm": 0.17010851711129962, "learning_rate": 7.2678588710032855e-06, "loss": 0.3829, "step": 3275 }, { "epoch": 0.8436101362011785, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8517548454688317, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36155006289482117, "eval_runtime": 16.3725, "eval_samples_per_second": 2.687, "eval_steps_per_second": 0.183, "step": 3275 }, { "epoch": 0.8438677270824613, "grad_norm": 0.13434671331952297, "learning_rate": 7.244527082828878e-06, "loss": 0.3223, "step": 3276 }, { "epoch": 0.8441253179637441, "grad_norm": 0.12185736804251007, "learning_rate": 7.221229880170466e-06, "loss": 0.283, "step": 3277 }, { "epoch": 0.8443829088450269, "grad_norm": 0.18047817562611235, "learning_rate": 7.1979672818734576e-06, "loss": 0.4038, "step": 3278 }, { "epoch": 0.8446404997263097, "grad_norm": 0.1910014824609909, "learning_rate": 7.174739306755351e-06, "loss": 0.4078, "step": 3279 }, { "epoch": 0.8448980906075925, "grad_norm": 0.2109842675352553, "learning_rate": 7.1515459736055505e-06, "loss": 0.3808, "step": 3280 }, { "epoch": 0.8448980906075925, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3617720305919647, "eval_runtime": 16.5654, "eval_samples_per_second": 2.656, "eval_steps_per_second": 0.181, "step": 3280 }, { "epoch": 0.8451556814888753, "grad_norm": 0.12764894546435648, "learning_rate": 7.128387301185502e-06, "loss": 0.2964, "step": 3281 }, { "epoch": 0.8454132723701581, "grad_norm": 0.19950577963784955, "learning_rate": 7.105263308228566e-06, "loss": 0.4902, "step": 3282 }, { "epoch": 0.8456708632514409, "grad_norm": 0.1613182912440341, "learning_rate": 7.0821740134400796e-06, "loss": 0.3154, "step": 3283 }, { "epoch": 0.8459284541327237, "grad_norm": 0.17487314188165096, "learning_rate": 7.0591194354973246e-06, "loss": 0.4246, "step": 3284 }, { "epoch": 0.8461860450140065, "grad_norm": 0.1368775291480775, "learning_rate": 7.03609959304945e-06, "loss": 0.3659, "step": 3285 }, { "epoch": 0.8461860450140065, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8765432098765432, "eval_PRM F1 AUC": 0.7537977998952332, "eval_PRM F1 AUC (fixed)": 0.8512310110005238, "eval_PRM F1 Neg": 0.6, "eval_PRM NPV": 0.5555555555555556, "eval_PRM Precision": 0.8987341772151899, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6521739130434783, "eval_loss": 0.3613725006580353, "eval_runtime": 17.1456, "eval_samples_per_second": 2.566, "eval_steps_per_second": 0.175, "step": 3285 }, { "epoch": 0.8464436358952893, "grad_norm": 0.1636343044673799, "learning_rate": 7.0131145047175435e-06, "loss": 0.3714, "step": 3286 }, { "epoch": 0.8467012267765721, "grad_norm": 0.15558572514611352, "learning_rate": 6.990164189094589e-06, "loss": 0.3428, "step": 3287 }, { "epoch": 0.8469588176578549, "grad_norm": 0.1660442681960852, "learning_rate": 6.967248664745424e-06, "loss": 0.3766, "step": 3288 }, { "epoch": 0.8472164085391377, "grad_norm": 0.17263847391194753, "learning_rate": 6.944367950206737e-06, "loss": 0.3016, "step": 3289 }, { "epoch": 0.8474739994204206, "grad_norm": 0.12512233995548366, "learning_rate": 6.9215220639870575e-06, "loss": 0.3357, "step": 3290 }, { "epoch": 0.8474739994204206, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8517548454688317, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36075106263160706, "eval_runtime": 17.3665, "eval_samples_per_second": 2.534, "eval_steps_per_second": 0.173, "step": 3290 }, { "epoch": 0.8477315903017033, "grad_norm": 0.21828442735148088, "learning_rate": 6.8987110245667615e-06, "loss": 0.4941, "step": 3291 }, { "epoch": 0.8479891811829862, "grad_norm": 0.18453885626531297, "learning_rate": 6.875934850398031e-06, "loss": 0.4406, "step": 3292 }, { "epoch": 0.8482467720642689, "grad_norm": 0.12708050764978154, "learning_rate": 6.853193559904841e-06, "loss": 0.3202, "step": 3293 }, { "epoch": 0.8485043629455518, "grad_norm": 0.16043755909239493, "learning_rate": 6.830487171482935e-06, "loss": 0.3322, "step": 3294 }, { "epoch": 0.8487619538268345, "grad_norm": 0.15936318920355805, "learning_rate": 6.807815703499843e-06, "loss": 0.3442, "step": 3295 }, { "epoch": 0.8487619538268345, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8535882661079098, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3590642809867859, "eval_runtime": 16.7797, "eval_samples_per_second": 2.622, "eval_steps_per_second": 0.179, "step": 3295 }, { "epoch": 0.8490195447081174, "grad_norm": 0.16752323668914681, "learning_rate": 6.785179174294848e-06, "loss": 0.367, "step": 3296 }, { "epoch": 0.8492771355894001, "grad_norm": 0.20505683078590164, "learning_rate": 6.7625776021789545e-06, "loss": 0.4508, "step": 3297 }, { "epoch": 0.849534726470683, "grad_norm": 0.1941535089733828, "learning_rate": 6.74001100543491e-06, "loss": 0.3635, "step": 3298 }, { "epoch": 0.8497923173519657, "grad_norm": 0.13905729799556743, "learning_rate": 6.7174794023171224e-06, "loss": 0.3793, "step": 3299 }, { "epoch": 0.8500499082332486, "grad_norm": 0.1661573276025384, "learning_rate": 6.694982811051787e-06, "loss": 0.3833, "step": 3300 }, { "epoch": 0.8500499082332486, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.8520167627029858, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3591974377632141, "eval_runtime": 17.102, "eval_samples_per_second": 2.573, "eval_steps_per_second": 0.175, "step": 3300 }, { "epoch": 0.8503074991145313, "grad_norm": 0.1760250055773036, "learning_rate": 6.6725212498366885e-06, "loss": 0.3992, "step": 3301 }, { "epoch": 0.8505650899958141, "grad_norm": 0.18080349918718142, "learning_rate": 6.650094736841295e-06, "loss": 0.3345, "step": 3302 }, { "epoch": 0.850822680877097, "grad_norm": 0.18155874185490795, "learning_rate": 6.627703290206744e-06, "loss": 0.3731, "step": 3303 }, { "epoch": 0.8510802717583797, "grad_norm": 0.1295413423897453, "learning_rate": 6.605346928045808e-06, "loss": 0.3376, "step": 3304 }, { "epoch": 0.8513378626396626, "grad_norm": 0.13659799233135908, "learning_rate": 6.583025668442866e-06, "loss": 0.3345, "step": 3305 }, { "epoch": 0.8513378626396626, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8525405971712938, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36110618710517883, "eval_runtime": 17.0672, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 3305 }, { "epoch": 0.8515954535209453, "grad_norm": 0.14687265647840395, "learning_rate": 6.5607395294538964e-06, "loss": 0.3674, "step": 3306 }, { "epoch": 0.8518530444022282, "grad_norm": 0.1503375419496451, "learning_rate": 6.538488529106484e-06, "loss": 0.3468, "step": 3307 }, { "epoch": 0.8521106352835109, "grad_norm": 0.15846714400800355, "learning_rate": 6.516272685399793e-06, "loss": 0.3385, "step": 3308 }, { "epoch": 0.8523682261647938, "grad_norm": 0.2117545159996122, "learning_rate": 6.494092016304509e-06, "loss": 0.3813, "step": 3309 }, { "epoch": 0.8526258170460765, "grad_norm": 0.14344827190828335, "learning_rate": 6.4719465397629295e-06, "loss": 0.3872, "step": 3310 }, { "epoch": 0.8526258170460765, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8533263488737559, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36483487486839294, "eval_runtime": 16.9844, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 3310 }, { "epoch": 0.8528834079273594, "grad_norm": 0.19680766123057453, "learning_rate": 6.449836273688819e-06, "loss": 0.42, "step": 3311 }, { "epoch": 0.8531409988086421, "grad_norm": 0.21142968305749577, "learning_rate": 6.427761235967494e-06, "loss": 0.4344, "step": 3312 }, { "epoch": 0.853398589689925, "grad_norm": 0.15138172633877256, "learning_rate": 6.4057214444557865e-06, "loss": 0.4184, "step": 3313 }, { "epoch": 0.8536561805712077, "grad_norm": 0.1708192168332884, "learning_rate": 6.383716916981991e-06, "loss": 0.4119, "step": 3314 }, { "epoch": 0.8539137714524906, "grad_norm": 0.2195713542806808, "learning_rate": 6.36174767134588e-06, "loss": 0.3772, "step": 3315 }, { "epoch": 0.8539137714524906, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8533263488737559, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36692115664482117, "eval_runtime": 16.6136, "eval_samples_per_second": 2.648, "eval_steps_per_second": 0.181, "step": 3315 }, { "epoch": 0.8541713623337733, "grad_norm": 0.15086481837173732, "learning_rate": 6.339813725318694e-06, "loss": 0.3882, "step": 3316 }, { "epoch": 0.8544289532150562, "grad_norm": 0.1136570044644587, "learning_rate": 6.317915096643134e-06, "loss": 0.3, "step": 3317 }, { "epoch": 0.854686544096339, "grad_norm": 0.1923963498289537, "learning_rate": 6.296051803033287e-06, "loss": 0.4465, "step": 3318 }, { "epoch": 0.8549441349776218, "grad_norm": 0.1268709334384851, "learning_rate": 6.274223862174711e-06, "loss": 0.3177, "step": 3319 }, { "epoch": 0.8552017258589046, "grad_norm": 0.18206154913414113, "learning_rate": 6.2524312917243035e-06, "loss": 0.3773, "step": 3320 }, { "epoch": 0.8552017258589046, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8525405971712938, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36354759335517883, "eval_runtime": 16.8651, "eval_samples_per_second": 2.609, "eval_steps_per_second": 0.178, "step": 3320 }, { "epoch": 0.8554593167401874, "grad_norm": 0.11457661146940189, "learning_rate": 6.230674109310436e-06, "loss": 0.3387, "step": 3321 }, { "epoch": 0.8557169076214702, "grad_norm": 0.18358205228905566, "learning_rate": 6.208952332532786e-06, "loss": 0.4121, "step": 3322 }, { "epoch": 0.855974498502753, "grad_norm": 0.13825029339289172, "learning_rate": 6.187265978962392e-06, "loss": 0.373, "step": 3323 }, { "epoch": 0.8562320893840358, "grad_norm": 0.130969477292691, "learning_rate": 6.165615066141672e-06, "loss": 0.3471, "step": 3324 }, { "epoch": 0.8564896802653186, "grad_norm": 0.1294016210224661, "learning_rate": 6.143999611584362e-06, "loss": 0.3356, "step": 3325 }, { "epoch": 0.8564896802653186, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8504452592980618, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3652787506580353, "eval_runtime": 16.668, "eval_samples_per_second": 2.64, "eval_steps_per_second": 0.18, "step": 3325 }, { "epoch": 0.8567472711466014, "grad_norm": 0.12903558552884586, "learning_rate": 6.122419632775522e-06, "loss": 0.2608, "step": 3326 }, { "epoch": 0.8570048620278842, "grad_norm": 0.15959826961815204, "learning_rate": 6.100875147171486e-06, "loss": 0.3561, "step": 3327 }, { "epoch": 0.857262452909167, "grad_norm": 0.15259635244399197, "learning_rate": 6.079366172199908e-06, "loss": 0.365, "step": 3328 }, { "epoch": 0.8575200437904498, "grad_norm": 0.16994770356248887, "learning_rate": 6.057892725259717e-06, "loss": 0.2973, "step": 3329 }, { "epoch": 0.8577776346717326, "grad_norm": 0.1770224832366625, "learning_rate": 6.036454823721077e-06, "loss": 0.4061, "step": 3330 }, { "epoch": 0.8577776346717326, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8507071765322158, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3646129369735718, "eval_runtime": 16.4136, "eval_samples_per_second": 2.681, "eval_steps_per_second": 0.183, "step": 3330 }, { "epoch": 0.8580352255530154, "grad_norm": 0.15527961194438825, "learning_rate": 6.015052484925426e-06, "loss": 0.3721, "step": 3331 }, { "epoch": 0.8582928164342982, "grad_norm": 0.1894960741559075, "learning_rate": 5.993685726185405e-06, "loss": 0.4269, "step": 3332 }, { "epoch": 0.8585504073155811, "grad_norm": 0.1370667769893655, "learning_rate": 5.9723545647849045e-06, "loss": 0.3501, "step": 3333 }, { "epoch": 0.8588079981968638, "grad_norm": 0.21381596000328998, "learning_rate": 5.95105901797901e-06, "loss": 0.3849, "step": 3334 }, { "epoch": 0.8590655890781467, "grad_norm": 0.15588653014505088, "learning_rate": 5.929799102994005e-06, "loss": 0.3801, "step": 3335 }, { "epoch": 0.8590655890781467, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8525405971712939, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36403587460517883, "eval_runtime": 17.1788, "eval_samples_per_second": 2.561, "eval_steps_per_second": 0.175, "step": 3335 }, { "epoch": 0.8593231799594294, "grad_norm": 0.16862801856159054, "learning_rate": 5.908574837027309e-06, "loss": 0.3259, "step": 3336 }, { "epoch": 0.8595807708407123, "grad_norm": 0.14323363894646496, "learning_rate": 5.887386237247561e-06, "loss": 0.3896, "step": 3337 }, { "epoch": 0.859838361721995, "grad_norm": 0.12647774046313853, "learning_rate": 5.866233320794523e-06, "loss": 0.3055, "step": 3338 }, { "epoch": 0.8600959526032779, "grad_norm": 0.15752019743485443, "learning_rate": 5.845116104779075e-06, "loss": 0.3706, "step": 3339 }, { "epoch": 0.8603535434845606, "grad_norm": 0.13276557814829096, "learning_rate": 5.824034606283257e-06, "loss": 0.3012, "step": 3340 }, { "epoch": 0.8603535434845606, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.85620743844945, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36075106263160706, "eval_runtime": 16.9913, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 3340 }, { "epoch": 0.8606111343658435, "grad_norm": 0.20031095746321162, "learning_rate": 5.802988842360169e-06, "loss": 0.4597, "step": 3341 }, { "epoch": 0.8608687252471262, "grad_norm": 0.18214206155327745, "learning_rate": 5.781978830034063e-06, "loss": 0.468, "step": 3342 }, { "epoch": 0.8611263161284091, "grad_norm": 0.19257260101587756, "learning_rate": 5.761004586300234e-06, "loss": 0.4028, "step": 3343 }, { "epoch": 0.8613839070096918, "grad_norm": 0.15262747014013386, "learning_rate": 5.7400661281250215e-06, "loss": 0.3294, "step": 3344 }, { "epoch": 0.8616414978909747, "grad_norm": 0.19821515561157396, "learning_rate": 5.719163472445871e-06, "loss": 0.4017, "step": 3345 }, { "epoch": 0.8616414978909747, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8528025144054479, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36288174986839294, "eval_runtime": 17.2583, "eval_samples_per_second": 2.55, "eval_steps_per_second": 0.174, "step": 3345 }, { "epoch": 0.8618990887722575, "grad_norm": 0.14363485663612383, "learning_rate": 5.69829663617123e-06, "loss": 0.3379, "step": 3346 }, { "epoch": 0.8621566796535403, "grad_norm": 0.14217371462692246, "learning_rate": 5.677465636180596e-06, "loss": 0.3817, "step": 3347 }, { "epoch": 0.8624142705348231, "grad_norm": 0.14510477504005892, "learning_rate": 5.6566704893244445e-06, "loss": 0.3707, "step": 3348 }, { "epoch": 0.8626718614161059, "grad_norm": 0.1509310181880006, "learning_rate": 5.635911212424288e-06, "loss": 0.3105, "step": 3349 }, { "epoch": 0.8629294522973887, "grad_norm": 0.13576952621602237, "learning_rate": 5.615187822272583e-06, "loss": 0.3119, "step": 3350 }, { "epoch": 0.8629294522973887, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8572551073860659, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3600408434867859, "eval_runtime": 17.6362, "eval_samples_per_second": 2.495, "eval_steps_per_second": 0.17, "step": 3350 }, { "epoch": 0.8631870431786715, "grad_norm": 0.15214488739105575, "learning_rate": 5.594500335632785e-06, "loss": 0.3625, "step": 3351 }, { "epoch": 0.8634446340599543, "grad_norm": 0.12911877360725382, "learning_rate": 5.573848769239315e-06, "loss": 0.2916, "step": 3352 }, { "epoch": 0.863702224941237, "grad_norm": 0.28115534773851986, "learning_rate": 5.553233139797492e-06, "loss": 0.4511, "step": 3353 }, { "epoch": 0.8639598158225199, "grad_norm": 0.21741938901247673, "learning_rate": 5.532653463983617e-06, "loss": 0.4501, "step": 3354 }, { "epoch": 0.8642174067038026, "grad_norm": 0.14810263300735152, "learning_rate": 5.512109758444878e-06, "loss": 0.3377, "step": 3355 }, { "epoch": 0.8642174067038026, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8569931901519119, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3582652807235718, "eval_runtime": 16.9966, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 3355 }, { "epoch": 0.8644749975850855, "grad_norm": 0.15368587173991025, "learning_rate": 5.491602039799387e-06, "loss": 0.3551, "step": 3356 }, { "epoch": 0.8647325884663682, "grad_norm": 0.14526521831534006, "learning_rate": 5.4711303246361144e-06, "loss": 0.3122, "step": 3357 }, { "epoch": 0.8649901793476511, "grad_norm": 0.15246842368527974, "learning_rate": 5.450694629514913e-06, "loss": 0.3086, "step": 3358 }, { "epoch": 0.8652477702289338, "grad_norm": 0.16684370550958466, "learning_rate": 5.430294970966548e-06, "loss": 0.334, "step": 3359 }, { "epoch": 0.8655053611102167, "grad_norm": 0.13473379169677913, "learning_rate": 5.4099313654925656e-06, "loss": 0.2576, "step": 3360 }, { "epoch": 0.8655053611102167, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8569931901519119, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35862037539482117, "eval_runtime": 17.0855, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 3360 }, { "epoch": 0.8657629519914996, "grad_norm": 0.2534286544526206, "learning_rate": 5.389603829565393e-06, "loss": 0.4032, "step": 3361 }, { "epoch": 0.8660205428727823, "grad_norm": 0.124800943952739, "learning_rate": 5.369312379628255e-06, "loss": 0.3084, "step": 3362 }, { "epoch": 0.8662781337540651, "grad_norm": 0.11806770207957193, "learning_rate": 5.349057032095201e-06, "loss": 0.3192, "step": 3363 }, { "epoch": 0.8665357246353479, "grad_norm": 0.14609640205709506, "learning_rate": 5.328837803351083e-06, "loss": 0.2998, "step": 3364 }, { "epoch": 0.8667933155166307, "grad_norm": 0.17178728686196976, "learning_rate": 5.308654709751509e-06, "loss": 0.4625, "step": 3365 }, { "epoch": 0.8667933155166307, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8588266107909899, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3573774993419647, "eval_runtime": 17.6209, "eval_samples_per_second": 2.497, "eval_steps_per_second": 0.17, "step": 3365 }, { "epoch": 0.8670509063979135, "grad_norm": 0.14303261165364936, "learning_rate": 5.28850776762288e-06, "loss": 0.3448, "step": 3366 }, { "epoch": 0.8673084972791963, "grad_norm": 0.1247801467444584, "learning_rate": 5.268396993262353e-06, "loss": 0.3291, "step": 3367 }, { "epoch": 0.8675660881604791, "grad_norm": 0.14401997994572127, "learning_rate": 5.248322402937822e-06, "loss": 0.3542, "step": 3368 }, { "epoch": 0.8678236790417619, "grad_norm": 0.13438772649092728, "learning_rate": 5.228284012887907e-06, "loss": 0.3474, "step": 3369 }, { "epoch": 0.8680812699230447, "grad_norm": 0.1610405186158669, "learning_rate": 5.208281839321938e-06, "loss": 0.322, "step": 3370 }, { "epoch": 0.8680812699230447, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.861969617600838, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35653409361839294, "eval_runtime": 16.7888, "eval_samples_per_second": 2.621, "eval_steps_per_second": 0.179, "step": 3370 }, { "epoch": 0.8683388608043275, "grad_norm": 0.1589462698216017, "learning_rate": 5.188315898419971e-06, "loss": 0.3976, "step": 3371 }, { "epoch": 0.8685964516856103, "grad_norm": 0.2177911108681432, "learning_rate": 5.168386206332743e-06, "loss": 0.3543, "step": 3372 }, { "epoch": 0.8688540425668931, "grad_norm": 0.1727454096552039, "learning_rate": 5.148492779181674e-06, "loss": 0.4333, "step": 3373 }, { "epoch": 0.8691116334481759, "grad_norm": 0.15244128959146452, "learning_rate": 5.128635633058832e-06, "loss": 0.3475, "step": 3374 }, { "epoch": 0.8693692243294587, "grad_norm": 0.13862098098499673, "learning_rate": 5.10881478402695e-06, "loss": 0.3737, "step": 3375 }, { "epoch": 0.8693692243294587, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.862231534834992, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3571111559867859, "eval_runtime": 16.4753, "eval_samples_per_second": 2.671, "eval_steps_per_second": 0.182, "step": 3375 }, { "epoch": 0.8696268152107416, "grad_norm": 0.1701778142956791, "learning_rate": 5.089030248119408e-06, "loss": 0.4065, "step": 3376 }, { "epoch": 0.8698844060920243, "grad_norm": 0.17122321541566513, "learning_rate": 5.069282041340184e-06, "loss": 0.3961, "step": 3377 }, { "epoch": 0.8701419969733072, "grad_norm": 0.11360908711771076, "learning_rate": 5.04957017966391e-06, "loss": 0.2967, "step": 3378 }, { "epoch": 0.8703995878545899, "grad_norm": 0.1311991350392604, "learning_rate": 5.029894679035751e-06, "loss": 0.3074, "step": 3379 }, { "epoch": 0.8706571787358728, "grad_norm": 0.22086535680047703, "learning_rate": 5.010255555371551e-06, "loss": 0.3401, "step": 3380 }, { "epoch": 0.8706571787358728, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.860398114195914, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35498046875, "eval_runtime": 17.6551, "eval_samples_per_second": 2.492, "eval_steps_per_second": 0.17, "step": 3380 }, { "epoch": 0.8709147696171555, "grad_norm": 0.15012816852715252, "learning_rate": 4.990652824557651e-06, "loss": 0.3268, "step": 3381 }, { "epoch": 0.8711723604984384, "grad_norm": 0.15962416902318038, "learning_rate": 4.971086502450994e-06, "loss": 0.301, "step": 3382 }, { "epoch": 0.8714299513797211, "grad_norm": 0.18475450513934072, "learning_rate": 4.951556604879048e-06, "loss": 0.415, "step": 3383 }, { "epoch": 0.871687542261004, "grad_norm": 0.17130923311515397, "learning_rate": 4.932063147639826e-06, "loss": 0.3397, "step": 3384 }, { "epoch": 0.8719451331422867, "grad_norm": 0.19388737311848528, "learning_rate": 4.912606146501886e-06, "loss": 0.3528, "step": 3385 }, { "epoch": 0.8719451331422867, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.861183865898376, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35440340638160706, "eval_runtime": 17.4788, "eval_samples_per_second": 2.517, "eval_steps_per_second": 0.172, "step": 3385 }, { "epoch": 0.8722027240235696, "grad_norm": 0.14967404909595375, "learning_rate": 4.893185617204254e-06, "loss": 0.3369, "step": 3386 }, { "epoch": 0.8724603149048523, "grad_norm": 0.15771294984684486, "learning_rate": 4.873801575456482e-06, "loss": 0.3118, "step": 3387 }, { "epoch": 0.8727179057861352, "grad_norm": 0.20326520682578922, "learning_rate": 4.854454036938599e-06, "loss": 0.3624, "step": 3388 }, { "epoch": 0.872975496667418, "grad_norm": 0.13985547042581095, "learning_rate": 4.8351430173011195e-06, "loss": 0.332, "step": 3389 }, { "epoch": 0.8732330875487008, "grad_norm": 0.17482670597503344, "learning_rate": 4.815868532164991e-06, "loss": 0.3853, "step": 3390 }, { "epoch": 0.8732330875487008, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.861969617600838, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35475853085517883, "eval_runtime": 17.6039, "eval_samples_per_second": 2.499, "eval_steps_per_second": 0.17, "step": 3390 }, { "epoch": 0.8734906784299836, "grad_norm": 0.16706783944158435, "learning_rate": 4.796630597121615e-06, "loss": 0.3604, "step": 3391 }, { "epoch": 0.8737482693112664, "grad_norm": 0.13224174771504582, "learning_rate": 4.777429227732844e-06, "loss": 0.3099, "step": 3392 }, { "epoch": 0.8740058601925492, "grad_norm": 0.14123847384307184, "learning_rate": 4.758264439530935e-06, "loss": 0.3448, "step": 3393 }, { "epoch": 0.874263451073832, "grad_norm": 0.17080611571119608, "learning_rate": 4.739136248018577e-06, "loss": 0.3671, "step": 3394 }, { "epoch": 0.8745210419551148, "grad_norm": 0.1569547259625691, "learning_rate": 4.720044668668816e-06, "loss": 0.3358, "step": 3395 }, { "epoch": 0.8745210419551148, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8624934520691461, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3535600006580353, "eval_runtime": 17.0822, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 3395 }, { "epoch": 0.8747786328363976, "grad_norm": 0.15143190167386192, "learning_rate": 4.700989716925119e-06, "loss": 0.3957, "step": 3396 }, { "epoch": 0.8750362237176804, "grad_norm": 0.14311024718924314, "learning_rate": 4.681971408201313e-06, "loss": 0.3417, "step": 3397 }, { "epoch": 0.8752938145989632, "grad_norm": 0.1560350787452046, "learning_rate": 4.662989757881564e-06, "loss": 0.3314, "step": 3398 }, { "epoch": 0.875551405480246, "grad_norm": 0.18093472466459418, "learning_rate": 4.644044781320422e-06, "loss": 0.4352, "step": 3399 }, { "epoch": 0.8758089963615288, "grad_norm": 0.14235138369509262, "learning_rate": 4.625136493842724e-06, "loss": 0.3221, "step": 3400 }, { "epoch": 0.8758089963615288, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3559126555919647, "eval_runtime": 17.0664, "eval_samples_per_second": 2.578, "eval_steps_per_second": 0.176, "step": 3400 }, { "epoch": 0.8760665872428116, "grad_norm": 0.13346440586550953, "learning_rate": 4.606264910743691e-06, "loss": 0.2702, "step": 3401 }, { "epoch": 0.8763241781240944, "grad_norm": 0.1975675372901936, "learning_rate": 4.587430047288782e-06, "loss": 0.4439, "step": 3402 }, { "epoch": 0.8765817690053772, "grad_norm": 0.1750451273215324, "learning_rate": 4.568631918713822e-06, "loss": 0.3114, "step": 3403 }, { "epoch": 0.8768393598866601, "grad_norm": 0.15929251480990408, "learning_rate": 4.549870540224854e-06, "loss": 0.3256, "step": 3404 }, { "epoch": 0.8770969507679428, "grad_norm": 0.17053054730843406, "learning_rate": 4.531145926998248e-06, "loss": 0.3518, "step": 3405 }, { "epoch": 0.8770969507679428, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8606600314300681, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.359375, "eval_runtime": 17.1251, "eval_samples_per_second": 2.569, "eval_steps_per_second": 0.175, "step": 3405 }, { "epoch": 0.8773545416492257, "grad_norm": 0.1611383821537342, "learning_rate": 4.5124580941806165e-06, "loss": 0.3161, "step": 3406 }, { "epoch": 0.8776121325305084, "grad_norm": 0.1352857471888482, "learning_rate": 4.493807056888794e-06, "loss": 0.3104, "step": 3407 }, { "epoch": 0.8778697234117913, "grad_norm": 0.147846217965294, "learning_rate": 4.475192830209884e-06, "loss": 0.3727, "step": 3408 }, { "epoch": 0.878127314293074, "grad_norm": 0.2020811988957192, "learning_rate": 4.4566154292012e-06, "loss": 0.3767, "step": 3409 }, { "epoch": 0.8783849051743569, "grad_norm": 0.17699277683789505, "learning_rate": 4.438074868890285e-06, "loss": 0.4479, "step": 3410 }, { "epoch": 0.8783849051743569, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.856993190151912, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35768821835517883, "eval_runtime": 17.6059, "eval_samples_per_second": 2.499, "eval_steps_per_second": 0.17, "step": 3410 }, { "epoch": 0.8786424960556396, "grad_norm": 0.11529879894149396, "learning_rate": 4.4195711642748495e-06, "loss": 0.3358, "step": 3411 }, { "epoch": 0.8789000869369225, "grad_norm": 0.12418877708731489, "learning_rate": 4.401104330322797e-06, "loss": 0.3315, "step": 3412 }, { "epoch": 0.8791576778182052, "grad_norm": 0.2147454411249376, "learning_rate": 4.382674381972224e-06, "loss": 0.405, "step": 3413 }, { "epoch": 0.879415268699488, "grad_norm": 0.19830582636445251, "learning_rate": 4.364281334131376e-06, "loss": 0.404, "step": 3414 }, { "epoch": 0.8796728595807708, "grad_norm": 0.23224511172765894, "learning_rate": 4.3459252016786746e-06, "loss": 0.3277, "step": 3415 }, { "epoch": 0.8796728595807708, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.858302776322682, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3563121557235718, "eval_runtime": 16.8182, "eval_samples_per_second": 2.616, "eval_steps_per_second": 0.178, "step": 3415 }, { "epoch": 0.8799304504620536, "grad_norm": 0.2553873535803226, "learning_rate": 4.327605999462631e-06, "loss": 0.46, "step": 3416 }, { "epoch": 0.8801880413433364, "grad_norm": 0.15823541642932565, "learning_rate": 4.3093237423019185e-06, "loss": 0.3001, "step": 3417 }, { "epoch": 0.8804456322246192, "grad_norm": 0.12995475327006994, "learning_rate": 4.291078444985336e-06, "loss": 0.335, "step": 3418 }, { "epoch": 0.8807032231059021, "grad_norm": 0.11434637296968787, "learning_rate": 4.272870122271738e-06, "loss": 0.2605, "step": 3419 }, { "epoch": 0.8809608139871848, "grad_norm": 0.21628393439448532, "learning_rate": 4.254698788890127e-06, "loss": 0.3854, "step": 3420 }, { "epoch": 0.8809608139871848, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8585646935568362, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3566228747367859, "eval_runtime": 17.0729, "eval_samples_per_second": 2.577, "eval_steps_per_second": 0.176, "step": 3420 }, { "epoch": 0.8812184048684677, "grad_norm": 0.15118312512675022, "learning_rate": 4.236564459539516e-06, "loss": 0.3596, "step": 3421 }, { "epoch": 0.8814759957497504, "grad_norm": 0.15231327306852804, "learning_rate": 4.218467148889071e-06, "loss": 0.3229, "step": 3422 }, { "epoch": 0.8817335866310333, "grad_norm": 0.13684028357673278, "learning_rate": 4.200406871577945e-06, "loss": 0.3541, "step": 3423 }, { "epoch": 0.881991177512316, "grad_norm": 0.1640679125574751, "learning_rate": 4.182383642215343e-06, "loss": 0.3757, "step": 3424 }, { "epoch": 0.8822487683935989, "grad_norm": 0.16237750566583656, "learning_rate": 4.164397475380527e-06, "loss": 0.2981, "step": 3425 }, { "epoch": 0.8822487683935989, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.859088528025144, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3569779694080353, "eval_runtime": 16.9431, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 3425 }, { "epoch": 0.8825063592748816, "grad_norm": 0.1864322170812912, "learning_rate": 4.146448385622764e-06, "loss": 0.3593, "step": 3426 }, { "epoch": 0.8827639501561645, "grad_norm": 0.20572086068999337, "learning_rate": 4.12853638746134e-06, "loss": 0.4415, "step": 3427 }, { "epoch": 0.8830215410374472, "grad_norm": 0.15490396690465924, "learning_rate": 4.110661495385515e-06, "loss": 0.341, "step": 3428 }, { "epoch": 0.8832791319187301, "grad_norm": 0.16366345159076146, "learning_rate": 4.092823723854549e-06, "loss": 0.3829, "step": 3429 }, { "epoch": 0.8835367228000128, "grad_norm": 0.17399125297625062, "learning_rate": 4.075023087297669e-06, "loss": 0.3804, "step": 3430 }, { "epoch": 0.8835367228000128, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.859350445259298, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35617896914482117, "eval_runtime": 17.6808, "eval_samples_per_second": 2.489, "eval_steps_per_second": 0.17, "step": 3430 }, { "epoch": 0.8837943136812957, "grad_norm": 0.12752266712989935, "learning_rate": 4.057259600114072e-06, "loss": 0.2918, "step": 3431 }, { "epoch": 0.8840519045625785, "grad_norm": 0.16144533462809998, "learning_rate": 4.0395332766728966e-06, "loss": 0.3624, "step": 3432 }, { "epoch": 0.8843094954438613, "grad_norm": 0.16273780246855526, "learning_rate": 4.021844131313213e-06, "loss": 0.42, "step": 3433 }, { "epoch": 0.8845670863251441, "grad_norm": 0.1748600648022127, "learning_rate": 4.004192178344029e-06, "loss": 0.3057, "step": 3434 }, { "epoch": 0.8848246772064269, "grad_norm": 0.15656929075101317, "learning_rate": 3.986577432044264e-06, "loss": 0.3731, "step": 3435 }, { "epoch": 0.8848246772064269, "eval_PRM Accuracy": 0.7924528301886793, "eval_PRM F1": 0.8641975308641975, "eval_PRM F1 AUC": 0.7260345730749084, "eval_PRM F1 AUC (fixed)": 0.857778941854374, "eval_PRM F1 Neg": 0.56, "eval_PRM NPV": 0.5185185185185185, "eval_PRM Precision": 0.8860759493670886, "eval_PRM Recall": 0.8433734939759037, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35458096861839294, "eval_runtime": 16.9808, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 3435 }, { "epoch": 0.8850822680877097, "grad_norm": 0.12971193796981845, "learning_rate": 3.9689999066627515e-06, "loss": 0.3249, "step": 3436 }, { "epoch": 0.8853398589689925, "grad_norm": 0.16427301397008595, "learning_rate": 3.951459616418185e-06, "loss": 0.355, "step": 3437 }, { "epoch": 0.8855974498502753, "grad_norm": 0.1596405591427294, "learning_rate": 3.933956575499148e-06, "loss": 0.3244, "step": 3438 }, { "epoch": 0.8858550407315581, "grad_norm": 0.15304527722091246, "learning_rate": 3.916490798064138e-06, "loss": 0.4003, "step": 3439 }, { "epoch": 0.8861126316128409, "grad_norm": 0.22476937531451593, "learning_rate": 3.899062298241446e-06, "loss": 0.3936, "step": 3440 }, { "epoch": 0.8861126316128409, "eval_PRM Accuracy": 0.8018867924528302, "eval_PRM F1": 0.8711656441717791, "eval_PRM F1 AUC": 0.7320586694604505, "eval_PRM F1 AUC (fixed)": 0.8603981141959142, "eval_PRM F1 Neg": 0.5714285714285714, "eval_PRM NPV": 0.5384615384615384, "eval_PRM Precision": 0.8875, "eval_PRM Recall": 0.8554216867469879, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.353515625, "eval_runtime": 16.9526, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 3440 }, { "epoch": 0.8863702224941237, "grad_norm": 0.148355216002109, "learning_rate": 3.881671090129247e-06, "loss": 0.3343, "step": 3441 }, { "epoch": 0.8866278133754065, "grad_norm": 0.14224996259348446, "learning_rate": 3.864317187795524e-06, "loss": 0.3285, "step": 3442 }, { "epoch": 0.8868854042566893, "grad_norm": 0.14074178088930625, "learning_rate": 3.8470006052781116e-06, "loss": 0.3442, "step": 3443 }, { "epoch": 0.8871429951379721, "grad_norm": 0.16503210928207523, "learning_rate": 3.829721356584648e-06, "loss": 0.3492, "step": 3444 }, { "epoch": 0.8874005860192549, "grad_norm": 0.14872269256660958, "learning_rate": 3.812479455692547e-06, "loss": 0.3721, "step": 3445 }, { "epoch": 0.8874005860192549, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8588266107909901, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35475853085517883, "eval_runtime": 17.4303, "eval_samples_per_second": 2.524, "eval_steps_per_second": 0.172, "step": 3445 }, { "epoch": 0.8876581769005377, "grad_norm": 0.14582776492257432, "learning_rate": 3.795274916549041e-06, "loss": 0.3285, "step": 3446 }, { "epoch": 0.8879157677818206, "grad_norm": 0.15816937023341562, "learning_rate": 3.778107753071125e-06, "loss": 0.3563, "step": 3447 }, { "epoch": 0.8881733586631033, "grad_norm": 0.177014321731312, "learning_rate": 3.7609779791455744e-06, "loss": 0.318, "step": 3448 }, { "epoch": 0.8884309495443862, "grad_norm": 0.14123143850184638, "learning_rate": 3.7438856086288887e-06, "loss": 0.3102, "step": 3449 }, { "epoch": 0.8886885404256689, "grad_norm": 0.16816875465267456, "learning_rate": 3.7268306553473576e-06, "loss": 0.3691, "step": 3450 }, { "epoch": 0.8886885404256689, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.855683603981142, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3568004369735718, "eval_runtime": 17.0467, "eval_samples_per_second": 2.581, "eval_steps_per_second": 0.176, "step": 3450 }, { "epoch": 0.8889461313069518, "grad_norm": 0.14543496644321224, "learning_rate": 3.7098131330969566e-06, "loss": 0.2974, "step": 3451 }, { "epoch": 0.8892037221882345, "grad_norm": 0.16429448547261924, "learning_rate": 3.6928330556434077e-06, "loss": 0.3384, "step": 3452 }, { "epoch": 0.8894613130695174, "grad_norm": 0.16826460889671457, "learning_rate": 3.6758904367221513e-06, "loss": 0.3382, "step": 3453 }, { "epoch": 0.8897189039508001, "grad_norm": 0.1424716855787507, "learning_rate": 3.6589852900383027e-06, "loss": 0.3371, "step": 3454 }, { "epoch": 0.889976494832083, "grad_norm": 0.1733300069265746, "learning_rate": 3.6421176292666783e-06, "loss": 0.3477, "step": 3455 }, { "epoch": 0.889976494832083, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8569931901519119, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.357421875, "eval_runtime": 17.414, "eval_samples_per_second": 2.527, "eval_steps_per_second": 0.172, "step": 3455 }, { "epoch": 0.8902340857133657, "grad_norm": 0.16055435570628257, "learning_rate": 3.6252874680517746e-06, "loss": 0.3409, "step": 3456 }, { "epoch": 0.8904916765946486, "grad_norm": 0.1570864388583678, "learning_rate": 3.6084948200077572e-06, "loss": 0.3383, "step": 3457 }, { "epoch": 0.8907492674759313, "grad_norm": 0.1635186083602298, "learning_rate": 3.591739698718438e-06, "loss": 0.2504, "step": 3458 }, { "epoch": 0.8910068583572142, "grad_norm": 0.20775532996486326, "learning_rate": 3.5750221177372534e-06, "loss": 0.4202, "step": 3459 }, { "epoch": 0.8912644492384969, "grad_norm": 0.17793677032869037, "learning_rate": 3.55834209058733e-06, "loss": 0.3801, "step": 3460 }, { "epoch": 0.8912644492384969, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8606600314300682, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3575994372367859, "eval_runtime": 17.5629, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 3460 }, { "epoch": 0.8915220401197798, "grad_norm": 0.1397258122558241, "learning_rate": 3.5416996307613526e-06, "loss": 0.3576, "step": 3461 }, { "epoch": 0.8917796310010626, "grad_norm": 0.20021537298917827, "learning_rate": 3.5250947517216637e-06, "loss": 0.3965, "step": 3462 }, { "epoch": 0.8920372218823454, "grad_norm": 0.22406579737993645, "learning_rate": 3.50852746690018e-06, "loss": 0.3836, "step": 3463 }, { "epoch": 0.8922948127636282, "grad_norm": 0.14986958549520638, "learning_rate": 3.4919977896984148e-06, "loss": 0.3672, "step": 3464 }, { "epoch": 0.892552403644911, "grad_norm": 0.21698985785700728, "learning_rate": 3.475505733487472e-06, "loss": 0.3904, "step": 3465 }, { "epoch": 0.892552403644911, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8611838658983761, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35671165585517883, "eval_runtime": 16.8196, "eval_samples_per_second": 2.616, "eval_steps_per_second": 0.178, "step": 3465 }, { "epoch": 0.8928099945261938, "grad_norm": 0.14012226831709146, "learning_rate": 3.459051311607997e-06, "loss": 0.352, "step": 3466 }, { "epoch": 0.8930675854074765, "grad_norm": 0.22745469809592667, "learning_rate": 3.442634537370215e-06, "loss": 0.4986, "step": 3467 }, { "epoch": 0.8933251762887594, "grad_norm": 0.15466469424424434, "learning_rate": 3.4262554240538868e-06, "loss": 0.3209, "step": 3468 }, { "epoch": 0.8935827671700421, "grad_norm": 0.22413277766802422, "learning_rate": 3.4099139849083307e-06, "loss": 0.3511, "step": 3469 }, { "epoch": 0.893840358051325, "grad_norm": 0.11860341768835032, "learning_rate": 3.393610233152361e-06, "loss": 0.3119, "step": 3470 }, { "epoch": 0.893840358051325, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3568004369735718, "eval_runtime": 16.9544, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 3470 }, { "epoch": 0.8940979489326077, "grad_norm": 0.18083563004046216, "learning_rate": 3.3773441819743012e-06, "loss": 0.4113, "step": 3471 }, { "epoch": 0.8943555398138906, "grad_norm": 0.17149585089736719, "learning_rate": 3.3611158445320034e-06, "loss": 0.4202, "step": 3472 }, { "epoch": 0.8946131306951733, "grad_norm": 0.15558562107300855, "learning_rate": 3.344925233952806e-06, "loss": 0.3844, "step": 3473 }, { "epoch": 0.8948707215764562, "grad_norm": 0.15558509410071295, "learning_rate": 3.328772363333538e-06, "loss": 0.3836, "step": 3474 }, { "epoch": 0.895128312457739, "grad_norm": 0.18470263944036533, "learning_rate": 3.312657245740464e-06, "loss": 0.3792, "step": 3475 }, { "epoch": 0.895128312457739, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.85751702462022, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3567560315132141, "eval_runtime": 16.8792, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 3475 }, { "epoch": 0.8953859033390218, "grad_norm": 0.16846477488597117, "learning_rate": 3.296579894209345e-06, "loss": 0.3197, "step": 3476 }, { "epoch": 0.8956434942203046, "grad_norm": 0.1585259226334253, "learning_rate": 3.2805403217453956e-06, "loss": 0.3038, "step": 3477 }, { "epoch": 0.8959010851015874, "grad_norm": 0.11633746115143191, "learning_rate": 3.264538541323231e-06, "loss": 0.2563, "step": 3478 }, { "epoch": 0.8961586759828702, "grad_norm": 0.20213178518449737, "learning_rate": 3.2485745658869414e-06, "loss": 0.3316, "step": 3479 }, { "epoch": 0.896416266864153, "grad_norm": 0.1692052806896801, "learning_rate": 3.232648408349992e-06, "loss": 0.2897, "step": 3480 }, { "epoch": 0.896416266864153, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8606600314300681, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3560901880264282, "eval_runtime": 17.1761, "eval_samples_per_second": 2.562, "eval_steps_per_second": 0.175, "step": 3480 }, { "epoch": 0.8966738577454358, "grad_norm": 0.16321989055051614, "learning_rate": 3.21676008159531e-06, "loss": 0.4587, "step": 3481 }, { "epoch": 0.8969314486267186, "grad_norm": 0.15727505747572695, "learning_rate": 3.2009095984751715e-06, "loss": 0.4493, "step": 3482 }, { "epoch": 0.8971890395080014, "grad_norm": 0.1902381515248783, "learning_rate": 3.1850969718112745e-06, "loss": 0.3316, "step": 3483 }, { "epoch": 0.8974466303892842, "grad_norm": 0.1865002570972608, "learning_rate": 3.16932221439466e-06, "loss": 0.3816, "step": 3484 }, { "epoch": 0.897704221270567, "grad_norm": 0.15290733777855925, "learning_rate": 3.1535853389857707e-06, "loss": 0.3825, "step": 3485 }, { "epoch": 0.897704221270567, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.859350445259298, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35622337460517883, "eval_runtime": 16.9246, "eval_samples_per_second": 2.6, "eval_steps_per_second": 0.177, "step": 3485 }, { "epoch": 0.8979618121518498, "grad_norm": 0.1657061092856528, "learning_rate": 3.13788635831439e-06, "loss": 0.3478, "step": 3486 }, { "epoch": 0.8982194030331326, "grad_norm": 0.18369734845777763, "learning_rate": 3.1222252850796385e-06, "loss": 0.4137, "step": 3487 }, { "epoch": 0.8984769939144154, "grad_norm": 0.14985312653936153, "learning_rate": 3.1066021319499926e-06, "loss": 0.3131, "step": 3488 }, { "epoch": 0.8987345847956982, "grad_norm": 0.17263610489554684, "learning_rate": 3.0910169115632436e-06, "loss": 0.4082, "step": 3489 }, { "epoch": 0.8989921756769811, "grad_norm": 0.1415773035160174, "learning_rate": 3.0754696365265068e-06, "loss": 0.3778, "step": 3490 }, { "epoch": 0.8989921756769811, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.858302776322682, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35817649960517883, "eval_runtime": 17.5761, "eval_samples_per_second": 2.503, "eval_steps_per_second": 0.171, "step": 3490 }, { "epoch": 0.8992497665582638, "grad_norm": 0.14434952030692258, "learning_rate": 3.059960319416183e-06, "loss": 0.2922, "step": 3491 }, { "epoch": 0.8995073574395467, "grad_norm": 0.14561083035655872, "learning_rate": 3.0444889727779867e-06, "loss": 0.3422, "step": 3492 }, { "epoch": 0.8997649483208294, "grad_norm": 0.19276937119481916, "learning_rate": 3.029055609126913e-06, "loss": 0.3636, "step": 3493 }, { "epoch": 0.9000225392021123, "grad_norm": 0.28487890616005773, "learning_rate": 3.013660240947225e-06, "loss": 0.4912, "step": 3494 }, { "epoch": 0.900280130083395, "grad_norm": 0.16543237738836344, "learning_rate": 2.9983028806924774e-06, "loss": 0.3085, "step": 3495 }, { "epoch": 0.900280130083395, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.85751702462022, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36123934388160706, "eval_runtime": 17.3938, "eval_samples_per_second": 2.53, "eval_steps_per_second": 0.172, "step": 3495 }, { "epoch": 0.9005377209646779, "grad_norm": 0.16314043803783165, "learning_rate": 2.9829835407854334e-06, "loss": 0.3364, "step": 3496 }, { "epoch": 0.9007953118459606, "grad_norm": 0.14180941033485578, "learning_rate": 2.9677022336181413e-06, "loss": 0.3278, "step": 3497 }, { "epoch": 0.9010529027272435, "grad_norm": 0.17070372574640386, "learning_rate": 2.95245897155188e-06, "loss": 0.3852, "step": 3498 }, { "epoch": 0.9013104936085262, "grad_norm": 0.15309622719352337, "learning_rate": 2.9372537669171194e-06, "loss": 0.3758, "step": 3499 }, { "epoch": 0.9015680844898091, "grad_norm": 0.14792960371737923, "learning_rate": 2.922086632013582e-06, "loss": 0.3816, "step": 3500 }, { "epoch": 0.9015680844898091, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.859088528025144, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3594193756580353, "eval_runtime": 17.0052, "eval_samples_per_second": 2.587, "eval_steps_per_second": 0.176, "step": 3500 }, { "epoch": 0.9018256753710918, "grad_norm": 0.14090469611175638, "learning_rate": 2.90695757911017e-06, "loss": 0.3593, "step": 3501 }, { "epoch": 0.9020832662523747, "grad_norm": 0.14977731555923768, "learning_rate": 2.8918666204450106e-06, "loss": 0.3779, "step": 3502 }, { "epoch": 0.9023408571336574, "grad_norm": 0.14409493620439406, "learning_rate": 2.8768137682253837e-06, "loss": 0.3847, "step": 3503 }, { "epoch": 0.9025984480149403, "grad_norm": 0.17852245830856514, "learning_rate": 2.8617990346277657e-06, "loss": 0.3825, "step": 3504 }, { "epoch": 0.9028560388962231, "grad_norm": 0.2081650506236442, "learning_rate": 2.8468224317977743e-06, "loss": 0.4107, "step": 3505 }, { "epoch": 0.9028560388962231, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.858040859088528, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3613725006580353, "eval_runtime": 17.0225, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 3505 }, { "epoch": 0.9031136297775059, "grad_norm": 0.1304410803037061, "learning_rate": 2.831883971850213e-06, "loss": 0.3199, "step": 3506 }, { "epoch": 0.9033712206587887, "grad_norm": 0.3183315368975275, "learning_rate": 2.8169836668690165e-06, "loss": 0.517, "step": 3507 }, { "epoch": 0.9036288115400715, "grad_norm": 0.14265599880347749, "learning_rate": 2.802121528907242e-06, "loss": 0.3872, "step": 3508 }, { "epoch": 0.9038864024213543, "grad_norm": 0.15673814385728924, "learning_rate": 2.787297569987107e-06, "loss": 0.3693, "step": 3509 }, { "epoch": 0.9041439933026371, "grad_norm": 0.17147029433004354, "learning_rate": 2.7725118020998973e-06, "loss": 0.4265, "step": 3510 }, { "epoch": 0.9041439933026371, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8580408590885279, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3582652807235718, "eval_runtime": 17.1274, "eval_samples_per_second": 2.569, "eval_steps_per_second": 0.175, "step": 3510 }, { "epoch": 0.9044015841839199, "grad_norm": 0.1294599974767688, "learning_rate": 2.7577642372060673e-06, "loss": 0.3366, "step": 3511 }, { "epoch": 0.9046591750652027, "grad_norm": 0.10739872504317904, "learning_rate": 2.7430548872351135e-06, "loss": 0.2895, "step": 3512 }, { "epoch": 0.9049167659464855, "grad_norm": 0.1337098599209687, "learning_rate": 2.7283837640856346e-06, "loss": 0.3331, "step": 3513 }, { "epoch": 0.9051743568277683, "grad_norm": 0.15326670322972885, "learning_rate": 2.7137508796253208e-06, "loss": 0.3547, "step": 3514 }, { "epoch": 0.9054319477090511, "grad_norm": 0.17439375071989902, "learning_rate": 2.6991562456909205e-06, "loss": 0.4062, "step": 3515 }, { "epoch": 0.9054319477090511, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8543740178103719, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3610174059867859, "eval_runtime": 17.031, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 3515 }, { "epoch": 0.9056895385903339, "grad_norm": 0.14757466196871588, "learning_rate": 2.684599874088256e-06, "loss": 0.4083, "step": 3516 }, { "epoch": 0.9059471294716167, "grad_norm": 0.13038628864544433, "learning_rate": 2.670081776592165e-06, "loss": 0.3017, "step": 3517 }, { "epoch": 0.9062047203528996, "grad_norm": 0.1362571289704275, "learning_rate": 2.6556019649465525e-06, "loss": 0.2883, "step": 3518 }, { "epoch": 0.9064623112341823, "grad_norm": 0.19400127869035802, "learning_rate": 2.641160450864355e-06, "loss": 0.455, "step": 3519 }, { "epoch": 0.9067199021154652, "grad_norm": 0.1487023689144612, "learning_rate": 2.626757246027506e-06, "loss": 0.3572, "step": 3520 }, { "epoch": 0.9067199021154652, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8559455212152959, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36106178164482117, "eval_runtime": 17.6175, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 3520 }, { "epoch": 0.9069774929967479, "grad_norm": 0.1758953345140761, "learning_rate": 2.6123923620869795e-06, "loss": 0.4051, "step": 3521 }, { "epoch": 0.9072350838780308, "grad_norm": 0.1603008294335897, "learning_rate": 2.59806581066272e-06, "loss": 0.3914, "step": 3522 }, { "epoch": 0.9074926747593135, "grad_norm": 0.14475537508184771, "learning_rate": 2.5837776033436954e-06, "loss": 0.3153, "step": 3523 }, { "epoch": 0.9077502656405964, "grad_norm": 0.1312022526870313, "learning_rate": 2.5695277516878336e-06, "loss": 0.2982, "step": 3524 }, { "epoch": 0.9080078565218791, "grad_norm": 0.21749204403301972, "learning_rate": 2.5553162672220465e-06, "loss": 0.3939, "step": 3525 }, { "epoch": 0.9080078565218791, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8533263488737559, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3616832494735718, "eval_runtime": 16.4985, "eval_samples_per_second": 2.667, "eval_steps_per_second": 0.182, "step": 3525 }, { "epoch": 0.908265447403162, "grad_norm": 0.15509138928369606, "learning_rate": 2.5411431614422053e-06, "loss": 0.3359, "step": 3526 }, { "epoch": 0.9085230382844447, "grad_norm": 0.12699302222708414, "learning_rate": 2.5270084458131395e-06, "loss": 0.2976, "step": 3527 }, { "epoch": 0.9087806291657275, "grad_norm": 0.1781909885669849, "learning_rate": 2.5129121317686356e-06, "loss": 0.3845, "step": 3528 }, { "epoch": 0.9090382200470103, "grad_norm": 0.15216059727780382, "learning_rate": 2.4988542307113837e-06, "loss": 0.3444, "step": 3529 }, { "epoch": 0.9092958109282931, "grad_norm": 0.16200325190532375, "learning_rate": 2.4848347540130434e-06, "loss": 0.2597, "step": 3530 }, { "epoch": 0.9092958109282931, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8530644316396019, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.36110618710517883, "eval_runtime": 16.989, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 3530 }, { "epoch": 0.9095534018095759, "grad_norm": 0.15168951575416167, "learning_rate": 2.4708537130141485e-06, "loss": 0.3409, "step": 3531 }, { "epoch": 0.9098109926908587, "grad_norm": 0.15496414073672882, "learning_rate": 2.45691111902418e-06, "loss": 0.3449, "step": 3532 }, { "epoch": 0.9100685835721416, "grad_norm": 0.3104512486482539, "learning_rate": 2.4430069833214996e-06, "loss": 0.4948, "step": 3533 }, { "epoch": 0.9103261744534243, "grad_norm": 0.20727427059037964, "learning_rate": 2.429141317153355e-06, "loss": 0.455, "step": 3534 }, { "epoch": 0.9105837653347072, "grad_norm": 0.1696170445047076, "learning_rate": 2.415314131735885e-06, "loss": 0.368, "step": 3535 }, { "epoch": 0.9105837653347072, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8567312729177579, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3587535619735718, "eval_runtime": 16.9861, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 3535 }, { "epoch": 0.9108413562159899, "grad_norm": 0.16578645048029902, "learning_rate": 2.4015254382541043e-06, "loss": 0.3967, "step": 3536 }, { "epoch": 0.9110989470972728, "grad_norm": 0.14286368348379852, "learning_rate": 2.38777524786189e-06, "loss": 0.2688, "step": 3537 }, { "epoch": 0.9113565379785555, "grad_norm": 0.12512391214687887, "learning_rate": 2.374063571681956e-06, "loss": 0.3187, "step": 3538 }, { "epoch": 0.9116141288598384, "grad_norm": 0.17653831694965627, "learning_rate": 2.360390420805869e-06, "loss": 0.391, "step": 3539 }, { "epoch": 0.9118717197411211, "grad_norm": 0.14848179498309094, "learning_rate": 2.34675580629406e-06, "loss": 0.4207, "step": 3540 }, { "epoch": 0.9118717197411211, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8517548454688318, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35910865664482117, "eval_runtime": 17.5619, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 3540 }, { "epoch": 0.912129310622404, "grad_norm": 0.17358589157100177, "learning_rate": 2.3331597391757442e-06, "loss": 0.2874, "step": 3541 }, { "epoch": 0.9123869015036867, "grad_norm": 0.17014683888786977, "learning_rate": 2.3196022304489864e-06, "loss": 0.3243, "step": 3542 }, { "epoch": 0.9126444923849696, "grad_norm": 0.219578585265958, "learning_rate": 2.306083291080641e-06, "loss": 0.4471, "step": 3543 }, { "epoch": 0.9129020832662523, "grad_norm": 0.13052088921236898, "learning_rate": 2.292602932006377e-06, "loss": 0.3245, "step": 3544 }, { "epoch": 0.9131596741475352, "grad_norm": 0.1485674479766076, "learning_rate": 2.2791611641306555e-06, "loss": 0.305, "step": 3545 }, { "epoch": 0.9131596741475352, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8533263488737558, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3580433130264282, "eval_runtime": 17.4401, "eval_samples_per_second": 2.523, "eval_steps_per_second": 0.172, "step": 3545 }, { "epoch": 0.9134172650288179, "grad_norm": 0.28276776229349954, "learning_rate": 2.2657579983267064e-06, "loss": 0.4108, "step": 3546 }, { "epoch": 0.9136748559101008, "grad_norm": 0.15989949777721657, "learning_rate": 2.252393445436546e-06, "loss": 0.429, "step": 3547 }, { "epoch": 0.9139324467913836, "grad_norm": 0.16830071915691178, "learning_rate": 2.239067516270954e-06, "loss": 0.3874, "step": 3548 }, { "epoch": 0.9141900376726664, "grad_norm": 0.14365545128953014, "learning_rate": 2.2257802216094746e-06, "loss": 0.3974, "step": 3549 }, { "epoch": 0.9144476285539492, "grad_norm": 0.10287303681402393, "learning_rate": 2.212531572200377e-06, "loss": 0.298, "step": 3550 }, { "epoch": 0.9144476285539492, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8509690937663698, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3582652807235718, "eval_runtime": 16.8653, "eval_samples_per_second": 2.609, "eval_steps_per_second": 0.178, "step": 3550 }, { "epoch": 0.914705219435232, "grad_norm": 0.1414417999527504, "learning_rate": 2.1993215787606936e-06, "loss": 0.3516, "step": 3551 }, { "epoch": 0.9149628103165148, "grad_norm": 0.2086615373938124, "learning_rate": 2.186150251976171e-06, "loss": 0.4494, "step": 3552 }, { "epoch": 0.9152204011977976, "grad_norm": 0.15183181236880697, "learning_rate": 2.1730176025012816e-06, "loss": 0.3249, "step": 3553 }, { "epoch": 0.9154779920790804, "grad_norm": 0.17879774948444485, "learning_rate": 2.1599236409592327e-06, "loss": 0.3687, "step": 3554 }, { "epoch": 0.9157355829603632, "grad_norm": 0.22149387381725968, "learning_rate": 2.1468683779418965e-06, "loss": 0.4342, "step": 3555 }, { "epoch": 0.9157355829603632, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8499214248297537, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3606622815132141, "eval_runtime": 17.747, "eval_samples_per_second": 2.479, "eval_steps_per_second": 0.169, "step": 3555 }, { "epoch": 0.915993173841646, "grad_norm": 0.15702597463200188, "learning_rate": 2.1338518240098694e-06, "loss": 0.4099, "step": 3556 }, { "epoch": 0.9162507647229288, "grad_norm": 0.15451074192970757, "learning_rate": 2.1208739896924345e-06, "loss": 0.3728, "step": 3557 }, { "epoch": 0.9165083556042116, "grad_norm": 0.15794402817072664, "learning_rate": 2.1079348854875505e-06, "loss": 0.3392, "step": 3558 }, { "epoch": 0.9167659464854944, "grad_norm": 0.19678681465612674, "learning_rate": 2.0950345218618328e-06, "loss": 0.3692, "step": 3559 }, { "epoch": 0.9170235373667772, "grad_norm": 0.1361028667540031, "learning_rate": 2.082172909250568e-06, "loss": 0.3296, "step": 3560 }, { "epoch": 0.9170235373667772, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.858040859088528, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35537996888160706, "eval_runtime": 16.9677, "eval_samples_per_second": 2.593, "eval_steps_per_second": 0.177, "step": 3560 }, { "epoch": 0.9172811282480601, "grad_norm": 0.12828516715375252, "learning_rate": 2.069350058057723e-06, "loss": 0.284, "step": 3561 }, { "epoch": 0.9175387191293428, "grad_norm": 0.15589654522386157, "learning_rate": 2.056565978655861e-06, "loss": 0.2953, "step": 3562 }, { "epoch": 0.9177963100106257, "grad_norm": 0.1922738703624335, "learning_rate": 2.043820681386227e-06, "loss": 0.3538, "step": 3563 }, { "epoch": 0.9180539008919084, "grad_norm": 0.20272910116447893, "learning_rate": 2.0311141765586573e-06, "loss": 0.4282, "step": 3564 }, { "epoch": 0.9183114917731913, "grad_norm": 0.16346346255570265, "learning_rate": 2.0184464744516353e-06, "loss": 0.3704, "step": 3565 }, { "epoch": 0.9183114917731913, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8528025144054479, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35910865664482117, "eval_runtime": 17.618, "eval_samples_per_second": 2.497, "eval_steps_per_second": 0.17, "step": 3565 }, { "epoch": 0.918569082654474, "grad_norm": 0.1457485536576306, "learning_rate": 2.005817585312253e-06, "loss": 0.334, "step": 3566 }, { "epoch": 0.9188266735357569, "grad_norm": 0.15443730771182385, "learning_rate": 1.993227519356189e-06, "loss": 0.3371, "step": 3567 }, { "epoch": 0.9190842644170396, "grad_norm": 0.1680000043483095, "learning_rate": 1.9806762867677296e-06, "loss": 0.4377, "step": 3568 }, { "epoch": 0.9193418552983225, "grad_norm": 0.14717374054767854, "learning_rate": 1.9681638976997486e-06, "loss": 0.3451, "step": 3569 }, { "epoch": 0.9195994461796052, "grad_norm": 0.1242823379036716, "learning_rate": 1.95569036227371e-06, "loss": 0.3423, "step": 3570 }, { "epoch": 0.9195994461796052, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.85620743844945, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3561345934867859, "eval_runtime": 17.0785, "eval_samples_per_second": 2.576, "eval_steps_per_second": 0.176, "step": 3570 }, { "epoch": 0.9198570370608881, "grad_norm": 0.1169699351085616, "learning_rate": 1.943255690579615e-06, "loss": 0.2595, "step": 3571 }, { "epoch": 0.9201146279421708, "grad_norm": 0.11198757782737513, "learning_rate": 1.9308598926760625e-06, "loss": 0.3334, "step": 3572 }, { "epoch": 0.9203722188234537, "grad_norm": 0.14045385474378944, "learning_rate": 1.9185029785901867e-06, "loss": 0.3475, "step": 3573 }, { "epoch": 0.9206298097047364, "grad_norm": 0.1654475938787749, "learning_rate": 1.906184958317664e-06, "loss": 0.3333, "step": 3574 }, { "epoch": 0.9208874005860193, "grad_norm": 0.16327096309656713, "learning_rate": 1.8939058418227406e-06, "loss": 0.4313, "step": 3575 }, { "epoch": 0.9208874005860193, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35595703125, "eval_runtime": 17.2808, "eval_samples_per_second": 2.546, "eval_steps_per_second": 0.174, "step": 3575 }, { "epoch": 0.9211449914673021, "grad_norm": 0.17906720956662106, "learning_rate": 1.8816656390381437e-06, "loss": 0.3375, "step": 3576 }, { "epoch": 0.9214025823485849, "grad_norm": 0.17656544233826593, "learning_rate": 1.8694643598651695e-06, "loss": 0.3924, "step": 3577 }, { "epoch": 0.9216601732298677, "grad_norm": 0.13320038375003498, "learning_rate": 1.8573020141736008e-06, "loss": 0.3321, "step": 3578 }, { "epoch": 0.9219177641111505, "grad_norm": 0.15680397389075254, "learning_rate": 1.8451786118017234e-06, "loss": 0.3439, "step": 3579 }, { "epoch": 0.9221753549924333, "grad_norm": 0.1473731597244704, "learning_rate": 1.8330941625563535e-06, "loss": 0.4521, "step": 3580 }, { "epoch": 0.9221753549924333, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8575170246202201, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35458096861839294, "eval_runtime": 16.9061, "eval_samples_per_second": 2.603, "eval_steps_per_second": 0.177, "step": 3580 }, { "epoch": 0.922432945873716, "grad_norm": 0.13627264372745382, "learning_rate": 1.8210486762127499e-06, "loss": 0.3084, "step": 3581 }, { "epoch": 0.9226905367549989, "grad_norm": 0.16310370490610962, "learning_rate": 1.8090421625147013e-06, "loss": 0.3037, "step": 3582 }, { "epoch": 0.9229481276362816, "grad_norm": 0.14387730487937045, "learning_rate": 1.7970746311744336e-06, "loss": 0.4041, "step": 3583 }, { "epoch": 0.9232057185175645, "grad_norm": 0.14068108820423889, "learning_rate": 1.7851460918726748e-06, "loss": 0.3223, "step": 3584 }, { "epoch": 0.9234633093988472, "grad_norm": 0.1302142737116632, "learning_rate": 1.7732565542585678e-06, "loss": 0.315, "step": 3585 }, { "epoch": 0.9234633093988472, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.856993190151912, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35946378111839294, "eval_runtime": 17.6897, "eval_samples_per_second": 2.487, "eval_steps_per_second": 0.17, "step": 3585 }, { "epoch": 0.9237209002801301, "grad_norm": 0.1446479054321807, "learning_rate": 1.7614060279497413e-06, "loss": 0.3067, "step": 3586 }, { "epoch": 0.9239784911614128, "grad_norm": 0.13510928230906516, "learning_rate": 1.7495945225322607e-06, "loss": 0.2805, "step": 3587 }, { "epoch": 0.9242360820426957, "grad_norm": 0.15398682236678907, "learning_rate": 1.737822047560611e-06, "loss": 0.3182, "step": 3588 }, { "epoch": 0.9244936729239784, "grad_norm": 0.1598075897613883, "learning_rate": 1.7260886125577247e-06, "loss": 0.4169, "step": 3589 }, { "epoch": 0.9247512638052613, "grad_norm": 0.15869750034866761, "learning_rate": 1.7143942270149427e-06, "loss": 0.3449, "step": 3590 }, { "epoch": 0.9247512638052613, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8585646935568361, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35830965638160706, "eval_runtime": 16.3997, "eval_samples_per_second": 2.683, "eval_steps_per_second": 0.183, "step": 3590 }, { "epoch": 0.9250088546865441, "grad_norm": 0.15858603689819276, "learning_rate": 1.7027389003920313e-06, "loss": 0.3533, "step": 3591 }, { "epoch": 0.9252664455678269, "grad_norm": 0.15268138246759289, "learning_rate": 1.6911226421171378e-06, "loss": 0.3639, "step": 3592 }, { "epoch": 0.9255240364491097, "grad_norm": 0.1692437619504843, "learning_rate": 1.6795454615868234e-06, "loss": 0.3816, "step": 3593 }, { "epoch": 0.9257816273303925, "grad_norm": 0.16953837399894867, "learning_rate": 1.6680073681660358e-06, "loss": 0.401, "step": 3594 }, { "epoch": 0.9260392182116753, "grad_norm": 0.19482660347644706, "learning_rate": 1.656508371188109e-06, "loss": 0.2827, "step": 3595 }, { "epoch": 0.9260392182116753, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859874279727606, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35520240664482117, "eval_runtime": 17.2187, "eval_samples_per_second": 2.555, "eval_steps_per_second": 0.174, "step": 3595 }, { "epoch": 0.9262968090929581, "grad_norm": 0.13849159515883916, "learning_rate": 1.6450484799547473e-06, "loss": 0.4034, "step": 3596 }, { "epoch": 0.9265543999742409, "grad_norm": 0.17046521701031161, "learning_rate": 1.6336277037360127e-06, "loss": 0.3568, "step": 3597 }, { "epoch": 0.9268119908555237, "grad_norm": 0.17147074585372724, "learning_rate": 1.622246051770343e-06, "loss": 0.4252, "step": 3598 }, { "epoch": 0.9270695817368065, "grad_norm": 0.17687896763490749, "learning_rate": 1.6109035332645183e-06, "loss": 0.3575, "step": 3599 }, { "epoch": 0.9273271726180893, "grad_norm": 0.1830855633473594, "learning_rate": 1.5996001573936604e-06, "loss": 0.3733, "step": 3600 }, { "epoch": 0.9273271726180893, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8593504452592982, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3565784692764282, "eval_runtime": 16.8833, "eval_samples_per_second": 2.606, "eval_steps_per_second": 0.178, "step": 3600 }, { "epoch": 0.9275847634993721, "grad_norm": 0.17321490179978577, "learning_rate": 1.5883359333012438e-06, "loss": 0.3897, "step": 3601 }, { "epoch": 0.9278423543806549, "grad_norm": 0.15898382741093173, "learning_rate": 1.5771108700990412e-06, "loss": 0.3738, "step": 3602 }, { "epoch": 0.9280999452619377, "grad_norm": 0.1391967307095472, "learning_rate": 1.5659249768671835e-06, "loss": 0.3337, "step": 3603 }, { "epoch": 0.9283575361432206, "grad_norm": 0.12481251556632249, "learning_rate": 1.5547782626540941e-06, "loss": 0.3264, "step": 3604 }, { "epoch": 0.9286151270245033, "grad_norm": 0.1582670706657496, "learning_rate": 1.5436707364765213e-06, "loss": 0.3687, "step": 3605 }, { "epoch": 0.9286151270245033, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8606600314300681, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3534712493419647, "eval_runtime": 17.7365, "eval_samples_per_second": 2.481, "eval_steps_per_second": 0.169, "step": 3605 }, { "epoch": 0.9288727179057862, "grad_norm": 0.1962104659388427, "learning_rate": 1.5326024073194834e-06, "loss": 0.4026, "step": 3606 }, { "epoch": 0.9291303087870689, "grad_norm": 0.13502688190956327, "learning_rate": 1.5215732841363239e-06, "loss": 0.2946, "step": 3607 }, { "epoch": 0.9293878996683518, "grad_norm": 0.11718572355068893, "learning_rate": 1.5105833758486621e-06, "loss": 0.298, "step": 3608 }, { "epoch": 0.9296454905496345, "grad_norm": 0.16677425259863735, "learning_rate": 1.4996326913463754e-06, "loss": 0.2994, "step": 3609 }, { "epoch": 0.9299030814309174, "grad_norm": 0.15552722462552468, "learning_rate": 1.4887212394876503e-06, "loss": 0.3641, "step": 3610 }, { "epoch": 0.9299030814309174, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8593504452592982, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3546253442764282, "eval_runtime": 17.1911, "eval_samples_per_second": 2.559, "eval_steps_per_second": 0.175, "step": 3610 }, { "epoch": 0.9301606723122001, "grad_norm": 0.1307387602339093, "learning_rate": 1.4778490290988934e-06, "loss": 0.3407, "step": 3611 }, { "epoch": 0.930418263193483, "grad_norm": 0.2251240226399944, "learning_rate": 1.467016068974819e-06, "loss": 0.4252, "step": 3612 }, { "epoch": 0.9306758540747657, "grad_norm": 0.1225706200048114, "learning_rate": 1.4562223678783516e-06, "loss": 0.2744, "step": 3613 }, { "epoch": 0.9309334449560486, "grad_norm": 0.14564700385711848, "learning_rate": 1.4454679345406619e-06, "loss": 0.3934, "step": 3614 }, { "epoch": 0.9311910358373313, "grad_norm": 0.16876178194128658, "learning_rate": 1.4347527776611746e-06, "loss": 0.3533, "step": 3615 }, { "epoch": 0.9311910358373313, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859350445259298, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3512073755264282, "eval_runtime": 17.5668, "eval_samples_per_second": 2.505, "eval_steps_per_second": 0.171, "step": 3615 }, { "epoch": 0.9314486267186142, "grad_norm": 0.1525862990991277, "learning_rate": 1.4240769059075342e-06, "loss": 0.2566, "step": 3616 }, { "epoch": 0.9317062175998969, "grad_norm": 0.14940505072760127, "learning_rate": 1.4134403279156106e-06, "loss": 0.2961, "step": 3617 }, { "epoch": 0.9319638084811798, "grad_norm": 0.15374299685837137, "learning_rate": 1.4028430522894765e-06, "loss": 0.3751, "step": 3618 }, { "epoch": 0.9322213993624626, "grad_norm": 0.1341987628806026, "learning_rate": 1.3922850876014192e-06, "loss": 0.343, "step": 3619 }, { "epoch": 0.9324789902437454, "grad_norm": 0.13654672843056637, "learning_rate": 1.3817664423919351e-06, "loss": 0.3156, "step": 3620 }, { "epoch": 0.9324789902437454, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8588266107909901, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.353515625, "eval_runtime": 17.5501, "eval_samples_per_second": 2.507, "eval_steps_per_second": 0.171, "step": 3620 }, { "epoch": 0.9327365811250282, "grad_norm": 0.16672504814855243, "learning_rate": 1.3712871251697012e-06, "loss": 0.3681, "step": 3621 }, { "epoch": 0.932994172006311, "grad_norm": 0.19594028408110487, "learning_rate": 1.3608471444115977e-06, "loss": 0.3699, "step": 3622 }, { "epoch": 0.9332517628875938, "grad_norm": 0.17086512939183604, "learning_rate": 1.3504465085626638e-06, "loss": 0.4609, "step": 3623 }, { "epoch": 0.9335093537688766, "grad_norm": 0.17268770687487686, "learning_rate": 1.3400852260361252e-06, "loss": 0.3939, "step": 3624 }, { "epoch": 0.9337669446501594, "grad_norm": 0.14195089254333754, "learning_rate": 1.3297633052133718e-06, "loss": 0.3224, "step": 3625 }, { "epoch": 0.9337669446501594, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8643268727082242, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3525390625, "eval_runtime": 17.1593, "eval_samples_per_second": 2.564, "eval_steps_per_second": 0.175, "step": 3625 }, { "epoch": 0.9340245355314422, "grad_norm": 0.15892233470683617, "learning_rate": 1.3194807544439635e-06, "loss": 0.373, "step": 3626 }, { "epoch": 0.934282126412725, "grad_norm": 0.13537545563985226, "learning_rate": 1.3092375820455916e-06, "loss": 0.3124, "step": 3627 }, { "epoch": 0.9345397172940078, "grad_norm": 0.15225779088304373, "learning_rate": 1.299033796304111e-06, "loss": 0.382, "step": 3628 }, { "epoch": 0.9347973081752906, "grad_norm": 0.16354081536121157, "learning_rate": 1.2888694054735085e-06, "loss": 0.3384, "step": 3629 }, { "epoch": 0.9350548990565734, "grad_norm": 0.15028260915943015, "learning_rate": 1.2787444177759068e-06, "loss": 0.3891, "step": 3630 }, { "epoch": 0.9350548990565734, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8596123624934522, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3546253442764282, "eval_runtime": 17.0396, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 3630 }, { "epoch": 0.9353124899378562, "grad_norm": 0.15976214590838345, "learning_rate": 1.2686588414015543e-06, "loss": 0.3122, "step": 3631 }, { "epoch": 0.935570080819139, "grad_norm": 0.13884197323278308, "learning_rate": 1.2586126845088086e-06, "loss": 0.3325, "step": 3632 }, { "epoch": 0.9358276717004218, "grad_norm": 0.15873924916917725, "learning_rate": 1.248605955224169e-06, "loss": 0.3719, "step": 3633 }, { "epoch": 0.9360852625817047, "grad_norm": 0.17844417291816023, "learning_rate": 1.2386386616422164e-06, "loss": 0.3619, "step": 3634 }, { "epoch": 0.9363428534629874, "grad_norm": 0.1429127723093715, "learning_rate": 1.228710811825623e-06, "loss": 0.3363, "step": 3635 }, { "epoch": 0.9363428534629874, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8577789418543739, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3564453125, "eval_runtime": 17.1988, "eval_samples_per_second": 2.558, "eval_steps_per_second": 0.174, "step": 3635 }, { "epoch": 0.9366004443442703, "grad_norm": 0.143553936055149, "learning_rate": 1.2188224138051874e-06, "loss": 0.3573, "step": 3636 }, { "epoch": 0.936858035225553, "grad_norm": 0.1570089595566499, "learning_rate": 1.208973475579761e-06, "loss": 0.3635, "step": 3637 }, { "epoch": 0.9371156261068359, "grad_norm": 0.1636449864279838, "learning_rate": 1.19916400511631e-06, "loss": 0.4452, "step": 3638 }, { "epoch": 0.9373732169881186, "grad_norm": 0.1434591093458333, "learning_rate": 1.189394010349848e-06, "loss": 0.3512, "step": 3639 }, { "epoch": 0.9376308078694015, "grad_norm": 0.1845146332799933, "learning_rate": 1.1796634991834476e-06, "loss": 0.3987, "step": 3640 }, { "epoch": 0.9376308078694015, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3558238744735718, "eval_runtime": 17.0517, "eval_samples_per_second": 2.58, "eval_steps_per_second": 0.176, "step": 3640 }, { "epoch": 0.9378883987506842, "grad_norm": 0.1850052147374829, "learning_rate": 1.1699724794882849e-06, "loss": 0.4093, "step": 3641 }, { "epoch": 0.938145989631967, "grad_norm": 0.140018455666938, "learning_rate": 1.1603209591035447e-06, "loss": 0.3434, "step": 3642 }, { "epoch": 0.9384035805132498, "grad_norm": 0.19723646319820293, "learning_rate": 1.1507089458364984e-06, "loss": 0.3912, "step": 3643 }, { "epoch": 0.9386611713945326, "grad_norm": 0.13679557778401036, "learning_rate": 1.1411364474624264e-06, "loss": 0.2239, "step": 3644 }, { "epoch": 0.9389187622758154, "grad_norm": 0.11434361612107999, "learning_rate": 1.1316034717246626e-06, "loss": 0.3308, "step": 3645 }, { "epoch": 0.9389187622758154, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8624934520691461, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35205078125, "eval_runtime": 17.0238, "eval_samples_per_second": 2.585, "eval_steps_per_second": 0.176, "step": 3645 }, { "epoch": 0.9391763531570982, "grad_norm": 0.13629942244093662, "learning_rate": 1.1221100263345773e-06, "loss": 0.3062, "step": 3646 }, { "epoch": 0.939433944038381, "grad_norm": 0.19287017509156754, "learning_rate": 1.1126561189715502e-06, "loss": 0.3842, "step": 3647 }, { "epoch": 0.9396915349196638, "grad_norm": 0.13998401829250906, "learning_rate": 1.1032417572829745e-06, "loss": 0.3509, "step": 3648 }, { "epoch": 0.9399491258009467, "grad_norm": 0.17528116018871204, "learning_rate": 1.0938669488842702e-06, "loss": 0.4325, "step": 3649 }, { "epoch": 0.9402067166822294, "grad_norm": 0.15921787864544712, "learning_rate": 1.0845317013588596e-06, "loss": 0.3764, "step": 3650 }, { "epoch": 0.9402067166822294, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.859874279727606, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35324928164482117, "eval_runtime": 17.04, "eval_samples_per_second": 2.582, "eval_steps_per_second": 0.176, "step": 3650 }, { "epoch": 0.9404643075635123, "grad_norm": 0.193952286619382, "learning_rate": 1.075236022258147e-06, "loss": 0.3405, "step": 3651 }, { "epoch": 0.940721898444795, "grad_norm": 0.26518998616866324, "learning_rate": 1.0659799191015507e-06, "loss": 0.4643, "step": 3652 }, { "epoch": 0.9409794893260779, "grad_norm": 0.13543714158708117, "learning_rate": 1.0567633993764537e-06, "loss": 0.273, "step": 3653 }, { "epoch": 0.9412370802073606, "grad_norm": 0.13373048613174426, "learning_rate": 1.0475864705382422e-06, "loss": 0.3098, "step": 3654 }, { "epoch": 0.9414946710886435, "grad_norm": 0.15415902218239402, "learning_rate": 1.0384491400102614e-06, "loss": 0.3667, "step": 3655 }, { "epoch": 0.9414946710886435, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3531605005264282, "eval_runtime": 16.5343, "eval_samples_per_second": 2.661, "eval_steps_per_second": 0.181, "step": 3655 }, { "epoch": 0.9417522619699262, "grad_norm": 0.16902528190442034, "learning_rate": 1.0293514151838268e-06, "loss": 0.4194, "step": 3656 }, { "epoch": 0.9420098528512091, "grad_norm": 0.1837710083377154, "learning_rate": 1.0202933034182237e-06, "loss": 0.3673, "step": 3657 }, { "epoch": 0.9422674437324918, "grad_norm": 0.155257115669239, "learning_rate": 1.0112748120406856e-06, "loss": 0.3239, "step": 3658 }, { "epoch": 0.9425250346137747, "grad_norm": 0.1603155333470742, "learning_rate": 1.0022959483464045e-06, "loss": 0.3068, "step": 3659 }, { "epoch": 0.9427826254950574, "grad_norm": 0.19221021847619366, "learning_rate": 9.933567195985094e-07, "loss": 0.4736, "step": 3660 }, { "epoch": 0.9427826254950574, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8619696176008381, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3556463122367859, "eval_runtime": 17.1711, "eval_samples_per_second": 2.562, "eval_steps_per_second": 0.175, "step": 3660 }, { "epoch": 0.9430402163763403, "grad_norm": 0.16379670288583872, "learning_rate": 9.844571330280549e-07, "loss": 0.4013, "step": 3661 }, { "epoch": 0.9432978072576231, "grad_norm": 0.17665040568388132, "learning_rate": 9.75597195834077e-07, "loss": 0.3604, "step": 3662 }, { "epoch": 0.9435553981389059, "grad_norm": 0.1694285296370909, "learning_rate": 9.66776915183476e-07, "loss": 0.3601, "step": 3663 }, { "epoch": 0.9438129890201887, "grad_norm": 0.12650901480029578, "learning_rate": 9.579962982111224e-07, "loss": 0.3239, "step": 3664 }, { "epoch": 0.9440705799014715, "grad_norm": 0.14756402561710022, "learning_rate": 9.492553520197733e-07, "loss": 0.4006, "step": 3665 }, { "epoch": 0.9440705799014715, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3529829680919647, "eval_runtime": 17.0353, "eval_samples_per_second": 2.583, "eval_steps_per_second": 0.176, "step": 3665 }, { "epoch": 0.9443281707827543, "grad_norm": 0.17854362312944283, "learning_rate": 9.405540836801119e-07, "loss": 0.3465, "step": 3666 }, { "epoch": 0.9445857616640371, "grad_norm": 0.17709937002340748, "learning_rate": 9.318925002307188e-07, "loss": 0.3149, "step": 3667 }, { "epoch": 0.9448433525453199, "grad_norm": 0.172973032323487, "learning_rate": 9.232706086780619e-07, "loss": 0.3452, "step": 3668 }, { "epoch": 0.9451009434266027, "grad_norm": 0.1345121785044483, "learning_rate": 9.146884159965286e-07, "loss": 0.2891, "step": 3669 }, { "epoch": 0.9453585343078855, "grad_norm": 0.13728174842331684, "learning_rate": 9.061459291283658e-07, "loss": 0.3148, "step": 3670 }, { "epoch": 0.9453585343078855, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.858040859088528, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3525390625, "eval_runtime": 16.9543, "eval_samples_per_second": 2.595, "eval_steps_per_second": 0.177, "step": 3670 }, { "epoch": 0.9456161251891683, "grad_norm": 0.12179028171270745, "learning_rate": 8.976431549837239e-07, "loss": 0.2727, "step": 3671 }, { "epoch": 0.9458737160704511, "grad_norm": 0.20292642131673685, "learning_rate": 8.891801004406119e-07, "loss": 0.4476, "step": 3672 }, { "epoch": 0.9461313069517339, "grad_norm": 0.2117910852732907, "learning_rate": 8.807567723449206e-07, "loss": 0.4602, "step": 3673 }, { "epoch": 0.9463888978330167, "grad_norm": 0.17428962139928333, "learning_rate": 8.723731775103938e-07, "loss": 0.4595, "step": 3674 }, { "epoch": 0.9466464887142995, "grad_norm": 0.2090642216310755, "learning_rate": 8.640293227186513e-07, "loss": 0.4209, "step": 3675 }, { "epoch": 0.9466464887142995, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859874279727606, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35422584414482117, "eval_runtime": 16.9944, "eval_samples_per_second": 2.589, "eval_steps_per_second": 0.177, "step": 3675 }, { "epoch": 0.9469040795955823, "grad_norm": 0.1414186990108163, "learning_rate": 8.557252147191497e-07, "loss": 0.3868, "step": 3676 }, { "epoch": 0.9471616704768652, "grad_norm": 0.14781947639985626, "learning_rate": 8.474608602292044e-07, "loss": 0.2981, "step": 3677 }, { "epoch": 0.9474192613581479, "grad_norm": 0.14013584779347527, "learning_rate": 8.392362659339681e-07, "loss": 0.3697, "step": 3678 }, { "epoch": 0.9476768522394308, "grad_norm": 0.15392211696114294, "learning_rate": 8.31051438486441e-07, "loss": 0.3278, "step": 3679 }, { "epoch": 0.9479344431207135, "grad_norm": 0.2299225601108455, "learning_rate": 8.22906384507438e-07, "loss": 0.422, "step": 3680 }, { "epoch": 0.9479344431207135, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8548978522786799, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3544478118419647, "eval_runtime": 17.2464, "eval_samples_per_second": 2.551, "eval_steps_per_second": 0.174, "step": 3680 }, { "epoch": 0.9481920340019964, "grad_norm": 0.16274285836944163, "learning_rate": 8.148011105856168e-07, "loss": 0.4064, "step": 3681 }, { "epoch": 0.9484496248832791, "grad_norm": 0.20910361953817333, "learning_rate": 8.067356232774437e-07, "loss": 0.473, "step": 3682 }, { "epoch": 0.948707215764562, "grad_norm": 0.17748660504950942, "learning_rate": 7.987099291072109e-07, "loss": 0.3576, "step": 3683 }, { "epoch": 0.9489648066458447, "grad_norm": 0.1578814384448594, "learning_rate": 7.907240345670142e-07, "loss": 0.3753, "step": 3684 }, { "epoch": 0.9492223975271276, "grad_norm": 0.15212521856275274, "learning_rate": 7.827779461167695e-07, "loss": 0.3193, "step": 3685 }, { "epoch": 0.9492223975271276, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.861707700366684, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3528497815132141, "eval_runtime": 17.6253, "eval_samples_per_second": 2.496, "eval_steps_per_second": 0.17, "step": 3685 }, { "epoch": 0.9494799884084103, "grad_norm": 0.18749221830312565, "learning_rate": 7.748716701841685e-07, "loss": 0.3724, "step": 3686 }, { "epoch": 0.9497375792896932, "grad_norm": 0.1891080708391055, "learning_rate": 7.670052131647121e-07, "loss": 0.389, "step": 3687 }, { "epoch": 0.9499951701709759, "grad_norm": 0.21227202340748516, "learning_rate": 7.591785814217046e-07, "loss": 0.3401, "step": 3688 }, { "epoch": 0.9502527610522588, "grad_norm": 0.1648754080971513, "learning_rate": 7.513917812862037e-07, "loss": 0.3453, "step": 3689 }, { "epoch": 0.9505103519335415, "grad_norm": 0.19280860950145984, "learning_rate": 7.436448190570766e-07, "loss": 0.3472, "step": 3690 }, { "epoch": 0.9505103519335415, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859874279727606, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3533824682235718, "eval_runtime": 17.2241, "eval_samples_per_second": 2.555, "eval_steps_per_second": 0.174, "step": 3690 }, { "epoch": 0.9507679428148244, "grad_norm": 0.14333195087175796, "learning_rate": 7.359377010009383e-07, "loss": 0.2865, "step": 3691 }, { "epoch": 0.9510255336961072, "grad_norm": 0.18370111816292833, "learning_rate": 7.282704333522017e-07, "loss": 0.3927, "step": 3692 }, { "epoch": 0.95128312457739, "grad_norm": 0.1728863568975308, "learning_rate": 7.206430223130278e-07, "loss": 0.3012, "step": 3693 }, { "epoch": 0.9515407154586728, "grad_norm": 0.15169059013242978, "learning_rate": 7.130554740533313e-07, "loss": 0.3035, "step": 3694 }, { "epoch": 0.9517983063399555, "grad_norm": 0.13965884246701635, "learning_rate": 7.055077947107858e-07, "loss": 0.3257, "step": 3695 }, { "epoch": 0.9517983063399555, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859874279727606, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35205078125, "eval_runtime": 16.9261, "eval_samples_per_second": 2.6, "eval_steps_per_second": 0.177, "step": 3695 }, { "epoch": 0.9520558972212384, "grad_norm": 0.15234151942918903, "learning_rate": 6.979999903908297e-07, "loss": 0.2756, "step": 3696 }, { "epoch": 0.9523134881025211, "grad_norm": 0.17011987219811123, "learning_rate": 6.905320671666326e-07, "loss": 0.3531, "step": 3697 }, { "epoch": 0.952571078983804, "grad_norm": 0.20705912072551072, "learning_rate": 6.831040310790959e-07, "loss": 0.4757, "step": 3698 }, { "epoch": 0.9528286698650867, "grad_norm": 0.12767561963277557, "learning_rate": 6.757158881368686e-07, "loss": 0.3342, "step": 3699 }, { "epoch": 0.9530862607463696, "grad_norm": 0.17796177316584283, "learning_rate": 6.683676443163311e-07, "loss": 0.3029, "step": 3700 }, { "epoch": 0.9530862607463696, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8622315348349922, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3525390625, "eval_runtime": 17.2548, "eval_samples_per_second": 2.55, "eval_steps_per_second": 0.174, "step": 3700 }, { "epoch": 0.9533438516276523, "grad_norm": 0.1310624988332114, "learning_rate": 6.610593055615733e-07, "loss": 0.3261, "step": 3701 }, { "epoch": 0.9536014425089352, "grad_norm": 0.13505877689353882, "learning_rate": 6.537908777844215e-07, "loss": 0.3194, "step": 3702 }, { "epoch": 0.9538590333902179, "grad_norm": 0.14249633091361077, "learning_rate": 6.465623668644117e-07, "loss": 0.3034, "step": 3703 }, { "epoch": 0.9541166242715008, "grad_norm": 0.14268727301342632, "learning_rate": 6.393737786487885e-07, "loss": 0.3654, "step": 3704 }, { "epoch": 0.9543742151527836, "grad_norm": 0.1564181616551385, "learning_rate": 6.322251189525008e-07, "loss": 0.3605, "step": 3705 }, { "epoch": 0.9543742151527836, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8590885280251441, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3514293432235718, "eval_runtime": 17.4001, "eval_samples_per_second": 2.529, "eval_steps_per_second": 0.172, "step": 3705 }, { "epoch": 0.9546318060340664, "grad_norm": 0.16752144840241906, "learning_rate": 6.251163935582116e-07, "loss": 0.3424, "step": 3706 }, { "epoch": 0.9548893969153492, "grad_norm": 0.1731135089318462, "learning_rate": 6.180476082162656e-07, "loss": 0.3848, "step": 3707 }, { "epoch": 0.955146987796632, "grad_norm": 0.15070275416486573, "learning_rate": 6.110187686447e-07, "loss": 0.3657, "step": 3708 }, { "epoch": 0.9554045786779148, "grad_norm": 0.18480108877326346, "learning_rate": 6.040298805292499e-07, "loss": 0.3594, "step": 3709 }, { "epoch": 0.9556621695591976, "grad_norm": 0.1451269599547431, "learning_rate": 5.970809495233265e-07, "loss": 0.3382, "step": 3710 }, { "epoch": 0.9556621695591976, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8588266107909901, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3533380627632141, "eval_runtime": 17.1366, "eval_samples_per_second": 2.568, "eval_steps_per_second": 0.175, "step": 3710 }, { "epoch": 0.9559197604404804, "grad_norm": 0.204747373910136, "learning_rate": 5.901719812480166e-07, "loss": 0.4478, "step": 3711 }, { "epoch": 0.9561773513217632, "grad_norm": 0.12067191724353114, "learning_rate": 5.833029812920831e-07, "loss": 0.3148, "step": 3712 }, { "epoch": 0.956434942203046, "grad_norm": 0.15870357656342368, "learning_rate": 5.764739552119702e-07, "loss": 0.4068, "step": 3713 }, { "epoch": 0.9566925330843288, "grad_norm": 0.1973206592364747, "learning_rate": 5.696849085317646e-07, "loss": 0.3478, "step": 3714 }, { "epoch": 0.9569501239656116, "grad_norm": 0.2018788475412071, "learning_rate": 5.629358467432289e-07, "loss": 0.4264, "step": 3715 }, { "epoch": 0.9569501239656116, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.86013619696176, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3541370630264282, "eval_runtime": 17.3697, "eval_samples_per_second": 2.533, "eval_steps_per_second": 0.173, "step": 3715 }, { "epoch": 0.9572077148468944, "grad_norm": 0.15152106035513985, "learning_rate": 5.562267753057626e-07, "loss": 0.3867, "step": 3716 }, { "epoch": 0.9574653057281772, "grad_norm": 0.13845243247216737, "learning_rate": 5.495576996464468e-07, "loss": 0.3161, "step": 3717 }, { "epoch": 0.95772289660946, "grad_norm": 0.13210334465496898, "learning_rate": 5.429286251599885e-07, "loss": 0.3148, "step": 3718 }, { "epoch": 0.9579804874907428, "grad_norm": 0.1571066170842066, "learning_rate": 5.363395572087371e-07, "loss": 0.3541, "step": 3719 }, { "epoch": 0.9582380783720257, "grad_norm": 0.15295813994550886, "learning_rate": 5.297905011226845e-07, "loss": 0.4044, "step": 3720 }, { "epoch": 0.9582380783720257, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.86013619696176, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3545365631580353, "eval_runtime": 17.1569, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 3720 }, { "epoch": 0.9584956692533084, "grad_norm": 0.19608383974821886, "learning_rate": 5.232814621994598e-07, "loss": 0.4614, "step": 3721 }, { "epoch": 0.9587532601345913, "grad_norm": 0.16729845368017604, "learning_rate": 5.168124457043178e-07, "loss": 0.3416, "step": 3722 }, { "epoch": 0.959010851015874, "grad_norm": 0.1385253217089452, "learning_rate": 5.103834568701338e-07, "loss": 0.3307, "step": 3723 }, { "epoch": 0.9592684418971569, "grad_norm": 0.13269673976828575, "learning_rate": 5.039945008974145e-07, "loss": 0.3276, "step": 3724 }, { "epoch": 0.9595260327784396, "grad_norm": 0.1505006388364205, "learning_rate": 4.976455829542704e-07, "loss": 0.3554, "step": 3725 }, { "epoch": 0.9595260327784396, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8606600314300681, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3522283434867859, "eval_runtime": 17.3805, "eval_samples_per_second": 2.532, "eval_steps_per_second": 0.173, "step": 3725 }, { "epoch": 0.9597836236597225, "grad_norm": 0.15422220137904377, "learning_rate": 4.91336708176443e-07, "loss": 0.307, "step": 3726 }, { "epoch": 0.9600412145410052, "grad_norm": 0.1948051781206229, "learning_rate": 4.850678816672671e-07, "loss": 0.3772, "step": 3727 }, { "epoch": 0.9602988054222881, "grad_norm": 0.11942577613308271, "learning_rate": 4.788391084976862e-07, "loss": 0.3148, "step": 3728 }, { "epoch": 0.9605563963035708, "grad_norm": 0.16581696493096246, "learning_rate": 4.726503937062421e-07, "loss": 0.3584, "step": 3729 }, { "epoch": 0.9608139871848537, "grad_norm": 0.18270653336601703, "learning_rate": 4.6650174229908026e-07, "loss": 0.3931, "step": 3730 }, { "epoch": 0.9608139871848537, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859350445259298, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35400390625, "eval_runtime": 17.6109, "eval_samples_per_second": 2.498, "eval_steps_per_second": 0.17, "step": 3730 }, { "epoch": 0.9610715780661364, "grad_norm": 0.1656800706537147, "learning_rate": 4.6039315924992774e-07, "loss": 0.337, "step": 3731 }, { "epoch": 0.9613291689474193, "grad_norm": 0.15687605108049824, "learning_rate": 4.543246495001097e-07, "loss": 0.3087, "step": 3732 }, { "epoch": 0.961586759828702, "grad_norm": 0.41979890458747227, "learning_rate": 4.4829621795852705e-07, "loss": 0.4024, "step": 3733 }, { "epoch": 0.9618443507099849, "grad_norm": 0.18933485246564027, "learning_rate": 4.42307869501668e-07, "loss": 0.4332, "step": 3734 }, { "epoch": 0.9621019415912677, "grad_norm": 0.1369765834241001, "learning_rate": 4.363596089735911e-07, "loss": 0.3336, "step": 3735 }, { "epoch": 0.9621019415912677, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.858040859088528, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35520240664482117, "eval_runtime": 16.9809, "eval_samples_per_second": 2.591, "eval_steps_per_second": 0.177, "step": 3735 }, { "epoch": 0.9623595324725505, "grad_norm": 0.1743975417300076, "learning_rate": 4.304514411859306e-07, "loss": 0.4265, "step": 3736 }, { "epoch": 0.9626171233538333, "grad_norm": 0.18163224348449938, "learning_rate": 4.2458337091788593e-07, "loss": 0.4083, "step": 3737 }, { "epoch": 0.9628747142351161, "grad_norm": 0.15285926097764635, "learning_rate": 4.1875540291622106e-07, "loss": 0.3955, "step": 3738 }, { "epoch": 0.9631323051163989, "grad_norm": 0.16429583098588607, "learning_rate": 4.129675418952761e-07, "loss": 0.3556, "step": 3739 }, { "epoch": 0.9633898959976817, "grad_norm": 0.22238495157892732, "learning_rate": 4.0721979253692254e-07, "loss": 0.4598, "step": 3740 }, { "epoch": 0.9633898959976817, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8588266107909901, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35422584414482117, "eval_runtime": 16.9862, "eval_samples_per_second": 2.59, "eval_steps_per_second": 0.177, "step": 3740 }, { "epoch": 0.9636474868789645, "grad_norm": 0.17674656977462916, "learning_rate": 4.015121594906024e-07, "loss": 0.3965, "step": 3741 }, { "epoch": 0.9639050777602473, "grad_norm": 0.16840117530400994, "learning_rate": 3.958446473733002e-07, "loss": 0.4132, "step": 3742 }, { "epoch": 0.9641626686415301, "grad_norm": 0.13867074302418367, "learning_rate": 3.9021726076954867e-07, "loss": 0.3525, "step": 3743 }, { "epoch": 0.9644202595228129, "grad_norm": 0.1459626178307732, "learning_rate": 3.8463000423142326e-07, "loss": 0.3487, "step": 3744 }, { "epoch": 0.9646778504040957, "grad_norm": 0.15807260960562433, "learning_rate": 3.7908288227853085e-07, "loss": 0.3266, "step": 3745 }, { "epoch": 0.9646778504040957, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.859088528025144, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35506924986839294, "eval_runtime": 17.1534, "eval_samples_per_second": 2.565, "eval_steps_per_second": 0.175, "step": 3745 }, { "epoch": 0.9649354412853784, "grad_norm": 0.1452604989808499, "learning_rate": 3.73575899398021e-07, "loss": 0.3457, "step": 3746 }, { "epoch": 0.9651930321666613, "grad_norm": 0.19165309239817846, "learning_rate": 3.681090600445747e-07, "loss": 0.4019, "step": 3747 }, { "epoch": 0.9654506230479442, "grad_norm": 0.1471576365965977, "learning_rate": 3.626823686403935e-07, "loss": 0.3234, "step": 3748 }, { "epoch": 0.9657082139292269, "grad_norm": 0.18331570304808137, "learning_rate": 3.572958295752049e-07, "loss": 0.4197, "step": 3749 }, { "epoch": 0.9659658048105098, "grad_norm": 0.1497592311083479, "learning_rate": 3.519494472062568e-07, "loss": 0.2976, "step": 3750 }, { "epoch": 0.9659658048105098, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8624934520691461, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3533824682235718, "eval_runtime": 17.4882, "eval_samples_per_second": 2.516, "eval_steps_per_second": 0.172, "step": 3750 }, { "epoch": 0.9662233956917925, "grad_norm": 0.18542590579616175, "learning_rate": 3.466432258583174e-07, "loss": 0.2955, "step": 3751 }, { "epoch": 0.9664809865730754, "grad_norm": 0.14196607964512953, "learning_rate": 3.4137716982366453e-07, "loss": 0.2848, "step": 3752 }, { "epoch": 0.9667385774543581, "grad_norm": 0.16210220602760117, "learning_rate": 3.3615128336209054e-07, "loss": 0.4347, "step": 3753 }, { "epoch": 0.966996168335641, "grad_norm": 0.12357408535083989, "learning_rate": 3.309655707008863e-07, "loss": 0.3585, "step": 3754 }, { "epoch": 0.9672537592169237, "grad_norm": 0.13618250690592645, "learning_rate": 3.258200360348462e-07, "loss": 0.3281, "step": 3755 }, { "epoch": 0.9672537592169237, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8588266107909899, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35360440611839294, "eval_runtime": 17.0303, "eval_samples_per_second": 2.584, "eval_steps_per_second": 0.176, "step": 3755 }, { "epoch": 0.9675113500982065, "grad_norm": 0.13654383235663448, "learning_rate": 3.207146835262742e-07, "loss": 0.3063, "step": 3756 }, { "epoch": 0.9677689409794893, "grad_norm": 0.15999728729569007, "learning_rate": 3.1564951730495006e-07, "loss": 0.3554, "step": 3757 }, { "epoch": 0.9680265318607721, "grad_norm": 0.16211117805780945, "learning_rate": 3.106245414681741e-07, "loss": 0.3693, "step": 3758 }, { "epoch": 0.9682841227420549, "grad_norm": 0.21034146330880885, "learning_rate": 3.0563976008071706e-07, "loss": 0.4134, "step": 3759 }, { "epoch": 0.9685417136233377, "grad_norm": 0.14652568706774757, "learning_rate": 3.006951771748423e-07, "loss": 0.3347, "step": 3760 }, { "epoch": 0.9685417136233377, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.857778941854374, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3546697497367859, "eval_runtime": 16.9428, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 3760 }, { "epoch": 0.9687993045046205, "grad_norm": 0.14316930791436056, "learning_rate": 2.9579079675028374e-07, "loss": 0.3233, "step": 3761 }, { "epoch": 0.9690568953859033, "grad_norm": 0.2000551747105647, "learning_rate": 2.9092662277427906e-07, "loss": 0.4459, "step": 3762 }, { "epoch": 0.9693144862671862, "grad_norm": 0.165468342566276, "learning_rate": 2.8610265918151414e-07, "loss": 0.3376, "step": 3763 }, { "epoch": 0.9695720771484689, "grad_norm": 0.11885486319727619, "learning_rate": 2.813189098741731e-07, "loss": 0.2936, "step": 3764 }, { "epoch": 0.9698296680297518, "grad_norm": 0.18333947791187652, "learning_rate": 2.7657537872189386e-07, "loss": 0.4077, "step": 3765 }, { "epoch": 0.9698296680297518, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8601361969617601, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35245028138160706, "eval_runtime": 17.0879, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 3765 }, { "epoch": 0.9700872589110345, "grad_norm": 0.18535954788255296, "learning_rate": 2.7187206956179047e-07, "loss": 0.404, "step": 3766 }, { "epoch": 0.9703448497923174, "grad_norm": 0.17033575330351897, "learning_rate": 2.6720898619843615e-07, "loss": 0.3333, "step": 3767 }, { "epoch": 0.9706024406736001, "grad_norm": 0.1340335465058161, "learning_rate": 2.625861324038692e-07, "loss": 0.3344, "step": 3768 }, { "epoch": 0.970860031554883, "grad_norm": 0.1539518992267126, "learning_rate": 2.580035119175761e-07, "loss": 0.3689, "step": 3769 }, { "epoch": 0.9711176224361657, "grad_norm": 0.22640026655678336, "learning_rate": 2.534611284465083e-07, "loss": 0.404, "step": 3770 }, { "epoch": 0.9711176224361657, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8601361969617599, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35391512513160706, "eval_runtime": 17.1355, "eval_samples_per_second": 2.568, "eval_steps_per_second": 0.175, "step": 3770 }, { "epoch": 0.9713752133174486, "grad_norm": 0.1467583746360964, "learning_rate": 2.4895898566505983e-07, "loss": 0.3658, "step": 3771 }, { "epoch": 0.9716328041987313, "grad_norm": 0.15289702694249147, "learning_rate": 2.4449708721508424e-07, "loss": 0.3454, "step": 3772 }, { "epoch": 0.9718903950800142, "grad_norm": 0.16047779634622722, "learning_rate": 2.4007543670587774e-07, "loss": 0.4495, "step": 3773 }, { "epoch": 0.9721479859612969, "grad_norm": 0.1665765188938278, "learning_rate": 2.356940377141681e-07, "loss": 0.4329, "step": 3774 }, { "epoch": 0.9724055768425798, "grad_norm": 0.1179113612466018, "learning_rate": 2.3135289378413694e-07, "loss": 0.3069, "step": 3775 }, { "epoch": 0.9724055768425798, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8569931901519119, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3548029065132141, "eval_runtime": 17.5981, "eval_samples_per_second": 2.5, "eval_steps_per_second": 0.17, "step": 3775 }, { "epoch": 0.9726631677238625, "grad_norm": 0.16314819661869495, "learning_rate": 2.2705200842740305e-07, "loss": 0.2938, "step": 3776 }, { "epoch": 0.9729207586051454, "grad_norm": 0.20572881699364856, "learning_rate": 2.2279138512300567e-07, "loss": 0.3926, "step": 3777 }, { "epoch": 0.9731783494864282, "grad_norm": 0.16351923007215768, "learning_rate": 2.1857102731742684e-07, "loss": 0.309, "step": 3778 }, { "epoch": 0.973435940367711, "grad_norm": 0.15430164950532926, "learning_rate": 2.143909384245746e-07, "loss": 0.34, "step": 3779 }, { "epoch": 0.9736935312489938, "grad_norm": 0.17881733482234016, "learning_rate": 2.10251121825783e-07, "loss": 0.3813, "step": 3780 }, { "epoch": 0.9736935312489938, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.857778941854374, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3528497815132141, "eval_runtime": 16.9415, "eval_samples_per_second": 2.597, "eval_steps_per_second": 0.177, "step": 3780 }, { "epoch": 0.9739511221302766, "grad_norm": 0.1759713240969221, "learning_rate": 2.0615158086981222e-07, "loss": 0.4305, "step": 3781 }, { "epoch": 0.9742087130115594, "grad_norm": 0.15528693139533326, "learning_rate": 2.020923188728374e-07, "loss": 0.3215, "step": 3782 }, { "epoch": 0.9744663038928422, "grad_norm": 0.1394952976316927, "learning_rate": 1.980733391184486e-07, "loss": 0.335, "step": 3783 }, { "epoch": 0.974723894774125, "grad_norm": 0.16330749731661878, "learning_rate": 1.940946448576675e-07, "loss": 0.3388, "step": 3784 }, { "epoch": 0.9749814856554078, "grad_norm": 0.13626155155802247, "learning_rate": 1.9015623930890846e-07, "loss": 0.3177, "step": 3785 }, { "epoch": 0.9749814856554078, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8617077003666841, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35196200013160706, "eval_runtime": 16.6163, "eval_samples_per_second": 2.648, "eval_steps_per_second": 0.181, "step": 3785 }, { "epoch": 0.9752390765366906, "grad_norm": 0.16720574020751214, "learning_rate": 1.8625812565800648e-07, "loss": 0.4074, "step": 3786 }, { "epoch": 0.9754966674179734, "grad_norm": 0.16792236698504823, "learning_rate": 1.8240030705820032e-07, "loss": 0.3667, "step": 3787 }, { "epoch": 0.9757542582992562, "grad_norm": 0.1932284534720809, "learning_rate": 1.7858278663013817e-07, "loss": 0.3507, "step": 3788 }, { "epoch": 0.976011849180539, "grad_norm": 0.15949009758829952, "learning_rate": 1.748055674618665e-07, "loss": 0.2286, "step": 3789 }, { "epoch": 0.9762694400618218, "grad_norm": 0.17407811866438883, "learning_rate": 1.710686526088301e-07, "loss": 0.3552, "step": 3790 }, { "epoch": 0.9762694400618218, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35324928164482117, "eval_runtime": 17.4588, "eval_samples_per_second": 2.52, "eval_steps_per_second": 0.172, "step": 3790 }, { "epoch": 0.9765270309431047, "grad_norm": 0.18141142441348804, "learning_rate": 1.6737204509387206e-07, "loss": 0.4585, "step": 3791 }, { "epoch": 0.9767846218243874, "grad_norm": 0.17238267023227896, "learning_rate": 1.6371574790723377e-07, "loss": 0.3291, "step": 3792 }, { "epoch": 0.9770422127056703, "grad_norm": 0.18083413404662643, "learning_rate": 1.6009976400654937e-07, "loss": 0.3972, "step": 3793 }, { "epoch": 0.977299803586953, "grad_norm": 0.1659465500339923, "learning_rate": 1.5652409631682908e-07, "loss": 0.3672, "step": 3794 }, { "epoch": 0.9775573944682359, "grad_norm": 0.13994735128114089, "learning_rate": 1.529887477304981e-07, "loss": 0.4038, "step": 3795 }, { "epoch": 0.9775573944682359, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8572551073860659, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3546253442764282, "eval_runtime": 16.6268, "eval_samples_per_second": 2.646, "eval_steps_per_second": 0.18, "step": 3795 }, { "epoch": 0.9778149853495186, "grad_norm": 0.14847747360892083, "learning_rate": 1.494937211073355e-07, "loss": 0.3311, "step": 3796 }, { "epoch": 0.9780725762308015, "grad_norm": 0.14264566608027543, "learning_rate": 1.4603901927452978e-07, "loss": 0.3381, "step": 3797 }, { "epoch": 0.9783301671120842, "grad_norm": 0.13899999288446177, "learning_rate": 1.4262464502663443e-07, "loss": 0.3626, "step": 3798 }, { "epoch": 0.9785877579933671, "grad_norm": 0.13291754858024754, "learning_rate": 1.3925060112557898e-07, "loss": 0.3594, "step": 3799 }, { "epoch": 0.9788453488746498, "grad_norm": 0.15571500003310815, "learning_rate": 1.3591689030068577e-07, "loss": 0.3405, "step": 3800 }, { "epoch": 0.9788453488746498, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8795180722891566, "eval_PRM F1 AUC": 0.7223677317967523, "eval_PRM F1 AUC (fixed)": 0.8590885280251439, "eval_PRM F1 Neg": 0.5652173913043478, "eval_PRM NPV": 0.5652173913043478, "eval_PRM Precision": 0.8795180722891566, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.3543146252632141, "eval_runtime": 17.097, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 3800 }, { "epoch": 0.9791029397559327, "grad_norm": 0.18620757337239352, "learning_rate": 1.3262351524864213e-07, "loss": 0.4272, "step": 3801 }, { "epoch": 0.9793605306372154, "grad_norm": 0.1756420655693183, "learning_rate": 1.2937047863350037e-07, "loss": 0.2808, "step": 3802 }, { "epoch": 0.9796181215184983, "grad_norm": 0.14244491271889062, "learning_rate": 1.2615778308668892e-07, "loss": 0.2852, "step": 3803 }, { "epoch": 0.979875712399781, "grad_norm": 0.1516494617807825, "learning_rate": 1.2298543120700113e-07, "loss": 0.3433, "step": 3804 }, { "epoch": 0.9801333032810639, "grad_norm": 0.14925646654192018, "learning_rate": 1.1985342556060652e-07, "loss": 0.2899, "step": 3805 }, { "epoch": 0.9801333032810639, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8609219486642221, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3538263440132141, "eval_runtime": 17.8024, "eval_samples_per_second": 2.472, "eval_steps_per_second": 0.169, "step": 3805 }, { "epoch": 0.9803908941623467, "grad_norm": 0.14432809565504431, "learning_rate": 1.1676176868102295e-07, "loss": 0.3247, "step": 3806 }, { "epoch": 0.9806484850436294, "grad_norm": 0.17548929482352033, "learning_rate": 1.1371046306914435e-07, "loss": 0.3986, "step": 3807 }, { "epoch": 0.9809060759249123, "grad_norm": 0.13571487128816537, "learning_rate": 1.1069951119320188e-07, "loss": 0.3344, "step": 3808 }, { "epoch": 0.981163666806195, "grad_norm": 0.14559430886412886, "learning_rate": 1.0772891548880282e-07, "loss": 0.3374, "step": 3809 }, { "epoch": 0.9814212576874779, "grad_norm": 0.15790207391145736, "learning_rate": 1.0479867835891389e-07, "loss": 0.3819, "step": 3810 }, { "epoch": 0.9814212576874779, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.85620743844945, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3541814684867859, "eval_runtime": 17.5142, "eval_samples_per_second": 2.512, "eval_steps_per_second": 0.171, "step": 3810 }, { "epoch": 0.9816788485687606, "grad_norm": 0.14105410419460254, "learning_rate": 1.0190880217383347e-07, "loss": 0.3418, "step": 3811 }, { "epoch": 0.9819364394500435, "grad_norm": 0.16032004791537616, "learning_rate": 9.905928927123609e-08, "loss": 0.2992, "step": 3812 }, { "epoch": 0.9821940303313262, "grad_norm": 0.17342208377038257, "learning_rate": 9.625014195612236e-08, "loss": 0.3601, "step": 3813 }, { "epoch": 0.9824516212126091, "grad_norm": 0.13949111908780418, "learning_rate": 9.348136250085793e-08, "loss": 0.3036, "step": 3814 }, { "epoch": 0.9827092120938918, "grad_norm": 0.1604200708844017, "learning_rate": 9.075295314514565e-08, "loss": 0.3832, "step": 3815 }, { "epoch": 0.9827092120938918, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859350445259298, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3556019067764282, "eval_runtime": 17.1716, "eval_samples_per_second": 2.562, "eval_steps_per_second": 0.175, "step": 3815 }, { "epoch": 0.9829668029751747, "grad_norm": 0.15596615102074293, "learning_rate": 8.806491609603673e-08, "loss": 0.3538, "step": 3816 }, { "epoch": 0.9832243938564574, "grad_norm": 0.1798691547838207, "learning_rate": 8.541725352791963e-08, "loss": 0.3654, "step": 3817 }, { "epoch": 0.9834819847377403, "grad_norm": 0.16031802102742165, "learning_rate": 8.280996758253112e-08, "loss": 0.363, "step": 3818 }, { "epoch": 0.983739575619023, "grad_norm": 0.13947517080899272, "learning_rate": 8.02430603689397e-08, "loss": 0.315, "step": 3819 }, { "epoch": 0.9839971665003059, "grad_norm": 0.16446868867314984, "learning_rate": 7.77165339635566e-08, "loss": 0.394, "step": 3820 }, { "epoch": 0.9839971665003059, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8619696176008381, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35427024960517883, "eval_runtime": 17.0867, "eval_samples_per_second": 2.575, "eval_steps_per_second": 0.176, "step": 3820 }, { "epoch": 0.9842547573815887, "grad_norm": 0.1385861107711507, "learning_rate": 7.523039041012481e-08, "loss": 0.3465, "step": 3821 }, { "epoch": 0.9845123482628715, "grad_norm": 0.12561988471237037, "learning_rate": 7.27846317197134e-08, "loss": 0.3569, "step": 3822 }, { "epoch": 0.9847699391441543, "grad_norm": 0.19075340599019874, "learning_rate": 7.037925987074534e-08, "loss": 0.324, "step": 3823 }, { "epoch": 0.9850275300254371, "grad_norm": 0.1658793046587931, "learning_rate": 6.801427680894756e-08, "loss": 0.3466, "step": 3824 }, { "epoch": 0.9852851209067199, "grad_norm": 0.1456440297940814, "learning_rate": 6.568968444739532e-08, "loss": 0.4245, "step": 3825 }, { "epoch": 0.9852851209067199, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8862275449101796, "eval_PRM F1 AUC": 0.7283918281822945, "eval_PRM F1 AUC (fixed)": 0.8588266107909899, "eval_PRM F1 Neg": 0.5777777777777777, "eval_PRM NPV": 0.5909090909090909, "eval_PRM Precision": 0.8809523809523809, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.5652173913043478, "eval_loss": 0.35573509335517883, "eval_runtime": 17.1337, "eval_samples_per_second": 2.568, "eval_steps_per_second": 0.175, "step": 3825 }, { "epoch": 0.9855427117880027, "grad_norm": 0.13283828143284623, "learning_rate": 6.340548466648443e-08, "loss": 0.2988, "step": 3826 }, { "epoch": 0.9858003026692855, "grad_norm": 0.1839927084008868, "learning_rate": 6.116167931393691e-08, "loss": 0.3724, "step": 3827 }, { "epoch": 0.9860578935505683, "grad_norm": 0.14082341113721372, "learning_rate": 5.895827020479527e-08, "loss": 0.276, "step": 3828 }, { "epoch": 0.9863154844318511, "grad_norm": 0.14357908740989736, "learning_rate": 5.6795259121439345e-08, "loss": 0.2945, "step": 3829 }, { "epoch": 0.9865730753131339, "grad_norm": 0.15451102193521904, "learning_rate": 5.4672647813547305e-08, "loss": 0.3223, "step": 3830 }, { "epoch": 0.9865730753131339, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8551597695128339, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3560901880264282, "eval_runtime": 16.8872, "eval_samples_per_second": 2.606, "eval_steps_per_second": 0.178, "step": 3830 }, { "epoch": 0.9868306661944167, "grad_norm": 0.17445890619553567, "learning_rate": 5.2590437998134566e-08, "loss": 0.4237, "step": 3831 }, { "epoch": 0.9870882570756995, "grad_norm": 0.1255277707156797, "learning_rate": 5.054863135953158e-08, "loss": 0.3201, "step": 3832 }, { "epoch": 0.9873458479569823, "grad_norm": 0.1420320075937339, "learning_rate": 4.8547229549383844e-08, "loss": 0.4258, "step": 3833 }, { "epoch": 0.9876034388382652, "grad_norm": 0.16849844384390825, "learning_rate": 4.658623418665742e-08, "loss": 0.3963, "step": 3834 }, { "epoch": 0.9878610297195479, "grad_norm": 0.13801399523631844, "learning_rate": 4.4665646857627864e-08, "loss": 0.3911, "step": 3835 }, { "epoch": 0.9878610297195479, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8619696176008381, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35400390625, "eval_runtime": 17.5443, "eval_samples_per_second": 2.508, "eval_steps_per_second": 0.171, "step": 3835 }, { "epoch": 0.9881186206008308, "grad_norm": 0.14497941822115065, "learning_rate": 4.278546911588022e-08, "loss": 0.337, "step": 3836 }, { "epoch": 0.9883762114821135, "grad_norm": 0.17940620321670397, "learning_rate": 4.094570248232565e-08, "loss": 0.3965, "step": 3837 }, { "epoch": 0.9886338023633964, "grad_norm": 0.13987601268318273, "learning_rate": 3.9146348445173733e-08, "loss": 0.3451, "step": 3838 }, { "epoch": 0.9888913932446791, "grad_norm": 0.16282875349357964, "learning_rate": 3.7387408459949035e-08, "loss": 0.3761, "step": 3839 }, { "epoch": 0.989148984125962, "grad_norm": 0.15513189177962927, "learning_rate": 3.566888394948009e-08, "loss": 0.3252, "step": 3840 }, { "epoch": 0.989148984125962, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8624934520691462, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3528497815132141, "eval_runtime": 16.8796, "eval_samples_per_second": 2.607, "eval_steps_per_second": 0.178, "step": 3840 }, { "epoch": 0.9894065750072447, "grad_norm": 0.1551213359199816, "learning_rate": 3.3990776303910456e-08, "loss": 0.3912, "step": 3841 }, { "epoch": 0.9896641658885276, "grad_norm": 0.15981647033788135, "learning_rate": 3.235308688068206e-08, "loss": 0.3977, "step": 3842 }, { "epoch": 0.9899217567698103, "grad_norm": 0.16522435580180106, "learning_rate": 3.075581700454633e-08, "loss": 0.2958, "step": 3843 }, { "epoch": 0.9901793476510932, "grad_norm": 0.23521488165578452, "learning_rate": 2.919896796755861e-08, "loss": 0.4202, "step": 3844 }, { "epoch": 0.9904369385323759, "grad_norm": 0.1904301992468953, "learning_rate": 2.768254102907819e-08, "loss": 0.4, "step": 3845 }, { "epoch": 0.9904369385323759, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.858302776322682, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35178443789482117, "eval_runtime": 17.4583, "eval_samples_per_second": 2.52, "eval_steps_per_second": 0.172, "step": 3845 }, { "epoch": 0.9906945294136588, "grad_norm": 0.1464762142939478, "learning_rate": 2.6206537415762733e-08, "loss": 0.3524, "step": 3846 }, { "epoch": 0.9909521202949415, "grad_norm": 0.16020884252536802, "learning_rate": 2.4770958321568283e-08, "loss": 0.4248, "step": 3847 }, { "epoch": 0.9912097111762244, "grad_norm": 0.11633653027179804, "learning_rate": 2.337580490776592e-08, "loss": 0.246, "step": 3848 }, { "epoch": 0.9914673020575072, "grad_norm": 0.14268793767622032, "learning_rate": 2.2021078302902897e-08, "loss": 0.339, "step": 3849 }, { "epoch": 0.99172489293879, "grad_norm": 0.1373486811631178, "learning_rate": 2.070677960284706e-08, "loss": 0.3918, "step": 3850 }, { "epoch": 0.99172489293879, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.859874279727606, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35293856263160706, "eval_runtime": 17.4584, "eval_samples_per_second": 2.52, "eval_steps_per_second": 0.172, "step": 3850 }, { "epoch": 0.9919824838200728, "grad_norm": 0.12419707771509048, "learning_rate": 1.9432909870747974e-08, "loss": 0.3071, "step": 3851 }, { "epoch": 0.9922400747013556, "grad_norm": 0.14396651708514002, "learning_rate": 1.819947013705914e-08, "loss": 0.3771, "step": 3852 }, { "epoch": 0.9924976655826384, "grad_norm": 0.16279186864950249, "learning_rate": 1.7006461399532436e-08, "loss": 0.3324, "step": 3853 }, { "epoch": 0.9927552564639212, "grad_norm": 0.14552583560564572, "learning_rate": 1.5853884623195925e-08, "loss": 0.306, "step": 3854 }, { "epoch": 0.993012847345204, "grad_norm": 0.14857715616726758, "learning_rate": 1.4741740740398246e-08, "loss": 0.3462, "step": 3855 }, { "epoch": 0.993012847345204, "eval_PRM Accuracy": 0.8113207547169812, "eval_PRM F1": 0.8780487804878049, "eval_PRM F1 AUC": 0.7380827658459927, "eval_PRM F1 AUC (fixed)": 0.8611838658983761, "eval_PRM F1 Neg": 0.5833333333333334, "eval_PRM NPV": 0.56, "eval_PRM Precision": 0.8888888888888888, "eval_PRM Recall": 0.8674698795180723, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35262784361839294, "eval_runtime": 16.7981, "eval_samples_per_second": 2.619, "eval_steps_per_second": 0.179, "step": 3855 }, { "epoch": 0.9932704382264868, "grad_norm": 0.11861395561824115, "learning_rate": 1.367003065076422e-08, "loss": 0.2956, "step": 3856 }, { "epoch": 0.9935280291077696, "grad_norm": 0.18274494107078726, "learning_rate": 1.2638755221217047e-08, "loss": 0.3989, "step": 3857 }, { "epoch": 0.9937856199890523, "grad_norm": 0.15911968143770888, "learning_rate": 1.1647915285967204e-08, "loss": 0.4393, "step": 3858 }, { "epoch": 0.9940432108703352, "grad_norm": 0.19947833891807695, "learning_rate": 1.069751164652355e-08, "loss": 0.4774, "step": 3859 }, { "epoch": 0.994300801751618, "grad_norm": 0.1792602435414376, "learning_rate": 9.787545071676674e-09, "loss": 0.4409, "step": 3860 }, { "epoch": 0.994300801751618, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.8596123624934521, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.3546697497367859, "eval_runtime": 16.8421, "eval_samples_per_second": 2.612, "eval_steps_per_second": 0.178, "step": 3860 }, { "epoch": 0.9945583926329008, "grad_norm": 0.16676315030772298, "learning_rate": 8.918016297515541e-09, "loss": 0.3873, "step": 3861 }, { "epoch": 0.9948159835141835, "grad_norm": 0.1537904133890653, "learning_rate": 8.088926027410848e-09, "loss": 0.3587, "step": 3862 }, { "epoch": 0.9950735743954664, "grad_norm": 0.14157889090639966, "learning_rate": 7.30027493203167e-09, "loss": 0.3607, "step": 3863 }, { "epoch": 0.9953311652767493, "grad_norm": 0.19332578555591137, "learning_rate": 6.552063649323259e-09, "loss": 0.4088, "step": 3864 }, { "epoch": 0.995588756158032, "grad_norm": 0.13129590984808737, "learning_rate": 5.844292784523697e-09, "loss": 0.3371, "step": 3865 }, { "epoch": 0.995588756158032, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.85751702462022, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35520240664482117, "eval_runtime": 17.1042, "eval_samples_per_second": 2.572, "eval_steps_per_second": 0.175, "step": 3865 }, { "epoch": 0.9958463470393148, "grad_norm": 0.1591974055243455, "learning_rate": 5.176962910163896e-09, "loss": 0.302, "step": 3866 }, { "epoch": 0.9961039379205976, "grad_norm": 0.13232354053669065, "learning_rate": 4.5500745660509435e-09, "loss": 0.2751, "step": 3867 }, { "epoch": 0.9963615288018804, "grad_norm": 0.19267965536010473, "learning_rate": 3.963628259290308e-09, "loss": 0.4389, "step": 3868 }, { "epoch": 0.9966191196831632, "grad_norm": 0.22194226750555665, "learning_rate": 3.4176244642636355e-09, "loss": 0.4047, "step": 3869 }, { "epoch": 0.996876710564446, "grad_norm": 0.1667614023688519, "learning_rate": 2.912063622639849e-09, "loss": 0.3986, "step": 3870 }, { "epoch": 0.996876710564446, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.8643268727082242, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35129615664482117, "eval_runtime": 16.8712, "eval_samples_per_second": 2.608, "eval_steps_per_second": 0.178, "step": 3870 }, { "epoch": 0.9971343014457288, "grad_norm": 0.1728700765894953, "learning_rate": 2.4469461433751507e-09, "loss": 0.3819, "step": 3871 }, { "epoch": 0.9973918923270116, "grad_norm": 0.21291593566328246, "learning_rate": 2.0222724027074703e-09, "loss": 0.3915, "step": 3872 }, { "epoch": 0.9976494832082944, "grad_norm": 0.1550645695952983, "learning_rate": 1.6380427441731184e-09, "loss": 0.3743, "step": 3873 }, { "epoch": 0.9979070740895772, "grad_norm": 0.166816058084006, "learning_rate": 1.2942574785623772e-09, "loss": 0.3438, "step": 3874 }, { "epoch": 0.99816466497086, "grad_norm": 0.18251919599287586, "learning_rate": 9.90916883986115e-10, "loss": 0.2944, "step": 3875 }, { "epoch": 0.99816466497086, "eval_PRM Accuracy": 0.8207547169811321, "eval_PRM F1": 0.8848484848484849, "eval_PRM F1 AUC": 0.7441068622315348, "eval_PRM F1 AUC (fixed)": 0.863017286537454, "eval_PRM F1 Neg": 0.5957446808510638, "eval_PRM NPV": 0.5833333333333334, "eval_PRM Precision": 0.8902439024390244, "eval_PRM Recall": 0.8795180722891566, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35129615664482117, "eval_runtime": 16.9038, "eval_samples_per_second": 2.603, "eval_steps_per_second": 0.177, "step": 3875 }, { "epoch": 0.9984222558521428, "grad_norm": 0.15290702113417942, "learning_rate": 7.280212058091706e-10, "loss": 0.2959, "step": 3876 }, { "epoch": 0.9986798467334257, "grad_norm": 0.14057128974127117, "learning_rate": 5.055706566947649e-10, "loss": 0.4001, "step": 3877 }, { "epoch": 0.9989374376147084, "grad_norm": 0.14824828438814447, "learning_rate": 3.2356541658784546e-10, "loss": 0.3468, "step": 3878 }, { "epoch": 0.9991950284959913, "grad_norm": 0.15676207191010466, "learning_rate": 1.8200563271508765e-10, "loss": 0.4174, "step": 3879 }, { "epoch": 0.999452619377274, "grad_norm": 0.13897661504636863, "learning_rate": 8.08914195793431e-11, "loss": 0.342, "step": 3880 }, { "epoch": 0.999452619377274, "eval_PRM Accuracy": 0.8301886792452831, "eval_PRM F1": 0.891566265060241, "eval_PRM F1 AUC": 0.7501309586170771, "eval_PRM F1 AUC (fixed)": 0.859088528025144, "eval_PRM F1 Neg": 0.6086956521739131, "eval_PRM NPV": 0.6086956521739131, "eval_PRM Precision": 0.891566265060241, "eval_PRM Recall": 0.891566265060241, "eval_PRM Specificty": 0.6086956521739131, "eval_loss": 0.35400390625, "eval_runtime": 17.0944, "eval_samples_per_second": 2.574, "eval_steps_per_second": 0.175, "step": 3880 }, { "epoch": 0.9997102102585569, "grad_norm": 0.18222748366726835, "learning_rate": 2.0222858987395398e-11, "loss": 0.2709, "step": 3881 }, { "epoch": 0.9999678011398396, "grad_norm": 0.175363916804034, "learning_rate": 0.0, "loss": 0.4232, "step": 3882 } ], "logging_steps": 1, "max_steps": 3882, "num_input_tokens_seen": 0, "num_train_epochs": 1, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 8470762821648384.0, "train_batch_size": 4, "trial_name": null, "trial_params": null }