{ "best_global_step": 6075, "best_metric": 0.01458834670484066, "best_model_checkpoint": "./models/autocrop-av-abm/checkpoint-6075", "epoch": 50.0, "eval_steps": 500, "global_step": 11250, "is_hyper_param_search": false, "is_local_process_zero": true, "is_world_process_zero": true, "log_history": [ { "epoch": 0.044444444444444446, "grad_norm": 3.5248303413391113, "learning_rate": 4.800000000000001e-07, "loss": 0.6824576377868652, "step": 10 }, { "epoch": 0.08888888888888889, "grad_norm": 3.914372444152832, "learning_rate": 1.0133333333333333e-06, "loss": 0.6767735958099366, "step": 20 }, { "epoch": 0.13333333333333333, "grad_norm": 4.649425029754639, "learning_rate": 1.5466666666666668e-06, "loss": 0.6572538375854492, "step": 30 }, { "epoch": 0.17777777777777778, "grad_norm": 4.037201404571533, "learning_rate": 2.08e-06, "loss": 0.646054744720459, "step": 40 }, { "epoch": 0.2222222222222222, "grad_norm": 3.690566062927246, "learning_rate": 2.6133333333333334e-06, "loss": 0.623114824295044, "step": 50 }, { "epoch": 0.26666666666666666, "grad_norm": 3.160806179046631, "learning_rate": 3.146666666666667e-06, "loss": 0.5923313617706298, "step": 60 }, { "epoch": 0.3111111111111111, "grad_norm": 3.562601089477539, "learning_rate": 3.68e-06, "loss": 0.5591856002807617, "step": 70 }, { "epoch": 0.35555555555555557, "grad_norm": 3.1448721885681152, "learning_rate": 4.213333333333333e-06, "loss": 0.5201993942260742, "step": 80 }, { "epoch": 0.4, "grad_norm": 2.812706232070923, "learning_rate": 4.746666666666666e-06, "loss": 0.490341329574585, "step": 90 }, { "epoch": 0.4444444444444444, "grad_norm": 2.539597511291504, "learning_rate": 5.279999999999999e-06, "loss": 0.45255489349365235, "step": 100 }, { "epoch": 0.4888888888888889, "grad_norm": 2.3462679386138916, "learning_rate": 5.813333333333333e-06, "loss": 0.4123825550079346, "step": 110 }, { "epoch": 0.5333333333333333, "grad_norm": 2.5169103145599365, "learning_rate": 6.346666666666666e-06, "loss": 0.38111062049865724, "step": 120 }, { "epoch": 0.5777777777777777, "grad_norm": 2.222943067550659, "learning_rate": 6.88e-06, "loss": 0.35951244831085205, "step": 130 }, { "epoch": 0.6222222222222222, "grad_norm": 1.8624954223632812, "learning_rate": 7.413333333333333e-06, "loss": 0.3284521341323853, "step": 140 }, { "epoch": 0.6666666666666666, "grad_norm": 1.7847062349319458, "learning_rate": 7.946666666666666e-06, "loss": 0.30641708374023435, "step": 150 }, { "epoch": 0.7111111111111111, "grad_norm": 2.247802495956421, "learning_rate": 8.48e-06, "loss": 0.289764928817749, "step": 160 }, { "epoch": 0.7555555555555555, "grad_norm": 1.7219352722167969, "learning_rate": 9.013333333333334e-06, "loss": 0.26606502532958987, "step": 170 }, { "epoch": 0.8, "grad_norm": 2.5160794258117676, "learning_rate": 9.546666666666668e-06, "loss": 0.256056022644043, "step": 180 }, { "epoch": 0.8444444444444444, "grad_norm": 1.9258393049240112, "learning_rate": 1.008e-05, "loss": 0.24313576221466066, "step": 190 }, { "epoch": 0.8888888888888888, "grad_norm": 1.749173879623413, "learning_rate": 1.0613333333333334e-05, "loss": 0.24803221225738525, "step": 200 }, { "epoch": 0.9333333333333333, "grad_norm": 1.7766447067260742, "learning_rate": 1.1146666666666666e-05, "loss": 0.23913590908050536, "step": 210 }, { "epoch": 0.9777777777777777, "grad_norm": 1.1860841512680054, "learning_rate": 1.168e-05, "loss": 0.19189679622650146, "step": 220 }, { "epoch": 1.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9859089194249521, "eval_iou_background": 0.0, "eval_iou_crop": 0.9859089194249521, "eval_loss": 0.1796150952577591, "eval_mean_accuracy": 0.9859089194249521, "eval_mean_iou": 0.49295445971247603, "eval_overall_accuracy": 0.9859089194249521, "eval_runtime": 5.2808, "eval_samples_per_second": 60.218, "eval_steps_per_second": 7.575, "step": 225 }, { "epoch": 1.0222222222222221, "grad_norm": 1.2548867464065552, "learning_rate": 1.2213333333333334e-05, "loss": 0.19185034036636353, "step": 230 }, { "epoch": 1.0666666666666667, "grad_norm": 1.051390528678894, "learning_rate": 1.2746666666666666e-05, "loss": 0.19758784770965576, "step": 240 }, { "epoch": 1.1111111111111112, "grad_norm": 1.718682885169983, "learning_rate": 1.328e-05, "loss": 0.18768845796585082, "step": 250 }, { "epoch": 1.1555555555555554, "grad_norm": 1.3972783088684082, "learning_rate": 1.3813333333333334e-05, "loss": 0.17185139656066895, "step": 260 }, { "epoch": 1.2, "grad_norm": 2.0489516258239746, "learning_rate": 1.4346666666666668e-05, "loss": 0.1998542070388794, "step": 270 }, { "epoch": 1.2444444444444445, "grad_norm": 1.3367419242858887, "learning_rate": 1.488e-05, "loss": 0.18080754280090333, "step": 280 }, { "epoch": 1.2888888888888888, "grad_norm": 1.0174310207366943, "learning_rate": 1.5413333333333334e-05, "loss": 0.17363922595977782, "step": 290 }, { "epoch": 1.3333333333333333, "grad_norm": 1.4421097040176392, "learning_rate": 1.5946666666666668e-05, "loss": 0.16403573751449585, "step": 300 }, { "epoch": 1.3777777777777778, "grad_norm": 1.3067890405654907, "learning_rate": 1.648e-05, "loss": 0.1602041482925415, "step": 310 }, { "epoch": 1.4222222222222223, "grad_norm": 0.889907717704773, "learning_rate": 1.7013333333333335e-05, "loss": 0.1635483980178833, "step": 320 }, { "epoch": 1.4666666666666668, "grad_norm": 0.8808795809745789, "learning_rate": 1.754666666666667e-05, "loss": 0.148528790473938, "step": 330 }, { "epoch": 1.511111111111111, "grad_norm": 1.3477909564971924, "learning_rate": 1.808e-05, "loss": 0.14744044542312623, "step": 340 }, { "epoch": 1.5555555555555556, "grad_norm": 1.1558278799057007, "learning_rate": 1.8613333333333334e-05, "loss": 0.12649898529052733, "step": 350 }, { "epoch": 1.6, "grad_norm": 1.1723448038101196, "learning_rate": 1.9146666666666667e-05, "loss": 0.14385347366333007, "step": 360 }, { "epoch": 1.6444444444444444, "grad_norm": 1.0262385606765747, "learning_rate": 1.968e-05, "loss": 0.1383821487426758, "step": 370 }, { "epoch": 1.6888888888888889, "grad_norm": 0.8583065271377563, "learning_rate": 2.0213333333333335e-05, "loss": 0.12373638153076172, "step": 380 }, { "epoch": 1.7333333333333334, "grad_norm": 0.7211213707923889, "learning_rate": 2.074666666666667e-05, "loss": 0.13567585945129396, "step": 390 }, { "epoch": 1.7777777777777777, "grad_norm": 1.1027973890304565, "learning_rate": 2.1280000000000003e-05, "loss": 0.13187665939331056, "step": 400 }, { "epoch": 1.8222222222222222, "grad_norm": 0.8209453225135803, "learning_rate": 2.1813333333333337e-05, "loss": 0.10841170549392701, "step": 410 }, { "epoch": 1.8666666666666667, "grad_norm": 1.130061149597168, "learning_rate": 2.2346666666666667e-05, "loss": 0.12105604410171508, "step": 420 }, { "epoch": 1.911111111111111, "grad_norm": 0.6629496216773987, "learning_rate": 2.288e-05, "loss": 0.1161539912223816, "step": 430 }, { "epoch": 1.9555555555555557, "grad_norm": 0.7081212997436523, "learning_rate": 2.3413333333333335e-05, "loss": 0.11264129877090454, "step": 440 }, { "epoch": 2.0, "grad_norm": 0.7436115741729736, "learning_rate": 2.394666666666667e-05, "loss": 0.10730005502700805, "step": 450 }, { "epoch": 2.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9790269683961709, "eval_iou_background": 0.0, "eval_iou_crop": 0.9790269683961709, "eval_loss": 0.10565543174743652, "eval_mean_accuracy": 0.9790269683961709, "eval_mean_iou": 0.48951348419808544, "eval_overall_accuracy": 0.9790269683961709, "eval_runtime": 4.8334, "eval_samples_per_second": 65.793, "eval_steps_per_second": 8.276, "step": 450 }, { "epoch": 2.0444444444444443, "grad_norm": 0.6431455016136169, "learning_rate": 2.448e-05, "loss": 0.10873520374298096, "step": 460 }, { "epoch": 2.088888888888889, "grad_norm": 0.8612810969352722, "learning_rate": 2.5013333333333333e-05, "loss": 0.1075707197189331, "step": 470 }, { "epoch": 2.1333333333333333, "grad_norm": 0.464311808347702, "learning_rate": 2.5546666666666667e-05, "loss": 0.10260558128356934, "step": 480 }, { "epoch": 2.1777777777777776, "grad_norm": 0.8125102519989014, "learning_rate": 2.608e-05, "loss": 0.0926192045211792, "step": 490 }, { "epoch": 2.2222222222222223, "grad_norm": 0.6775174140930176, "learning_rate": 2.661333333333333e-05, "loss": 0.09348201751708984, "step": 500 }, { "epoch": 2.2666666666666666, "grad_norm": 0.7547085881233215, "learning_rate": 2.7146666666666665e-05, "loss": 0.09200754165649414, "step": 510 }, { "epoch": 2.311111111111111, "grad_norm": 0.5086994767189026, "learning_rate": 2.768e-05, "loss": 0.08397443890571595, "step": 520 }, { "epoch": 2.3555555555555556, "grad_norm": 0.732149064540863, "learning_rate": 2.8213333333333333e-05, "loss": 0.09163645505905152, "step": 530 }, { "epoch": 2.4, "grad_norm": 0.6456112265586853, "learning_rate": 2.8746666666666667e-05, "loss": 0.08097342848777771, "step": 540 }, { "epoch": 2.4444444444444446, "grad_norm": 0.40750372409820557, "learning_rate": 2.928e-05, "loss": 0.08197349905967713, "step": 550 }, { "epoch": 2.488888888888889, "grad_norm": 0.8187499046325684, "learning_rate": 2.9813333333333335e-05, "loss": 0.07796886563301086, "step": 560 }, { "epoch": 2.533333333333333, "grad_norm": 0.9145808815956116, "learning_rate": 3.034666666666667e-05, "loss": 0.07138473987579345, "step": 570 }, { "epoch": 2.5777777777777775, "grad_norm": 0.536822497844696, "learning_rate": 3.088e-05, "loss": 0.07692977786064148, "step": 580 }, { "epoch": 2.6222222222222222, "grad_norm": 0.5678733587265015, "learning_rate": 3.141333333333333e-05, "loss": 0.06506951451301575, "step": 590 }, { "epoch": 2.6666666666666665, "grad_norm": 0.5523478388786316, "learning_rate": 3.194666666666667e-05, "loss": 0.07164572477340699, "step": 600 }, { "epoch": 2.7111111111111112, "grad_norm": 0.5508274435997009, "learning_rate": 3.248e-05, "loss": 0.06439810395240783, "step": 610 }, { "epoch": 2.7555555555555555, "grad_norm": 0.4774600863456726, "learning_rate": 3.301333333333333e-05, "loss": 0.06405921578407288, "step": 620 }, { "epoch": 2.8, "grad_norm": 0.3406943380832672, "learning_rate": 3.354666666666667e-05, "loss": 0.06375088691711425, "step": 630 }, { "epoch": 2.8444444444444446, "grad_norm": 0.6085440516471863, "learning_rate": 3.408e-05, "loss": 0.062880140542984, "step": 640 }, { "epoch": 2.888888888888889, "grad_norm": 0.6862090826034546, "learning_rate": 3.4613333333333336e-05, "loss": 0.06911001801490783, "step": 650 }, { "epoch": 2.9333333333333336, "grad_norm": 0.30844491720199585, "learning_rate": 3.514666666666667e-05, "loss": 0.06744029521942138, "step": 660 }, { "epoch": 2.977777777777778, "grad_norm": 0.4593600034713745, "learning_rate": 3.5680000000000004e-05, "loss": 0.05715551972389221, "step": 670 }, { "epoch": 3.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9706378957816592, "eval_iou_background": 0.0, "eval_iou_crop": 0.9706378957816592, "eval_loss": 0.04904763028025627, "eval_mean_accuracy": 0.9706378957816592, "eval_mean_iou": 0.4853189478908296, "eval_overall_accuracy": 0.9706378957816592, "eval_runtime": 4.0555, "eval_samples_per_second": 78.412, "eval_steps_per_second": 9.863, "step": 675 }, { "epoch": 3.022222222222222, "grad_norm": 14.09307861328125, "learning_rate": 3.6213333333333334e-05, "loss": 0.0580611526966095, "step": 680 }, { "epoch": 3.066666666666667, "grad_norm": 0.34167131781578064, "learning_rate": 3.674666666666667e-05, "loss": 0.0609450101852417, "step": 690 }, { "epoch": 3.111111111111111, "grad_norm": 0.44965633749961853, "learning_rate": 3.7279999999999995e-05, "loss": 0.05775919556617737, "step": 700 }, { "epoch": 3.1555555555555554, "grad_norm": 0.39594125747680664, "learning_rate": 3.781333333333333e-05, "loss": 0.05335736274719238, "step": 710 }, { "epoch": 3.2, "grad_norm": 0.3181576132774353, "learning_rate": 3.834666666666666e-05, "loss": 0.05584867000579834, "step": 720 }, { "epoch": 3.2444444444444445, "grad_norm": 0.37977147102355957, "learning_rate": 3.888e-05, "loss": 0.0503345787525177, "step": 730 }, { "epoch": 3.2888888888888888, "grad_norm": 0.37320592999458313, "learning_rate": 3.941333333333333e-05, "loss": 0.05368784666061401, "step": 740 }, { "epoch": 3.3333333333333335, "grad_norm": 0.646068274974823, "learning_rate": 3.994666666666667e-05, "loss": 0.052375185489654544, "step": 750 }, { "epoch": 3.3777777777777778, "grad_norm": 0.685707151889801, "learning_rate": 4.048e-05, "loss": 0.045791652798652646, "step": 760 }, { "epoch": 3.422222222222222, "grad_norm": 0.39380910992622375, "learning_rate": 4.1013333333333336e-05, "loss": 0.04926330149173737, "step": 770 }, { "epoch": 3.466666666666667, "grad_norm": 0.34124818444252014, "learning_rate": 4.1546666666666666e-05, "loss": 0.05358283519744873, "step": 780 }, { "epoch": 3.511111111111111, "grad_norm": 0.38596010208129883, "learning_rate": 4.2080000000000004e-05, "loss": 0.046906673908233644, "step": 790 }, { "epoch": 3.5555555555555554, "grad_norm": 0.4585939049720764, "learning_rate": 4.2613333333333334e-05, "loss": 0.0466411679983139, "step": 800 }, { "epoch": 3.6, "grad_norm": 1.472694993019104, "learning_rate": 4.314666666666667e-05, "loss": 0.050793427228927615, "step": 810 }, { "epoch": 3.6444444444444444, "grad_norm": 0.348598837852478, "learning_rate": 4.368e-05, "loss": 0.044522547721862794, "step": 820 }, { "epoch": 3.688888888888889, "grad_norm": 0.3608667254447937, "learning_rate": 4.421333333333334e-05, "loss": 0.05709003210067749, "step": 830 }, { "epoch": 3.7333333333333334, "grad_norm": 0.22636334598064423, "learning_rate": 4.474666666666667e-05, "loss": 0.044133943319320676, "step": 840 }, { "epoch": 3.7777777777777777, "grad_norm": 0.37805142998695374, "learning_rate": 4.528000000000001e-05, "loss": 0.05256962776184082, "step": 850 }, { "epoch": 3.822222222222222, "grad_norm": 0.2991584837436676, "learning_rate": 4.581333333333333e-05, "loss": 0.04162576198577881, "step": 860 }, { "epoch": 3.8666666666666667, "grad_norm": 0.8615538477897644, "learning_rate": 4.634666666666667e-05, "loss": 0.045782452821731566, "step": 870 }, { "epoch": 3.911111111111111, "grad_norm": 0.40110212564468384, "learning_rate": 4.688e-05, "loss": 0.03842214941978454, "step": 880 }, { "epoch": 3.9555555555555557, "grad_norm": 0.4481162428855896, "learning_rate": 4.7413333333333336e-05, "loss": 0.04109309017658234, "step": 890 }, { "epoch": 4.0, "grad_norm": 0.32728227972984314, "learning_rate": 4.7946666666666666e-05, "loss": 0.037542372941970825, "step": 900 }, { "epoch": 4.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9803799525469973, "eval_iou_background": 0.0, "eval_iou_crop": 0.9803799525469973, "eval_loss": 0.03712577000260353, "eval_mean_accuracy": 0.9803799525469973, "eval_mean_iou": 0.49018997627349864, "eval_overall_accuracy": 0.9803799525469973, "eval_runtime": 4.9063, "eval_samples_per_second": 64.815, "eval_steps_per_second": 8.153, "step": 900 }, { "epoch": 4.044444444444444, "grad_norm": 0.2824453115463257, "learning_rate": 4.8480000000000003e-05, "loss": 0.04001589417457581, "step": 910 }, { "epoch": 4.088888888888889, "grad_norm": 0.37437719106674194, "learning_rate": 4.9013333333333334e-05, "loss": 0.044075435400009154, "step": 920 }, { "epoch": 4.133333333333334, "grad_norm": 0.39725029468536377, "learning_rate": 4.954666666666667e-05, "loss": 0.04842301309108734, "step": 930 }, { "epoch": 4.177777777777778, "grad_norm": 0.3993479907512665, "learning_rate": 5.008e-05, "loss": 0.0406807541847229, "step": 940 }, { "epoch": 4.222222222222222, "grad_norm": 0.5353586077690125, "learning_rate": 5.061333333333333e-05, "loss": 0.04123523831367493, "step": 950 }, { "epoch": 4.266666666666667, "grad_norm": 2.142263650894165, "learning_rate": 5.114666666666667e-05, "loss": 0.03884044289588928, "step": 960 }, { "epoch": 4.311111111111111, "grad_norm": 1.3085217475891113, "learning_rate": 5.168e-05, "loss": 0.04114464521408081, "step": 970 }, { "epoch": 4.355555555555555, "grad_norm": 0.46703723073005676, "learning_rate": 5.221333333333334e-05, "loss": 0.037194561958312986, "step": 980 }, { "epoch": 4.4, "grad_norm": 0.25801995396614075, "learning_rate": 5.274666666666667e-05, "loss": 0.0392421692609787, "step": 990 }, { "epoch": 4.444444444444445, "grad_norm": 0.5428070425987244, "learning_rate": 5.3280000000000005e-05, "loss": 0.03741243183612823, "step": 1000 }, { "epoch": 4.488888888888889, "grad_norm": 0.3124564290046692, "learning_rate": 5.3813333333333335e-05, "loss": 0.03622358739376068, "step": 1010 }, { "epoch": 4.533333333333333, "grad_norm": 0.6635043025016785, "learning_rate": 5.4346666666666666e-05, "loss": 0.03287203907966614, "step": 1020 }, { "epoch": 4.5777777777777775, "grad_norm": 0.519015908241272, "learning_rate": 5.4879999999999996e-05, "loss": 0.040299683809280396, "step": 1030 }, { "epoch": 4.622222222222222, "grad_norm": 0.3608980178833008, "learning_rate": 5.5413333333333334e-05, "loss": 0.034294682741165164, "step": 1040 }, { "epoch": 4.666666666666667, "grad_norm": 0.41539570689201355, "learning_rate": 5.5946666666666664e-05, "loss": 0.045557767152786255, "step": 1050 }, { "epoch": 4.711111111111111, "grad_norm": 0.32102257013320923, "learning_rate": 5.648e-05, "loss": 0.03539595901966095, "step": 1060 }, { "epoch": 4.7555555555555555, "grad_norm": 0.24864570796489716, "learning_rate": 5.701333333333333e-05, "loss": 0.03778429627418518, "step": 1070 }, { "epoch": 4.8, "grad_norm": 0.5835459232330322, "learning_rate": 5.754666666666667e-05, "loss": 0.028651362657546996, "step": 1080 }, { "epoch": 4.844444444444444, "grad_norm": 0.3739009201526642, "learning_rate": 5.808e-05, "loss": 0.03362091183662415, "step": 1090 }, { "epoch": 4.888888888888889, "grad_norm": 0.6427468061447144, "learning_rate": 5.861333333333334e-05, "loss": 0.027434492111206056, "step": 1100 }, { "epoch": 4.933333333333334, "grad_norm": 0.9151515364646912, "learning_rate": 5.914666666666667e-05, "loss": 0.03355176448822021, "step": 1110 }, { "epoch": 4.977777777777778, "grad_norm": 0.40982338786125183, "learning_rate": 5.9680000000000005e-05, "loss": 0.043997785449028014, "step": 1120 }, { "epoch": 5.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9837152884462359, "eval_iou_background": 0.0, "eval_iou_crop": 0.9837152884462359, "eval_loss": 0.03160220757126808, "eval_mean_accuracy": 0.9837152884462359, "eval_mean_iou": 0.49185764422311795, "eval_overall_accuracy": 0.9837152884462359, "eval_runtime": 4.3051, "eval_samples_per_second": 73.866, "eval_steps_per_second": 9.291, "step": 1125 }, { "epoch": 5.022222222222222, "grad_norm": 0.5154401063919067, "learning_rate": 5.999997689420757e-05, "loss": 0.03167508244514465, "step": 1130 }, { "epoch": 5.066666666666666, "grad_norm": 0.28879672288894653, "learning_rate": 5.999971695445147e-05, "loss": 0.03561036586761475, "step": 1140 }, { "epoch": 5.111111111111111, "grad_norm": 0.41505226492881775, "learning_rate": 5.9999168195209624e-05, "loss": 0.03081900179386139, "step": 1150 }, { "epoch": 5.155555555555556, "grad_norm": 0.21958798170089722, "learning_rate": 5.999833062176514e-05, "loss": 0.0338530570268631, "step": 1160 }, { "epoch": 5.2, "grad_norm": 0.21357500553131104, "learning_rate": 5.99972042421817e-05, "loss": 0.03936813473701477, "step": 1170 }, { "epoch": 5.2444444444444445, "grad_norm": 0.2509428560733795, "learning_rate": 5.999578906730341e-05, "loss": 0.028076761960983278, "step": 1180 }, { "epoch": 5.288888888888889, "grad_norm": 0.8507352471351624, "learning_rate": 5.999408511075474e-05, "loss": 0.027349865436553954, "step": 1190 }, { "epoch": 5.333333333333333, "grad_norm": 0.5596743822097778, "learning_rate": 5.999209238894037e-05, "loss": 0.03489661514759064, "step": 1200 }, { "epoch": 5.377777777777778, "grad_norm": 0.6814782619476318, "learning_rate": 5.998981092104504e-05, "loss": 0.02936413586139679, "step": 1210 }, { "epoch": 5.4222222222222225, "grad_norm": 0.8596444129943848, "learning_rate": 5.998724072903338e-05, "loss": 0.03472908735275269, "step": 1220 }, { "epoch": 5.466666666666667, "grad_norm": 0.19605295360088348, "learning_rate": 5.998438183764966e-05, "loss": 0.02607877254486084, "step": 1230 }, { "epoch": 5.511111111111111, "grad_norm": 0.3320583999156952, "learning_rate": 5.998123427441761e-05, "loss": 0.03048555850982666, "step": 1240 }, { "epoch": 5.555555555555555, "grad_norm": 0.38816800713539124, "learning_rate": 5.9977798069640076e-05, "loss": 0.026038551330566408, "step": 1250 }, { "epoch": 5.6, "grad_norm": 0.3036852777004242, "learning_rate": 5.997407325639883e-05, "loss": 0.027465540170669555, "step": 1260 }, { "epoch": 5.644444444444445, "grad_norm": 0.6851722598075867, "learning_rate": 5.997005987055415e-05, "loss": 0.030760732293128968, "step": 1270 }, { "epoch": 5.688888888888889, "grad_norm": 0.33638131618499756, "learning_rate": 5.9965757950744525e-05, "loss": 0.028122958540916444, "step": 1280 }, { "epoch": 5.733333333333333, "grad_norm": 0.30311980843544006, "learning_rate": 5.9961167538386306e-05, "loss": 0.03382556736469269, "step": 1290 }, { "epoch": 5.777777777777778, "grad_norm": 0.31270864605903625, "learning_rate": 5.995628867767325e-05, "loss": 0.02801945209503174, "step": 1300 }, { "epoch": 5.822222222222222, "grad_norm": 0.3521674871444702, "learning_rate": 5.995112141557614e-05, "loss": 0.02482060045003891, "step": 1310 }, { "epoch": 5.866666666666667, "grad_norm": 0.7939164042472839, "learning_rate": 5.994566580184231e-05, "loss": 0.033414483070373535, "step": 1320 }, { "epoch": 5.911111111111111, "grad_norm": 0.15953071415424347, "learning_rate": 5.9939921888995186e-05, "loss": 0.030252185463905335, "step": 1330 }, { "epoch": 5.955555555555556, "grad_norm": 2.0538058280944824, "learning_rate": 5.993388973233373e-05, "loss": 0.038461548089981076, "step": 1340 }, { "epoch": 6.0, "grad_norm": 0.16759829223155975, "learning_rate": 5.992756938993198e-05, "loss": 0.022777898609638213, "step": 1350 }, { "epoch": 6.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9803476924758905, "eval_iou_background": 0.0, "eval_iou_crop": 0.9803476924758905, "eval_loss": 0.024956196546554565, "eval_mean_accuracy": 0.9803476924758905, "eval_mean_iou": 0.49017384623794524, "eval_overall_accuracy": 0.9803476924758905, "eval_runtime": 5.0098, "eval_samples_per_second": 63.476, "eval_steps_per_second": 7.984, "step": 1350 }, { "epoch": 6.044444444444444, "grad_norm": 0.19292712211608887, "learning_rate": 5.992096092263846e-05, "loss": 0.02220650464296341, "step": 1360 }, { "epoch": 6.088888888888889, "grad_norm": 0.1689830869436264, "learning_rate": 5.991406439407555e-05, "loss": 0.023907102644443512, "step": 1370 }, { "epoch": 6.133333333333334, "grad_norm": 0.5275858640670776, "learning_rate": 5.990687987063896e-05, "loss": 0.03326213359832764, "step": 1380 }, { "epoch": 6.177777777777778, "grad_norm": 0.2718386650085449, "learning_rate": 5.9899407421497e-05, "loss": 0.029743513464927672, "step": 1390 }, { "epoch": 6.222222222222222, "grad_norm": 0.17206081748008728, "learning_rate": 5.989164711859e-05, "loss": 0.028239110112190248, "step": 1400 }, { "epoch": 6.266666666666667, "grad_norm": 0.5629389882087708, "learning_rate": 5.9883599036629534e-05, "loss": 0.024127838015556336, "step": 1410 }, { "epoch": 6.311111111111111, "grad_norm": 0.12005782127380371, "learning_rate": 5.9875263253097786e-05, "loss": 0.028623118996620178, "step": 1420 }, { "epoch": 6.355555555555555, "grad_norm": 1.5187276601791382, "learning_rate": 5.9866639848246726e-05, "loss": 0.03739739954471588, "step": 1430 }, { "epoch": 6.4, "grad_norm": 0.605290412902832, "learning_rate": 5.985772890509737e-05, "loss": 0.023904742300510408, "step": 1440 }, { "epoch": 6.444444444444445, "grad_norm": 0.7090761065483093, "learning_rate": 5.984853050943901e-05, "loss": 0.029369419813156127, "step": 1450 }, { "epoch": 6.488888888888889, "grad_norm": 0.35442689061164856, "learning_rate": 5.9839044749828335e-05, "loss": 0.027673700451850893, "step": 1460 }, { "epoch": 6.533333333333333, "grad_norm": 0.12377811968326569, "learning_rate": 5.982927171758863e-05, "loss": 0.024320544302463533, "step": 1470 }, { "epoch": 6.5777777777777775, "grad_norm": 0.41834911704063416, "learning_rate": 5.981921150680884e-05, "loss": 0.027434533834457396, "step": 1480 }, { "epoch": 6.622222222222222, "grad_norm": 0.2632192373275757, "learning_rate": 5.980886421434271e-05, "loss": 0.023983579874038697, "step": 1490 }, { "epoch": 6.666666666666667, "grad_norm": 0.6196466088294983, "learning_rate": 5.979822993980784e-05, "loss": 0.02572091817855835, "step": 1500 }, { "epoch": 6.711111111111111, "grad_norm": 0.42908981442451477, "learning_rate": 5.978730878558472e-05, "loss": 0.022932884097099305, "step": 1510 }, { "epoch": 6.7555555555555555, "grad_norm": 1.2562302350997925, "learning_rate": 5.9776100856815736e-05, "loss": 0.024826666712760924, "step": 1520 }, { "epoch": 6.8, "grad_norm": 0.156297504901886, "learning_rate": 5.9764606261404197e-05, "loss": 0.020381520688533782, "step": 1530 }, { "epoch": 6.844444444444444, "grad_norm": 0.4894500970840454, "learning_rate": 5.975282511001325e-05, "loss": 0.02667376399040222, "step": 1540 }, { "epoch": 6.888888888888889, "grad_norm": 0.29653042554855347, "learning_rate": 5.974075751606482e-05, "loss": 0.0210765540599823, "step": 1550 }, { "epoch": 6.933333333333334, "grad_norm": 0.48105350136756897, "learning_rate": 5.972840359573856e-05, "loss": 0.021568430960178374, "step": 1560 }, { "epoch": 6.977777777777778, "grad_norm": 0.19659851491451263, "learning_rate": 5.9715763467970674e-05, "loss": 0.029361891746520995, "step": 1570 }, { "epoch": 7.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9745605911725351, "eval_iou_background": 0.0, "eval_iou_crop": 0.9745605911725351, "eval_loss": 0.02326256036758423, "eval_mean_accuracy": 0.9745605911725351, "eval_mean_iou": 0.48728029558626756, "eval_overall_accuracy": 0.9745605911725351, "eval_runtime": 4.9868, "eval_samples_per_second": 63.768, "eval_steps_per_second": 8.021, "step": 1575 }, { "epoch": 7.022222222222222, "grad_norm": 0.30831804871559143, "learning_rate": 5.970283725445283e-05, "loss": 0.021829694509506226, "step": 1580 }, { "epoch": 7.066666666666666, "grad_norm": 0.3810664117336273, "learning_rate": 5.968962507963095e-05, "loss": 0.023245696723461152, "step": 1590 }, { "epoch": 7.111111111111111, "grad_norm": 0.37900832295417786, "learning_rate": 5.967612707070401e-05, "loss": 0.019126971065998078, "step": 1600 }, { "epoch": 7.155555555555556, "grad_norm": 0.7442126870155334, "learning_rate": 5.966234335762284e-05, "loss": 0.028181317448616027, "step": 1610 }, { "epoch": 7.2, "grad_norm": 0.48315268754959106, "learning_rate": 5.964827407308885e-05, "loss": 0.028313300013542174, "step": 1620 }, { "epoch": 7.2444444444444445, "grad_norm": 0.5287045240402222, "learning_rate": 5.963391935255277e-05, "loss": 0.022829659283161163, "step": 1630 }, { "epoch": 7.288888888888889, "grad_norm": 0.22872966527938843, "learning_rate": 5.9619279334213346e-05, "loss": 0.028395310044288635, "step": 1640 }, { "epoch": 7.333333333333333, "grad_norm": 0.7591527700424194, "learning_rate": 5.960435415901598e-05, "loss": 0.02693500220775604, "step": 1650 }, { "epoch": 7.377777777777778, "grad_norm": 0.24480341374874115, "learning_rate": 5.958914397065142e-05, "loss": 0.022064709663391115, "step": 1660 }, { "epoch": 7.4222222222222225, "grad_norm": 0.10583412647247314, "learning_rate": 5.957364891555434e-05, "loss": 0.019875745475292205, "step": 1670 }, { "epoch": 7.466666666666667, "grad_norm": 0.19980314373970032, "learning_rate": 5.9557869142901935e-05, "loss": 0.017398793995380402, "step": 1680 }, { "epoch": 7.511111111111111, "grad_norm": 0.2687499523162842, "learning_rate": 5.9541804804612505e-05, "loss": 0.025153425335884095, "step": 1690 }, { "epoch": 7.555555555555555, "grad_norm": 0.6190925240516663, "learning_rate": 5.9525456055343965e-05, "loss": 0.02306385487318039, "step": 1700 }, { "epoch": 7.6, "grad_norm": 0.174056738615036, "learning_rate": 5.950882305249239e-05, "loss": 0.022678129374980927, "step": 1710 }, { "epoch": 7.644444444444445, "grad_norm": 0.1692689061164856, "learning_rate": 5.949190595619046e-05, "loss": 0.023095321655273438, "step": 1720 }, { "epoch": 7.688888888888889, "grad_norm": 0.1307246834039688, "learning_rate": 5.947470492930596e-05, "loss": 0.018887031078338622, "step": 1730 }, { "epoch": 7.733333333333333, "grad_norm": 0.29090988636016846, "learning_rate": 5.945722013744016e-05, "loss": 0.030557361245155335, "step": 1740 }, { "epoch": 7.777777777777778, "grad_norm": 0.213711678981781, "learning_rate": 5.943945174892627e-05, "loss": 0.02240873724222183, "step": 1750 }, { "epoch": 7.822222222222222, "grad_norm": 0.480829119682312, "learning_rate": 5.942139993482781e-05, "loss": 0.026100322604179382, "step": 1760 }, { "epoch": 7.866666666666667, "grad_norm": 0.1798330694437027, "learning_rate": 5.940306486893694e-05, "loss": 0.02332938462495804, "step": 1770 }, { "epoch": 7.911111111111111, "grad_norm": 0.484030157327652, "learning_rate": 5.938444672777279e-05, "loss": 0.02182285636663437, "step": 1780 }, { "epoch": 7.955555555555556, "grad_norm": 0.4164707362651825, "learning_rate": 5.9365545690579784e-05, "loss": 0.026998502016067506, "step": 1790 }, { "epoch": 8.0, "grad_norm": 0.512827455997467, "learning_rate": 5.934636193932592e-05, "loss": 0.021303069591522217, "step": 1800 }, { "epoch": 8.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9862792370358542, "eval_iou_background": 0.0, "eval_iou_crop": 0.9862792370358542, "eval_loss": 0.02089126780629158, "eval_mean_accuracy": 0.9862792370358542, "eval_mean_iou": 0.4931396185179271, "eval_overall_accuracy": 0.9862792370358542, "eval_runtime": 4.3873, "eval_samples_per_second": 72.483, "eval_steps_per_second": 9.117, "step": 1800 }, { "epoch": 8.044444444444444, "grad_norm": 0.3750280439853668, "learning_rate": 5.932689565870096e-05, "loss": 0.02774544060230255, "step": 1810 }, { "epoch": 8.088888888888889, "grad_norm": 0.09331250190734863, "learning_rate": 5.9307147036114715e-05, "loss": 0.018551455438137056, "step": 1820 }, { "epoch": 8.133333333333333, "grad_norm": 0.2520679235458374, "learning_rate": 5.928711626169522e-05, "loss": 0.02102348506450653, "step": 1830 }, { "epoch": 8.177777777777777, "grad_norm": 0.22293546795845032, "learning_rate": 5.926680352828688e-05, "loss": 0.021540656685829163, "step": 1840 }, { "epoch": 8.222222222222221, "grad_norm": 0.3365994393825531, "learning_rate": 5.924620903144866e-05, "loss": 0.01952708214521408, "step": 1850 }, { "epoch": 8.266666666666667, "grad_norm": 0.178181454539299, "learning_rate": 5.922533296945217e-05, "loss": 0.01960945427417755, "step": 1860 }, { "epoch": 8.311111111111112, "grad_norm": 0.7973014712333679, "learning_rate": 5.920417554327973e-05, "loss": 0.023567810654640198, "step": 1870 }, { "epoch": 8.355555555555556, "grad_norm": 0.2192898988723755, "learning_rate": 5.918273695662252e-05, "loss": 0.020967347919940947, "step": 1880 }, { "epoch": 8.4, "grad_norm": 0.4955143630504608, "learning_rate": 5.916101741587852e-05, "loss": 0.022594356536865236, "step": 1890 }, { "epoch": 8.444444444444445, "grad_norm": 0.1294562667608261, "learning_rate": 5.91390171301506e-05, "loss": 0.020742426812648772, "step": 1900 }, { "epoch": 8.488888888888889, "grad_norm": 1.841516375541687, "learning_rate": 5.911673631124446e-05, "loss": 0.02064659893512726, "step": 1910 }, { "epoch": 8.533333333333333, "grad_norm": 0.3090057373046875, "learning_rate": 5.909417517366662e-05, "loss": 0.0244680181145668, "step": 1920 }, { "epoch": 8.577777777777778, "grad_norm": 0.24640917778015137, "learning_rate": 5.907133393462233e-05, "loss": 0.02893313765525818, "step": 1930 }, { "epoch": 8.622222222222222, "grad_norm": 0.37263238430023193, "learning_rate": 5.904821281401349e-05, "loss": 0.02242177277803421, "step": 1940 }, { "epoch": 8.666666666666666, "grad_norm": 0.22164225578308105, "learning_rate": 5.902481203443655e-05, "loss": 0.022078101336956025, "step": 1950 }, { "epoch": 8.71111111111111, "grad_norm": 0.7043717503547668, "learning_rate": 5.900113182118033e-05, "loss": 0.027357828617095948, "step": 1960 }, { "epoch": 8.755555555555556, "grad_norm": 0.17114096879959106, "learning_rate": 5.8977172402223887e-05, "loss": 0.02590107321739197, "step": 1970 }, { "epoch": 8.8, "grad_norm": 0.2260318547487259, "learning_rate": 5.89529340082343e-05, "loss": 0.022403007745742796, "step": 1980 }, { "epoch": 8.844444444444445, "grad_norm": 0.22599756717681885, "learning_rate": 5.892841687256444e-05, "loss": 0.01884809285402298, "step": 1990 }, { "epoch": 8.88888888888889, "grad_norm": 0.09801608324050903, "learning_rate": 5.890362123125077e-05, "loss": 0.01886136084794998, "step": 2000 }, { "epoch": 8.933333333333334, "grad_norm": 0.3745884895324707, "learning_rate": 5.887854732301101e-05, "loss": 0.02581452429294586, "step": 2010 }, { "epoch": 8.977777777777778, "grad_norm": 0.1903250515460968, "learning_rate": 5.885319538924189e-05, "loss": 0.021467125415802, "step": 2020 }, { "epoch": 9.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9880881168493166, "eval_iou_background": 0.0, "eval_iou_crop": 0.9880881168493166, "eval_loss": 0.022039713338017464, "eval_mean_accuracy": 0.9880881168493166, "eval_mean_iou": 0.4940440584246583, "eval_overall_accuracy": 0.9880881168493166, "eval_runtime": 4.9326, "eval_samples_per_second": 64.469, "eval_steps_per_second": 8.109, "step": 2025 }, { "epoch": 9.022222222222222, "grad_norm": 0.29114872217178345, "learning_rate": 5.882756567401678e-05, "loss": 0.02046652287244797, "step": 2030 }, { "epoch": 9.066666666666666, "grad_norm": 0.36242613196372986, "learning_rate": 5.88016584240834e-05, "loss": 0.020714859664440154, "step": 2040 }, { "epoch": 9.11111111111111, "grad_norm": 0.24400602281093597, "learning_rate": 5.877547388886138e-05, "loss": 0.015958608686923982, "step": 2050 }, { "epoch": 9.155555555555555, "grad_norm": 0.20057950913906097, "learning_rate": 5.874901232043988e-05, "loss": 0.020959481596946716, "step": 2060 }, { "epoch": 9.2, "grad_norm": 0.37113210558891296, "learning_rate": 5.872227397357522e-05, "loss": 0.018901588022708894, "step": 2070 }, { "epoch": 9.244444444444444, "grad_norm": 0.2561708092689514, "learning_rate": 5.8695259105688334e-05, "loss": 0.027983573079109193, "step": 2080 }, { "epoch": 9.28888888888889, "grad_norm": 0.28498613834381104, "learning_rate": 5.8667967976862354e-05, "loss": 0.027293893694877624, "step": 2090 }, { "epoch": 9.333333333333334, "grad_norm": 0.1498035043478012, "learning_rate": 5.8640400849840084e-05, "loss": 0.0197441428899765, "step": 2100 }, { "epoch": 9.377777777777778, "grad_norm": 0.2116042822599411, "learning_rate": 5.8612557990021485e-05, "loss": 0.018968820571899414, "step": 2110 }, { "epoch": 9.422222222222222, "grad_norm": 0.10620342195034027, "learning_rate": 5.858443966546108e-05, "loss": 0.019327281415462493, "step": 2120 }, { "epoch": 9.466666666666667, "grad_norm": 0.39922022819519043, "learning_rate": 5.855604614686544e-05, "loss": 0.019729509949684143, "step": 2130 }, { "epoch": 9.511111111111111, "grad_norm": 0.37401795387268066, "learning_rate": 5.852737770759053e-05, "loss": 0.017794091999530793, "step": 2140 }, { "epoch": 9.555555555555555, "grad_norm": 0.15316298604011536, "learning_rate": 5.8498434623639075e-05, "loss": 0.016887250542640685, "step": 2150 }, { "epoch": 9.6, "grad_norm": 0.41028714179992676, "learning_rate": 5.8469217173657915e-05, "loss": 0.022824101150035858, "step": 2160 }, { "epoch": 9.644444444444444, "grad_norm": 1.0843021869659424, "learning_rate": 5.843972563893535e-05, "loss": 0.022220319509506224, "step": 2170 }, { "epoch": 9.688888888888888, "grad_norm": 0.27494609355926514, "learning_rate": 5.840996030339838e-05, "loss": 0.021847550570964814, "step": 2180 }, { "epoch": 9.733333333333333, "grad_norm": 0.17890681326389313, "learning_rate": 5.837992145361001e-05, "loss": 0.01540495753288269, "step": 2190 }, { "epoch": 9.777777777777779, "grad_norm": 1.7246273756027222, "learning_rate": 5.8349609378766475e-05, "loss": 0.021896225214004517, "step": 2200 }, { "epoch": 9.822222222222223, "grad_norm": 0.26342257857322693, "learning_rate": 5.8319024370694456e-05, "loss": 0.017678411304950715, "step": 2210 }, { "epoch": 9.866666666666667, "grad_norm": 0.16534309089183807, "learning_rate": 5.828816672384827e-05, "loss": 0.023056669533252715, "step": 2220 }, { "epoch": 9.911111111111111, "grad_norm": 0.44752565026283264, "learning_rate": 5.8257036735307045e-05, "loss": 0.01582224667072296, "step": 2230 }, { "epoch": 9.955555555555556, "grad_norm": 2.0666565895080566, "learning_rate": 5.822563470477185e-05, "loss": 0.021694257855415344, "step": 2240 }, { "epoch": 10.0, "grad_norm": 0.23703497648239136, "learning_rate": 5.819396093456282e-05, "loss": 0.01860710084438324, "step": 2250 }, { "epoch": 10.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9848576935018577, "eval_iou_background": 0.0, "eval_iou_crop": 0.9848576935018577, "eval_loss": 0.0180215984582901, "eval_mean_accuracy": 0.9848576935018577, "eval_mean_iou": 0.49242884675092885, "eval_overall_accuracy": 0.9848576935018577, "eval_runtime": 4.9586, "eval_samples_per_second": 64.131, "eval_steps_per_second": 8.067, "step": 2250 }, { "epoch": 10.044444444444444, "grad_norm": 0.39713430404663086, "learning_rate": 5.816201572961623e-05, "loss": 0.018186010420322418, "step": 2260 }, { "epoch": 10.088888888888889, "grad_norm": 0.39852485060691833, "learning_rate": 5.812979939748156e-05, "loss": 0.01676541566848755, "step": 2270 }, { "epoch": 10.133333333333333, "grad_norm": 0.23559890687465668, "learning_rate": 5.809731224831857e-05, "loss": 0.017047233879566193, "step": 2280 }, { "epoch": 10.177777777777777, "grad_norm": 1.0538610219955444, "learning_rate": 5.806455459489426e-05, "loss": 0.02245011627674103, "step": 2290 }, { "epoch": 10.222222222222221, "grad_norm": 0.24289731681346893, "learning_rate": 5.803152675257989e-05, "loss": 0.017808344960212708, "step": 2300 }, { "epoch": 10.266666666666667, "grad_norm": 0.10697416961193085, "learning_rate": 5.799822903934794e-05, "loss": 0.024378865957260132, "step": 2310 }, { "epoch": 10.311111111111112, "grad_norm": 0.6996863484382629, "learning_rate": 5.796466177576906e-05, "loss": 0.026009055972099304, "step": 2320 }, { "epoch": 10.355555555555556, "grad_norm": 0.4658281207084656, "learning_rate": 5.793082528500895e-05, "loss": 0.021320921182632447, "step": 2330 }, { "epoch": 10.4, "grad_norm": 0.4343336522579193, "learning_rate": 5.789671989282528e-05, "loss": 0.020815525949001313, "step": 2340 }, { "epoch": 10.444444444444445, "grad_norm": 0.16455000638961792, "learning_rate": 5.786234592756454e-05, "loss": 0.02079024165868759, "step": 2350 }, { "epoch": 10.488888888888889, "grad_norm": 0.3502999544143677, "learning_rate": 5.782770372015889e-05, "loss": 0.019926668703556062, "step": 2360 }, { "epoch": 10.533333333333333, "grad_norm": 0.3744206428527832, "learning_rate": 5.779279360412295e-05, "loss": 0.018947923183441163, "step": 2370 }, { "epoch": 10.577777777777778, "grad_norm": 0.3867523968219757, "learning_rate": 5.7757615915550633e-05, "loss": 0.019462314248085023, "step": 2380 }, { "epoch": 10.622222222222222, "grad_norm": 0.15724360942840576, "learning_rate": 5.772217099311185e-05, "loss": 0.015563493967056275, "step": 2390 }, { "epoch": 10.666666666666666, "grad_norm": 1.2062114477157593, "learning_rate": 5.7686459178049306e-05, "loss": 0.01959804743528366, "step": 2400 }, { "epoch": 10.71111111111111, "grad_norm": 0.10765093564987183, "learning_rate": 5.7650480814175176e-05, "loss": 0.018212300539016724, "step": 2410 }, { "epoch": 10.755555555555556, "grad_norm": 0.18617188930511475, "learning_rate": 5.7614236247867814e-05, "loss": 0.01866161972284317, "step": 2420 }, { "epoch": 10.8, "grad_norm": 0.17051208019256592, "learning_rate": 5.757772582806842e-05, "loss": 0.02406514883041382, "step": 2430 }, { "epoch": 10.844444444444445, "grad_norm": 0.7377229332923889, "learning_rate": 5.754094990627764e-05, "loss": 0.0193157821893692, "step": 2440 }, { "epoch": 10.88888888888889, "grad_norm": 0.16451075673103333, "learning_rate": 5.7503908836552275e-05, "loss": 0.020191529393196107, "step": 2450 }, { "epoch": 10.933333333333334, "grad_norm": 0.589508593082428, "learning_rate": 5.7466602975501765e-05, "loss": 0.01552746444940567, "step": 2460 }, { "epoch": 10.977777777777778, "grad_norm": 0.20275713503360748, "learning_rate": 5.742903268228481e-05, "loss": 0.019462943077087402, "step": 2470 }, { "epoch": 11.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9854695577219651, "eval_iou_background": 0.0, "eval_iou_crop": 0.9854695577219651, "eval_loss": 0.018634160980582237, "eval_mean_accuracy": 0.9854695577219651, "eval_mean_iou": 0.49273477886098255, "eval_overall_accuracy": 0.9854695577219651, "eval_runtime": 4.0886, "eval_samples_per_second": 77.778, "eval_steps_per_second": 9.783, "step": 2475 }, { "epoch": 11.022222222222222, "grad_norm": 0.22702719271183014, "learning_rate": 5.7391198318605936e-05, "loss": 0.021507586538791656, "step": 2480 }, { "epoch": 11.066666666666666, "grad_norm": 0.15014351904392242, "learning_rate": 5.735310024871194e-05, "loss": 0.01483003944158554, "step": 2490 }, { "epoch": 11.11111111111111, "grad_norm": 0.1705402284860611, "learning_rate": 5.731473883938846e-05, "loss": 0.018740904331207276, "step": 2500 }, { "epoch": 11.155555555555555, "grad_norm": 0.23914994299411774, "learning_rate": 5.72761144599564e-05, "loss": 0.019413051009178162, "step": 2510 }, { "epoch": 11.2, "grad_norm": 0.1302383542060852, "learning_rate": 5.723722748226836e-05, "loss": 0.01516767293214798, "step": 2520 }, { "epoch": 11.244444444444444, "grad_norm": 0.41887909173965454, "learning_rate": 5.719807828070514e-05, "loss": 0.016580724716186525, "step": 2530 }, { "epoch": 11.28888888888889, "grad_norm": 0.4549539387226105, "learning_rate": 5.7158667232172004e-05, "loss": 0.01691744029521942, "step": 2540 }, { "epoch": 11.333333333333334, "grad_norm": 0.2458135187625885, "learning_rate": 5.711899471609517e-05, "loss": 0.02118345946073532, "step": 2550 }, { "epoch": 11.377777777777778, "grad_norm": 0.22240404784679413, "learning_rate": 5.70790611144181e-05, "loss": 0.02034774571657181, "step": 2560 }, { "epoch": 11.422222222222222, "grad_norm": 0.22506876289844513, "learning_rate": 5.7038866811597826e-05, "loss": 0.019588840007781983, "step": 2570 }, { "epoch": 11.466666666666667, "grad_norm": 0.5556941032409668, "learning_rate": 5.699841219460127e-05, "loss": 0.02597571015357971, "step": 2580 }, { "epoch": 11.511111111111111, "grad_norm": 0.2758418619632721, "learning_rate": 5.695769765290148e-05, "loss": 0.015017086267471313, "step": 2590 }, { "epoch": 11.555555555555555, "grad_norm": 0.8639801144599915, "learning_rate": 5.6916723578473955e-05, "loss": 0.0170652836561203, "step": 2600 }, { "epoch": 11.6, "grad_norm": 0.22511881589889526, "learning_rate": 5.687549036579275e-05, "loss": 0.016348060965538026, "step": 2610 }, { "epoch": 11.644444444444444, "grad_norm": 0.3932984471321106, "learning_rate": 5.6833998411826795e-05, "loss": 0.01571182757616043, "step": 2620 }, { "epoch": 11.688888888888888, "grad_norm": 0.8065228462219238, "learning_rate": 5.679224811603603e-05, "loss": 0.022435690462589263, "step": 2630 }, { "epoch": 11.733333333333333, "grad_norm": 0.24713853001594543, "learning_rate": 5.675023988036754e-05, "loss": 0.023287481069564818, "step": 2640 }, { "epoch": 11.777777777777779, "grad_norm": 0.2708222270011902, "learning_rate": 5.670797410925171e-05, "loss": 0.022461412847042082, "step": 2650 }, { "epoch": 11.822222222222223, "grad_norm": 0.44739246368408203, "learning_rate": 5.666545120959831e-05, "loss": 0.01553283929824829, "step": 2660 }, { "epoch": 11.866666666666667, "grad_norm": 0.45830896496772766, "learning_rate": 5.662267159079262e-05, "loss": 0.01808589994907379, "step": 2670 }, { "epoch": 11.911111111111111, "grad_norm": 0.2438342273235321, "learning_rate": 5.6579635664691445e-05, "loss": 0.015603311359882355, "step": 2680 }, { "epoch": 11.955555555555556, "grad_norm": 0.29044410586357117, "learning_rate": 5.653634384561914e-05, "loss": 0.016543711721897125, "step": 2690 }, { "epoch": 12.0, "grad_norm": 0.3219044506549835, "learning_rate": 5.649279655036368e-05, "loss": 0.013632658123970031, "step": 2700 }, { "epoch": 12.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.983479450630916, "eval_iou_background": 0.0, "eval_iou_crop": 0.983479450630916, "eval_loss": 0.017393598333001137, "eval_mean_accuracy": 0.983479450630916, "eval_mean_iou": 0.491739725315458, "eval_overall_accuracy": 0.983479450630916, "eval_runtime": 5.0032, "eval_samples_per_second": 63.56, "eval_steps_per_second": 7.995, "step": 2700 }, { "epoch": 12.044444444444444, "grad_norm": 0.6327373385429382, "learning_rate": 5.6448994198172606e-05, "loss": 0.01692250221967697, "step": 2710 }, { "epoch": 12.088888888888889, "grad_norm": 0.30729398131370544, "learning_rate": 5.6404937210748994e-05, "loss": 0.014396494626998902, "step": 2720 }, { "epoch": 12.133333333333333, "grad_norm": 0.33513402938842773, "learning_rate": 5.636062601224737e-05, "loss": 0.015194615721702576, "step": 2730 }, { "epoch": 12.177777777777777, "grad_norm": 1.0292479991912842, "learning_rate": 5.631606102926971e-05, "loss": 0.019913801550865175, "step": 2740 }, { "epoch": 12.222222222222221, "grad_norm": 0.7539405822753906, "learning_rate": 5.6271242690861226e-05, "loss": 0.019662556052207947, "step": 2750 }, { "epoch": 12.266666666666667, "grad_norm": 0.369282066822052, "learning_rate": 5.622617142850631e-05, "loss": 0.019444176554679872, "step": 2760 }, { "epoch": 12.311111111111112, "grad_norm": 4.0517497062683105, "learning_rate": 5.618084767612434e-05, "loss": 0.01853087991476059, "step": 2770 }, { "epoch": 12.355555555555556, "grad_norm": 0.35096538066864014, "learning_rate": 5.613527187006555e-05, "loss": 0.020319417119026184, "step": 2780 }, { "epoch": 12.4, "grad_norm": 0.538619339466095, "learning_rate": 5.608944444910674e-05, "loss": 0.014907598495483398, "step": 2790 }, { "epoch": 12.444444444444445, "grad_norm": 0.3902283310890198, "learning_rate": 5.604336585444718e-05, "loss": 0.014838707447052003, "step": 2800 }, { "epoch": 12.488888888888889, "grad_norm": 0.520384669303894, "learning_rate": 5.599703652970423e-05, "loss": 0.01920664757490158, "step": 2810 }, { "epoch": 12.533333333333333, "grad_norm": 0.12784866988658905, "learning_rate": 5.5950456920909174e-05, "loss": 0.01594909280538559, "step": 2820 }, { "epoch": 12.577777777777778, "grad_norm": 0.25229910016059875, "learning_rate": 5.5903627476502855e-05, "loss": 0.019417032599449158, "step": 2830 }, { "epoch": 12.622222222222222, "grad_norm": 0.441182941198349, "learning_rate": 5.585654864733141e-05, "loss": 0.020194678008556365, "step": 2840 }, { "epoch": 12.666666666666666, "grad_norm": 0.6845587491989136, "learning_rate": 5.580922088664188e-05, "loss": 0.016160233318805693, "step": 2850 }, { "epoch": 12.71111111111111, "grad_norm": 0.3858337998390198, "learning_rate": 5.576164465007786e-05, "loss": 0.02434242218732834, "step": 2860 }, { "epoch": 12.755555555555556, "grad_norm": 0.18722186982631683, "learning_rate": 5.571382039567517e-05, "loss": 0.01821141690015793, "step": 2870 }, { "epoch": 12.8, "grad_norm": 0.19352248311042786, "learning_rate": 5.566574858385737e-05, "loss": 0.015436571836471558, "step": 2880 }, { "epoch": 12.844444444444445, "grad_norm": 0.22652943432331085, "learning_rate": 5.561742967743135e-05, "loss": 0.019451597332954408, "step": 2890 }, { "epoch": 12.88888888888889, "grad_norm": 0.24467973411083221, "learning_rate": 5.55688641415829e-05, "loss": 0.02115028500556946, "step": 2900 }, { "epoch": 12.933333333333334, "grad_norm": 0.20933757722377777, "learning_rate": 5.5520052443872186e-05, "loss": 0.01737414002418518, "step": 2910 }, { "epoch": 12.977777777777778, "grad_norm": 0.21362937986850739, "learning_rate": 5.547099505422931e-05, "loss": 0.0196531280875206, "step": 2920 }, { "epoch": 13.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9898356002002386, "eval_iou_background": 0.0, "eval_iou_crop": 0.9898356002002386, "eval_loss": 0.018248561769723892, "eval_mean_accuracy": 0.9898356002002386, "eval_mean_iou": 0.4949178001001193, "eval_overall_accuracy": 0.9898356002002386, "eval_runtime": 4.4802, "eval_samples_per_second": 70.978, "eval_steps_per_second": 8.928, "step": 2925 }, { "epoch": 13.022222222222222, "grad_norm": 0.5187875032424927, "learning_rate": 5.5421692444949704e-05, "loss": 0.017868484556674957, "step": 2930 }, { "epoch": 13.066666666666666, "grad_norm": 0.666745662689209, "learning_rate": 5.5372145090689684e-05, "loss": 0.02043323814868927, "step": 2940 }, { "epoch": 13.11111111111111, "grad_norm": 0.24603652954101562, "learning_rate": 5.532235346846177e-05, "loss": 0.017392222583293915, "step": 2950 }, { "epoch": 13.155555555555555, "grad_norm": 0.1025647222995758, "learning_rate": 5.5272318057630196e-05, "loss": 0.017882135510444642, "step": 2960 }, { "epoch": 13.2, "grad_norm": 0.13730789721012115, "learning_rate": 5.5222039339906205e-05, "loss": 0.016534918546676637, "step": 2970 }, { "epoch": 13.244444444444444, "grad_norm": 0.10700178891420364, "learning_rate": 5.51715177993435e-05, "loss": 0.014750665426254273, "step": 2980 }, { "epoch": 13.28888888888889, "grad_norm": 0.40602031350135803, "learning_rate": 5.5120753922333506e-05, "loss": 0.020720386505126955, "step": 2990 }, { "epoch": 13.333333333333334, "grad_norm": 0.5984240174293518, "learning_rate": 5.5069748197600735e-05, "loss": 0.018232697248458864, "step": 3000 }, { "epoch": 13.377777777777778, "grad_norm": 0.49178346991539, "learning_rate": 5.501850111619805e-05, "loss": 0.015743085741996767, "step": 3010 }, { "epoch": 13.422222222222222, "grad_norm": 0.20866259932518005, "learning_rate": 5.496701317150196e-05, "loss": 0.015244263410568237, "step": 3020 }, { "epoch": 13.466666666666667, "grad_norm": 0.3186033070087433, "learning_rate": 5.491528485920788e-05, "loss": 0.014633914828300476, "step": 3030 }, { "epoch": 13.511111111111111, "grad_norm": 0.31360217928886414, "learning_rate": 5.486331667732532e-05, "loss": 0.020519538223743437, "step": 3040 }, { "epoch": 13.555555555555555, "grad_norm": 0.3415757119655609, "learning_rate": 5.481110912617311e-05, "loss": 0.020377354323863985, "step": 3050 }, { "epoch": 13.6, "grad_norm": 0.43776458501815796, "learning_rate": 5.475866270837461e-05, "loss": 0.01740396022796631, "step": 3060 }, { "epoch": 13.644444444444444, "grad_norm": 0.3046082854270935, "learning_rate": 5.4705977928852825e-05, "loss": 0.018137095868587493, "step": 3070 }, { "epoch": 13.688888888888888, "grad_norm": 0.12367811053991318, "learning_rate": 5.465305529482557e-05, "loss": 0.01658170223236084, "step": 3080 }, { "epoch": 13.733333333333333, "grad_norm": 0.29606443643569946, "learning_rate": 5.459989531580058e-05, "loss": 0.016600155830383302, "step": 3090 }, { "epoch": 13.777777777777779, "grad_norm": 0.2304660528898239, "learning_rate": 5.4546498503570626e-05, "loss": 0.016639120876789093, "step": 3100 }, { "epoch": 13.822222222222223, "grad_norm": 0.24718496203422546, "learning_rate": 5.449286537220853e-05, "loss": 0.020870281755924223, "step": 3110 }, { "epoch": 13.866666666666667, "grad_norm": 0.4153110086917877, "learning_rate": 5.443899643806229e-05, "loss": 0.016263550519943236, "step": 3120 }, { "epoch": 13.911111111111111, "grad_norm": 0.3598655164241791, "learning_rate": 5.4384892219750074e-05, "loss": 0.014671218395233155, "step": 3130 }, { "epoch": 13.955555555555556, "grad_norm": 0.24351271986961365, "learning_rate": 5.4330553238155195e-05, "loss": 0.016386467218399047, "step": 3140 }, { "epoch": 14.0, "grad_norm": 0.4209583103656769, "learning_rate": 5.427598001642115e-05, "loss": 0.014098793268203735, "step": 3150 }, { "epoch": 14.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9861287079895378, "eval_iou_background": 0.0, "eval_iou_crop": 0.9861287079895378, "eval_loss": 0.01644517481327057, "eval_mean_accuracy": 0.9861287079895378, "eval_mean_iou": 0.4930643539947689, "eval_overall_accuracy": 0.9861287079895378, "eval_runtime": 5.0203, "eval_samples_per_second": 63.343, "eval_steps_per_second": 7.968, "step": 3150 }, { "epoch": 14.044444444444444, "grad_norm": 0.14950770139694214, "learning_rate": 5.4221173079946556e-05, "loss": 0.016168467700481415, "step": 3160 }, { "epoch": 14.088888888888889, "grad_norm": 0.16931293904781342, "learning_rate": 5.4166132956380094e-05, "loss": 0.013228373229503631, "step": 3170 }, { "epoch": 14.133333333333333, "grad_norm": 0.14218904078006744, "learning_rate": 5.411086017561545e-05, "loss": 0.018651790916919708, "step": 3180 }, { "epoch": 14.177777777777777, "grad_norm": 0.0931057557463646, "learning_rate": 5.405535526978619e-05, "loss": 0.015197348594665528, "step": 3190 }, { "epoch": 14.222222222222221, "grad_norm": 0.21674780547618866, "learning_rate": 5.3999618773260606e-05, "loss": 0.013788039982318877, "step": 3200 }, { "epoch": 14.266666666666667, "grad_norm": 9.478878021240234, "learning_rate": 5.394365122263664e-05, "loss": 0.021974164247512817, "step": 3210 }, { "epoch": 14.311111111111112, "grad_norm": 0.1716259866952896, "learning_rate": 5.388745315673671e-05, "loss": 0.016454142332077027, "step": 3220 }, { "epoch": 14.355555555555556, "grad_norm": 0.38121506571769714, "learning_rate": 5.383102511660244e-05, "loss": 0.017990656197071075, "step": 3230 }, { "epoch": 14.4, "grad_norm": 0.2882017195224762, "learning_rate": 5.377436764548955e-05, "loss": 0.015024635195732116, "step": 3240 }, { "epoch": 14.444444444444445, "grad_norm": 0.20212651789188385, "learning_rate": 5.371748128886259e-05, "loss": 0.013451874256134033, "step": 3250 }, { "epoch": 14.488888888888889, "grad_norm": 1.434191346168518, "learning_rate": 5.366036659438965e-05, "loss": 0.016176268458366394, "step": 3260 }, { "epoch": 14.533333333333333, "grad_norm": 0.5465851426124573, "learning_rate": 5.3603024111937146e-05, "loss": 0.016791558265686034, "step": 3270 }, { "epoch": 14.577777777777778, "grad_norm": 0.2687932848930359, "learning_rate": 5.3545454393564506e-05, "loss": 0.017058029770851135, "step": 3280 }, { "epoch": 14.622222222222222, "grad_norm": 0.45476430654525757, "learning_rate": 5.348765799351882e-05, "loss": 0.022091104090213774, "step": 3290 }, { "epoch": 14.666666666666666, "grad_norm": 0.1616237759590149, "learning_rate": 5.3429635468229584e-05, "loss": 0.017325878143310547, "step": 3300 }, { "epoch": 14.71111111111111, "grad_norm": 0.38689810037612915, "learning_rate": 5.337138737630324e-05, "loss": 0.015759383141994477, "step": 3310 }, { "epoch": 14.755555555555556, "grad_norm": 0.37098243832588196, "learning_rate": 5.3312914278517885e-05, "loss": 0.01436927318572998, "step": 3320 }, { "epoch": 14.8, "grad_norm": 0.2093076854944229, "learning_rate": 5.325421673781784e-05, "loss": 0.01572567820549011, "step": 3330 }, { "epoch": 14.844444444444445, "grad_norm": 0.1502954065799713, "learning_rate": 5.319529531930822e-05, "loss": 0.015441009402275085, "step": 3340 }, { "epoch": 14.88888888888889, "grad_norm": 0.05795728787779808, "learning_rate": 5.313615059024949e-05, "loss": 0.01906130164861679, "step": 3350 }, { "epoch": 14.933333333333334, "grad_norm": 0.25697875022888184, "learning_rate": 5.3076783120052046e-05, "loss": 0.012249890714883804, "step": 3360 }, { "epoch": 14.977777777777778, "grad_norm": 0.26788923144340515, "learning_rate": 5.3017193480270675e-05, "loss": 0.01380850374698639, "step": 3370 }, { "epoch": 15.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9834813894665752, "eval_iou_background": 0.0, "eval_iou_crop": 0.9834813894665752, "eval_loss": 0.016938913613557816, "eval_mean_accuracy": 0.9834813894665752, "eval_mean_iou": 0.4917406947332876, "eval_overall_accuracy": 0.9834813894665752, "eval_runtime": 4.9765, "eval_samples_per_second": 63.9, "eval_steps_per_second": 8.038, "step": 3375 }, { "epoch": 15.022222222222222, "grad_norm": 0.14800319075584412, "learning_rate": 5.2957382244599106e-05, "loss": 0.015058769285678864, "step": 3380 }, { "epoch": 15.066666666666666, "grad_norm": 0.46365201473236084, "learning_rate": 5.2897349988864426e-05, "loss": 0.01727105677127838, "step": 3390 }, { "epoch": 15.11111111111111, "grad_norm": 0.20886977016925812, "learning_rate": 5.283709729102162e-05, "loss": 0.015442529320716858, "step": 3400 }, { "epoch": 15.155555555555555, "grad_norm": 0.16950465738773346, "learning_rate": 5.277662473114793e-05, "loss": 0.01710917353630066, "step": 3410 }, { "epoch": 15.2, "grad_norm": 0.14677827060222626, "learning_rate": 5.27159328914373e-05, "loss": 0.01569821834564209, "step": 3420 }, { "epoch": 15.244444444444444, "grad_norm": 0.15767405927181244, "learning_rate": 5.265502235619477e-05, "loss": 0.015042471885681152, "step": 3430 }, { "epoch": 15.28888888888889, "grad_norm": 0.11843352019786835, "learning_rate": 5.259389371183086e-05, "loss": 0.014518451690673829, "step": 3440 }, { "epoch": 15.333333333333334, "grad_norm": 0.3046417236328125, "learning_rate": 5.2532547546855923e-05, "loss": 0.015474611520767212, "step": 3450 }, { "epoch": 15.377777777777778, "grad_norm": 0.2158462405204773, "learning_rate": 5.247098445187442e-05, "loss": 0.014826107025146484, "step": 3460 }, { "epoch": 15.422222222222222, "grad_norm": 0.7991043925285339, "learning_rate": 5.240920501957937e-05, "loss": 0.01627553105354309, "step": 3470 }, { "epoch": 15.466666666666667, "grad_norm": 0.20679478347301483, "learning_rate": 5.2347209844746484e-05, "loss": 0.015085215866565704, "step": 3480 }, { "epoch": 15.511111111111111, "grad_norm": 0.25514882802963257, "learning_rate": 5.2284999524228544e-05, "loss": 0.01894485652446747, "step": 3490 }, { "epoch": 15.555555555555555, "grad_norm": 0.21953126788139343, "learning_rate": 5.2222574656949646e-05, "loss": 0.020057114958763122, "step": 3500 }, { "epoch": 15.6, "grad_norm": 0.28845933079719543, "learning_rate": 5.215993584389938e-05, "loss": 0.014156970381736755, "step": 3510 }, { "epoch": 15.644444444444444, "grad_norm": 0.2641865611076355, "learning_rate": 5.20970836881271e-05, "loss": 0.01988045424222946, "step": 3520 }, { "epoch": 15.688888888888888, "grad_norm": 0.1309666782617569, "learning_rate": 5.203401879473609e-05, "loss": 0.016284553706645964, "step": 3530 }, { "epoch": 15.733333333333333, "grad_norm": 0.40189066529273987, "learning_rate": 5.197074177087775e-05, "loss": 0.01664513498544693, "step": 3540 }, { "epoch": 15.777777777777779, "grad_norm": 0.32680052518844604, "learning_rate": 5.190725322574574e-05, "loss": 0.013683022558689117, "step": 3550 }, { "epoch": 15.822222222222223, "grad_norm": 0.2134275883436203, "learning_rate": 5.1843553770570135e-05, "loss": 0.015080173313617707, "step": 3560 }, { "epoch": 15.866666666666667, "grad_norm": 0.15053214132785797, "learning_rate": 5.1779644018611504e-05, "loss": 0.01286524087190628, "step": 3570 }, { "epoch": 15.911111111111111, "grad_norm": 0.11935795098543167, "learning_rate": 5.1715524585155055e-05, "loss": 0.01499553769826889, "step": 3580 }, { "epoch": 15.955555555555556, "grad_norm": 0.30144304037094116, "learning_rate": 5.165119608750466e-05, "loss": 0.012784159183502198, "step": 3590 }, { "epoch": 16.0, "grad_norm": 0.16827891767024994, "learning_rate": 5.158665914497695e-05, "loss": 0.012316960096359252, "step": 3600 }, { "epoch": 16.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9851745854190402, "eval_iou_background": 0.0, "eval_iou_crop": 0.9851745854190402, "eval_loss": 0.017505981028079987, "eval_mean_accuracy": 0.9851745854190402, "eval_mean_iou": 0.4925872927095201, "eval_overall_accuracy": 0.9851745854190402, "eval_runtime": 4.4631, "eval_samples_per_second": 71.251, "eval_steps_per_second": 8.962, "step": 3600 }, { "epoch": 16.044444444444444, "grad_norm": 0.2909557819366455, "learning_rate": 5.1521914378895365e-05, "loss": 0.015978696942329406, "step": 3610 }, { "epoch": 16.08888888888889, "grad_norm": 0.279092013835907, "learning_rate": 5.145696241258408e-05, "loss": 0.014709393680095672, "step": 3620 }, { "epoch": 16.133333333333333, "grad_norm": 0.13046345114707947, "learning_rate": 5.139180387136214e-05, "loss": 0.01317310631275177, "step": 3630 }, { "epoch": 16.177777777777777, "grad_norm": 0.199358269572258, "learning_rate": 5.132643938253732e-05, "loss": 0.015848933160305022, "step": 3640 }, { "epoch": 16.22222222222222, "grad_norm": 0.15392941236495972, "learning_rate": 5.126086957540019e-05, "loss": 0.014615638554096222, "step": 3650 }, { "epoch": 16.266666666666666, "grad_norm": 0.12797755002975464, "learning_rate": 5.1195095081217944e-05, "loss": 0.013077689707279206, "step": 3660 }, { "epoch": 16.31111111111111, "grad_norm": 0.2860284745693207, "learning_rate": 5.1129116533228425e-05, "loss": 0.015378519892692566, "step": 3670 }, { "epoch": 16.355555555555554, "grad_norm": 0.1093951165676117, "learning_rate": 5.106293456663396e-05, "loss": 0.019132941961288452, "step": 3680 }, { "epoch": 16.4, "grad_norm": 0.1277124434709549, "learning_rate": 5.099654981859529e-05, "loss": 0.012462624162435532, "step": 3690 }, { "epoch": 16.444444444444443, "grad_norm": 0.30958092212677, "learning_rate": 5.092996292822539e-05, "loss": 0.015587472915649414, "step": 3700 }, { "epoch": 16.488888888888887, "grad_norm": 0.13282138109207153, "learning_rate": 5.086317453658337e-05, "loss": 0.01358308345079422, "step": 3710 }, { "epoch": 16.533333333333335, "grad_norm": 0.22578182816505432, "learning_rate": 5.079618528666826e-05, "loss": 0.01614467203617096, "step": 3720 }, { "epoch": 16.57777777777778, "grad_norm": 0.13008703291416168, "learning_rate": 5.072899582341282e-05, "loss": 0.014336599409580231, "step": 3730 }, { "epoch": 16.622222222222224, "grad_norm": 0.2419137954711914, "learning_rate": 5.066160679367737e-05, "loss": 0.018063643574714662, "step": 3740 }, { "epoch": 16.666666666666668, "grad_norm": 0.28087955713272095, "learning_rate": 5.059401884624354e-05, "loss": 0.014685027301311493, "step": 3750 }, { "epoch": 16.711111111111112, "grad_norm": 0.2836267650127411, "learning_rate": 5.052623263180799e-05, "loss": 0.014226374030113221, "step": 3760 }, { "epoch": 16.755555555555556, "grad_norm": 0.11046747118234634, "learning_rate": 5.045824880297621e-05, "loss": 0.012857003509998322, "step": 3770 }, { "epoch": 16.8, "grad_norm": 0.15025067329406738, "learning_rate": 5.0390068014256184e-05, "loss": 0.014658236503601074, "step": 3780 }, { "epoch": 16.844444444444445, "grad_norm": 0.10254954546689987, "learning_rate": 5.032169092205212e-05, "loss": 0.011833485215902328, "step": 3790 }, { "epoch": 16.88888888888889, "grad_norm": 0.21225418150424957, "learning_rate": 5.025311818465811e-05, "loss": 0.018314675986766817, "step": 3800 }, { "epoch": 16.933333333333334, "grad_norm": 0.14111171662807465, "learning_rate": 5.018435046225182e-05, "loss": 0.012658929824829102, "step": 3810 }, { "epoch": 16.977777777777778, "grad_norm": 0.2379542738199234, "learning_rate": 5.01153884168881e-05, "loss": 0.01706341505050659, "step": 3820 }, { "epoch": 17.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9839445557629332, "eval_iou_background": 0.0, "eval_iou_crop": 0.9839445557629332, "eval_loss": 0.01656997948884964, "eval_mean_accuracy": 0.9839445557629332, "eval_mean_iou": 0.4919722778814666, "eval_overall_accuracy": 0.9839445557629332, "eval_runtime": 5.0215, "eval_samples_per_second": 63.328, "eval_steps_per_second": 7.966, "step": 3825 }, { "epoch": 17.022222222222222, "grad_norm": 0.39262789487838745, "learning_rate": 5.004623271249263e-05, "loss": 0.014760017395019531, "step": 3830 }, { "epoch": 17.066666666666666, "grad_norm": 0.19445766508579254, "learning_rate": 4.997688401485551e-05, "loss": 0.014318600296974182, "step": 3840 }, { "epoch": 17.11111111111111, "grad_norm": 0.37851327657699585, "learning_rate": 4.99073429916249e-05, "loss": 0.017509520053863525, "step": 3850 }, { "epoch": 17.155555555555555, "grad_norm": 0.39725691080093384, "learning_rate": 4.983761031230051e-05, "loss": 0.015525509417057038, "step": 3860 }, { "epoch": 17.2, "grad_norm": 0.19558538496494293, "learning_rate": 4.976768664822725e-05, "loss": 0.021957294642925264, "step": 3870 }, { "epoch": 17.244444444444444, "grad_norm": Infinity, "learning_rate": 4.9697572672588694e-05, "loss": 0.01650039404630661, "step": 3880 }, { "epoch": 17.288888888888888, "grad_norm": 0.21717479825019836, "learning_rate": 4.962726906040062e-05, "loss": 0.015944221615791322, "step": 3890 }, { "epoch": 17.333333333333332, "grad_norm": 0.14977721869945526, "learning_rate": 4.95567764885045e-05, "loss": 0.014208893477916717, "step": 3900 }, { "epoch": 17.377777777777776, "grad_norm": 0.2550029158592224, "learning_rate": 4.9486095635561035e-05, "loss": 0.023358891904354095, "step": 3910 }, { "epoch": 17.42222222222222, "grad_norm": 0.2689019441604614, "learning_rate": 4.9415227182043563e-05, "loss": 0.017782679200172423, "step": 3920 }, { "epoch": 17.466666666666665, "grad_norm": 0.2438889890909195, "learning_rate": 4.934417181023152e-05, "loss": 0.015798898041248323, "step": 3930 }, { "epoch": 17.511111111111113, "grad_norm": 0.2148306518793106, "learning_rate": 4.927293020420391e-05, "loss": 0.015784426033496855, "step": 3940 }, { "epoch": 17.555555555555557, "grad_norm": 0.12729798257350922, "learning_rate": 4.920150304983267e-05, "loss": 0.013893619179725647, "step": 3950 }, { "epoch": 17.6, "grad_norm": 0.16336530447006226, "learning_rate": 4.912989103477606e-05, "loss": 0.013018724322319031, "step": 3960 }, { "epoch": 17.644444444444446, "grad_norm": 0.2534140348434448, "learning_rate": 4.905809484847213e-05, "loss": 0.022515588998794557, "step": 3970 }, { "epoch": 17.68888888888889, "grad_norm": 0.10193440318107605, "learning_rate": 4.898611518213197e-05, "loss": 0.014378860592842102, "step": 3980 }, { "epoch": 17.733333333333334, "grad_norm": 0.16317637264728546, "learning_rate": 4.8913952728733136e-05, "loss": 0.012696251273155212, "step": 3990 }, { "epoch": 17.77777777777778, "grad_norm": 0.17505896091461182, "learning_rate": 4.8841608183012926e-05, "loss": 0.011806779354810715, "step": 4000 }, { "epoch": 17.822222222222223, "grad_norm": 0.16301144659519196, "learning_rate": 4.876908224146174e-05, "loss": 0.014675123989582062, "step": 4010 }, { "epoch": 17.866666666666667, "grad_norm": 0.3365599513053894, "learning_rate": 4.869637560231632e-05, "loss": 0.014278171956539154, "step": 4020 }, { "epoch": 17.91111111111111, "grad_norm": 0.108104407787323, "learning_rate": 4.86234889655531e-05, "loss": 0.011147437244653701, "step": 4030 }, { "epoch": 17.955555555555556, "grad_norm": 0.5049643516540527, "learning_rate": 4.855042303288138e-05, "loss": 0.012674018740653992, "step": 4040 }, { "epoch": 18.0, "grad_norm": 0.15814153850078583, "learning_rate": 4.847717850773664e-05, "loss": 0.013458079099655152, "step": 4050 }, { "epoch": 18.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9860373134308262, "eval_iou_background": 0.0, "eval_iou_crop": 0.9860373134308262, "eval_loss": 0.015890469774603844, "eval_mean_accuracy": 0.9860373134308262, "eval_mean_iou": 0.4930186567154131, "eval_overall_accuracy": 0.9860373134308262, "eval_runtime": 5.0111, "eval_samples_per_second": 63.459, "eval_steps_per_second": 7.982, "step": 4050 }, { "epoch": 18.044444444444444, "grad_norm": 0.2705215513706207, "learning_rate": 4.840375609527373e-05, "loss": 0.013046360015869141, "step": 4060 }, { "epoch": 18.08888888888889, "grad_norm": 0.18584178388118744, "learning_rate": 4.83301565023601e-05, "loss": 0.012838506698608398, "step": 4070 }, { "epoch": 18.133333333333333, "grad_norm": 0.17411309480667114, "learning_rate": 4.825638043756901e-05, "loss": 0.012041444331407547, "step": 4080 }, { "epoch": 18.177777777777777, "grad_norm": 0.33050012588500977, "learning_rate": 4.818242861117263e-05, "loss": 0.015820732712745665, "step": 4090 }, { "epoch": 18.22222222222222, "grad_norm": 0.3740712106227875, "learning_rate": 4.810830173513531e-05, "loss": 0.012328142672777176, "step": 4100 }, { "epoch": 18.266666666666666, "grad_norm": 0.19381961226463318, "learning_rate": 4.8034000523106665e-05, "loss": 0.01469101756811142, "step": 4110 }, { "epoch": 18.31111111111111, "grad_norm": 0.5021510720252991, "learning_rate": 4.7959525690414694e-05, "loss": 0.011269740015268325, "step": 4120 }, { "epoch": 18.355555555555554, "grad_norm": 0.2622928321361542, "learning_rate": 4.7884877954058925e-05, "loss": 0.01223604753613472, "step": 4130 }, { "epoch": 18.4, "grad_norm": 0.17169535160064697, "learning_rate": 4.78100580327035e-05, "loss": 0.013732567429542542, "step": 4140 }, { "epoch": 18.444444444444443, "grad_norm": 0.11435951292514801, "learning_rate": 4.773506664667026e-05, "loss": 0.011069429665803909, "step": 4150 }, { "epoch": 18.488888888888887, "grad_norm": 0.23226188123226166, "learning_rate": 4.7659904517931806e-05, "loss": 0.014789837598800658, "step": 4160 }, { "epoch": 18.533333333333335, "grad_norm": 0.1889769583940506, "learning_rate": 4.758457237010452e-05, "loss": 0.017169690132141112, "step": 4170 }, { "epoch": 18.57777777777778, "grad_norm": 0.12727473676204681, "learning_rate": 4.750907092844168e-05, "loss": 0.013718323409557342, "step": 4180 }, { "epoch": 18.622222222222224, "grad_norm": 0.3296601474285126, "learning_rate": 4.743340091982638e-05, "loss": 0.01722012609243393, "step": 4190 }, { "epoch": 18.666666666666668, "grad_norm": 0.17683351039886475, "learning_rate": 4.73575630727646e-05, "loss": 0.014707109332084656, "step": 4200 }, { "epoch": 18.711111111111112, "grad_norm": 0.38984397053718567, "learning_rate": 4.728155811737816e-05, "loss": 0.01865033507347107, "step": 4210 }, { "epoch": 18.755555555555556, "grad_norm": 0.14279262721538544, "learning_rate": 4.7205386785397696e-05, "loss": 0.014495043456554413, "step": 4220 }, { "epoch": 18.8, "grad_norm": 0.9067888259887695, "learning_rate": 4.712904981015563e-05, "loss": 0.016548363864421843, "step": 4230 }, { "epoch": 18.844444444444445, "grad_norm": 0.13014072179794312, "learning_rate": 4.705254792657909e-05, "loss": 0.011523249000310898, "step": 4240 }, { "epoch": 18.88888888888889, "grad_norm": 0.19852551817893982, "learning_rate": 4.697588187118285e-05, "loss": 0.018079638481140137, "step": 4250 }, { "epoch": 18.933333333333334, "grad_norm": 0.17358213663101196, "learning_rate": 4.6899052382062236e-05, "loss": 0.014190353453159332, "step": 4260 }, { "epoch": 18.977777777777778, "grad_norm": 0.23657366633415222, "learning_rate": 4.6822060198885996e-05, "loss": 0.015455757081508637, "step": 4270 }, { "epoch": 19.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9861772327375632, "eval_iou_background": 0.0, "eval_iou_crop": 0.9861772327375632, "eval_loss": 0.015139489434659481, "eval_mean_accuracy": 0.9861772327375632, "eval_mean_iou": 0.4930886163687816, "eval_overall_accuracy": 0.9861772327375632, "eval_runtime": 4.373, "eval_samples_per_second": 72.718, "eval_steps_per_second": 9.147, "step": 4275 }, { "epoch": 19.022222222222222, "grad_norm": 0.10885288566350937, "learning_rate": 4.674490606288923e-05, "loss": 0.012244389206171036, "step": 4280 }, { "epoch": 19.066666666666666, "grad_norm": 0.15863460302352905, "learning_rate": 4.6667590716866195e-05, "loss": 0.013228732347488403, "step": 4290 }, { "epoch": 19.11111111111111, "grad_norm": 0.1918136030435562, "learning_rate": 4.659011490516321e-05, "loss": 0.011203145235776901, "step": 4300 }, { "epoch": 19.155555555555555, "grad_norm": 0.19905351102352142, "learning_rate": 4.6512479373671446e-05, "loss": 0.01351548582315445, "step": 4310 }, { "epoch": 19.2, "grad_norm": 0.30459675192832947, "learning_rate": 4.643468486981976e-05, "loss": 0.019450746476650238, "step": 4320 }, { "epoch": 19.244444444444444, "grad_norm": 0.2183472216129303, "learning_rate": 4.635673214256751e-05, "loss": 0.019338572025299074, "step": 4330 }, { "epoch": 19.288888888888888, "grad_norm": 0.2814614772796631, "learning_rate": 4.627862194239731e-05, "loss": 0.016339717805385588, "step": 4340 }, { "epoch": 19.333333333333332, "grad_norm": 0.1068657636642456, "learning_rate": 4.620035502130788e-05, "loss": 0.012785866856575012, "step": 4350 }, { "epoch": 19.377777777777776, "grad_norm": 0.1997951865196228, "learning_rate": 4.612193213280671e-05, "loss": 0.01232658252120018, "step": 4360 }, { "epoch": 19.42222222222222, "grad_norm": 0.14932139217853546, "learning_rate": 4.6043354031902874e-05, "loss": 0.012750166654586791, "step": 4370 }, { "epoch": 19.466666666666665, "grad_norm": 0.18346615135669708, "learning_rate": 4.5964621475099724e-05, "loss": 0.013776150345802308, "step": 4380 }, { "epoch": 19.511111111111113, "grad_norm": 0.306440532207489, "learning_rate": 4.5885735220387635e-05, "loss": 0.013980616629123688, "step": 4390 }, { "epoch": 19.555555555555557, "grad_norm": 0.15862058103084564, "learning_rate": 4.580669602723668e-05, "loss": 0.01154005229473114, "step": 4400 }, { "epoch": 19.6, "grad_norm": 0.4324413537979126, "learning_rate": 4.572750465658936e-05, "loss": 0.01448594182729721, "step": 4410 }, { "epoch": 19.644444444444446, "grad_norm": 0.14381954073905945, "learning_rate": 4.5648161870853236e-05, "loss": 0.01420983225107193, "step": 4420 }, { "epoch": 19.68888888888889, "grad_norm": 0.14194971323013306, "learning_rate": 4.556866843389358e-05, "loss": 0.012863323092460632, "step": 4430 }, { "epoch": 19.733333333333334, "grad_norm": 0.2435237318277359, "learning_rate": 4.5489025111026076e-05, "loss": 0.016433939337730408, "step": 4440 }, { "epoch": 19.77777777777778, "grad_norm": 0.10523701459169388, "learning_rate": 4.540923266900941e-05, "loss": 0.01074020266532898, "step": 4450 }, { "epoch": 19.822222222222223, "grad_norm": 0.18980276584625244, "learning_rate": 4.53292918760379e-05, "loss": 0.0112264484167099, "step": 4460 }, { "epoch": 19.866666666666667, "grad_norm": 0.2752103805541992, "learning_rate": 4.52492035017341e-05, "loss": 0.015635377168655394, "step": 4470 }, { "epoch": 19.91111111111111, "grad_norm": 1.3737664222717285, "learning_rate": 4.516896831714137e-05, "loss": 0.016879482567310332, "step": 4480 }, { "epoch": 19.955555555555556, "grad_norm": 0.12320782244205475, "learning_rate": 4.508858709471651e-05, "loss": 0.012201451510190964, "step": 4490 }, { "epoch": 20.0, "grad_norm": 0.4416322112083435, "learning_rate": 4.500806060832226e-05, "loss": 0.014090846478939056, "step": 4500 }, { "epoch": 20.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9871135287913056, "eval_iou_background": 0.0, "eval_iou_crop": 0.9871135287913056, "eval_loss": 0.015118477866053581, "eval_mean_accuracy": 0.9871135287913056, "eval_mean_iou": 0.4935567643956528, "eval_overall_accuracy": 0.9871135287913056, "eval_runtime": 4.8935, "eval_samples_per_second": 64.985, "eval_steps_per_second": 8.174, "step": 4500 }, { "epoch": 20.044444444444444, "grad_norm": 0.12081073224544525, "learning_rate": 4.492738963321988e-05, "loss": 0.013557195663452148, "step": 4510 }, { "epoch": 20.08888888888889, "grad_norm": 0.1313193291425705, "learning_rate": 4.484657494606168e-05, "loss": 0.015050242841243743, "step": 4520 }, { "epoch": 20.133333333333333, "grad_norm": 0.08254443854093552, "learning_rate": 4.476561732488355e-05, "loss": 0.01053604856133461, "step": 4530 }, { "epoch": 20.177777777777777, "grad_norm": 0.8921693563461304, "learning_rate": 4.468451754909745e-05, "loss": 0.014754563570022583, "step": 4540 }, { "epoch": 20.22222222222222, "grad_norm": 0.14051100611686707, "learning_rate": 4.460327639948396e-05, "loss": 0.011931516230106354, "step": 4550 }, { "epoch": 20.266666666666666, "grad_norm": 0.12428005039691925, "learning_rate": 4.452189465818466e-05, "loss": 0.013863354921340942, "step": 4560 }, { "epoch": 20.31111111111111, "grad_norm": 0.1111815869808197, "learning_rate": 4.444037310869472e-05, "loss": 0.011757607758045196, "step": 4570 }, { "epoch": 20.355555555555554, "grad_norm": 0.11765488237142563, "learning_rate": 4.435871253585526e-05, "loss": 0.01123102381825447, "step": 4580 }, { "epoch": 20.4, "grad_norm": 0.11271458864212036, "learning_rate": 4.427691372584588e-05, "loss": 0.012464137375354766, "step": 4590 }, { "epoch": 20.444444444444443, "grad_norm": 0.41501984000205994, "learning_rate": 4.419497746617699e-05, "loss": 0.012224309146404266, "step": 4600 }, { "epoch": 20.488888888888887, "grad_norm": 0.3214302361011505, "learning_rate": 4.4112904545682335e-05, "loss": 0.013756099343299865, "step": 4610 }, { "epoch": 20.533333333333335, "grad_norm": 0.25750476121902466, "learning_rate": 4.403069575451131e-05, "loss": 0.013290074467658997, "step": 4620 }, { "epoch": 20.57777777777778, "grad_norm": 0.12883925437927246, "learning_rate": 4.394835188412141e-05, "loss": 0.014426285028457641, "step": 4630 }, { "epoch": 20.622222222222224, "grad_norm": 0.17055150866508484, "learning_rate": 4.38658737272706e-05, "loss": 0.014699026942253113, "step": 4640 }, { "epoch": 20.666666666666668, "grad_norm": 0.23172207176685333, "learning_rate": 4.3783262078009655e-05, "loss": 0.01762499362230301, "step": 4650 }, { "epoch": 20.711111111111112, "grad_norm": 0.23253442347049713, "learning_rate": 4.370051773167457e-05, "loss": 0.01439288556575775, "step": 4660 }, { "epoch": 20.755555555555556, "grad_norm": 0.5481510758399963, "learning_rate": 4.361764148487882e-05, "loss": 0.013316360116004945, "step": 4670 }, { "epoch": 20.8, "grad_norm": 0.1219111755490303, "learning_rate": 4.353463413550577e-05, "loss": 0.011680652946233749, "step": 4680 }, { "epoch": 20.844444444444445, "grad_norm": 0.147952601313591, "learning_rate": 4.3451496482700974e-05, "loss": 0.014628009498119354, "step": 4690 }, { "epoch": 20.88888888888889, "grad_norm": 0.4712466299533844, "learning_rate": 4.336822932686443e-05, "loss": 0.01690339744091034, "step": 4700 }, { "epoch": 20.933333333333334, "grad_norm": 0.2511211931705475, "learning_rate": 4.3284833469642974e-05, "loss": 0.012376104295253754, "step": 4710 }, { "epoch": 20.977777777777778, "grad_norm": 0.1344117820262909, "learning_rate": 4.320130971392244e-05, "loss": 0.017363159358501433, "step": 4720 }, { "epoch": 21.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9870075391086042, "eval_iou_background": 0.0, "eval_iou_crop": 0.9870075391086042, "eval_loss": 0.015117301605641842, "eval_mean_accuracy": 0.9870075391086042, "eval_mean_iou": 0.4935037695543021, "eval_overall_accuracy": 0.9870075391086042, "eval_runtime": 4.9353, "eval_samples_per_second": 64.433, "eval_steps_per_second": 8.105, "step": 4725 }, { "epoch": 21.022222222222222, "grad_norm": 0.14625823497772217, "learning_rate": 4.311765886382002e-05, "loss": 0.010718516260385513, "step": 4730 }, { "epoch": 21.066666666666666, "grad_norm": 0.39296555519104004, "learning_rate": 4.303388172467651e-05, "loss": 0.016242168843746185, "step": 4740 }, { "epoch": 21.11111111111111, "grad_norm": 0.07368537783622742, "learning_rate": 4.294997910304854e-05, "loss": 0.01154414564371109, "step": 4750 }, { "epoch": 21.155555555555555, "grad_norm": 0.2829134166240692, "learning_rate": 4.286595180670076e-05, "loss": 0.013675840198993683, "step": 4760 }, { "epoch": 21.2, "grad_norm": 0.1971064805984497, "learning_rate": 4.2781800644598176e-05, "loss": 0.014820921421051025, "step": 4770 }, { "epoch": 21.244444444444444, "grad_norm": 1.2101424932479858, "learning_rate": 4.269752642689829e-05, "loss": 0.013227643072605133, "step": 4780 }, { "epoch": 21.288888888888888, "grad_norm": 0.23676154017448425, "learning_rate": 4.261312996494326e-05, "loss": 0.013315065205097199, "step": 4790 }, { "epoch": 21.333333333333332, "grad_norm": 0.45034775137901306, "learning_rate": 4.252861207125221e-05, "loss": 0.013164311647415161, "step": 4800 }, { "epoch": 21.377777777777776, "grad_norm": 0.3524860143661499, "learning_rate": 4.24439735595133e-05, "loss": 0.01475537270307541, "step": 4810 }, { "epoch": 21.42222222222222, "grad_norm": 0.09781530499458313, "learning_rate": 4.235921524457592e-05, "loss": 0.012807892262935638, "step": 4820 }, { "epoch": 21.466666666666665, "grad_norm": 0.18226628005504608, "learning_rate": 4.227433794244287e-05, "loss": 0.012039326876401902, "step": 4830 }, { "epoch": 21.511111111111113, "grad_norm": 0.12963774800300598, "learning_rate": 4.2189342470262495e-05, "loss": 0.014795947074890136, "step": 4840 }, { "epoch": 21.555555555555557, "grad_norm": 0.10910047590732574, "learning_rate": 4.210422964632079e-05, "loss": 0.011096320301294326, "step": 4850 }, { "epoch": 21.6, "grad_norm": 0.138892263174057, "learning_rate": 4.2019000290033546e-05, "loss": 0.01069805771112442, "step": 4860 }, { "epoch": 21.644444444444446, "grad_norm": 0.2884569466114044, "learning_rate": 4.19336552219385e-05, "loss": 0.013404151797294617, "step": 4870 }, { "epoch": 21.68888888888889, "grad_norm": 0.27250146865844727, "learning_rate": 4.184819526368732e-05, "loss": 0.01478063315153122, "step": 4880 }, { "epoch": 21.733333333333334, "grad_norm": 0.219447523355484, "learning_rate": 4.176262123803782e-05, "loss": 0.01309678852558136, "step": 4890 }, { "epoch": 21.77777777777778, "grad_norm": 0.20271621644496918, "learning_rate": 4.167693396884599e-05, "loss": 0.0123354472219944, "step": 4900 }, { "epoch": 21.822222222222223, "grad_norm": 1.4013220071792603, "learning_rate": 4.1591134281058056e-05, "loss": 0.010517559200525283, "step": 4910 }, { "epoch": 21.866666666666667, "grad_norm": 0.48052576184272766, "learning_rate": 4.1505223000702495e-05, "loss": 0.018875105679035185, "step": 4920 }, { "epoch": 21.91111111111111, "grad_norm": 0.09969591349363327, "learning_rate": 4.14192009548822e-05, "loss": 0.014596067368984222, "step": 4930 }, { "epoch": 21.955555555555556, "grad_norm": 3.0228359699249268, "learning_rate": 4.133306897176643e-05, "loss": 0.020536874234676362, "step": 4940 }, { "epoch": 22.0, "grad_norm": 0.3174501657485962, "learning_rate": 4.1246827880582804e-05, "loss": 0.01253487914800644, "step": 4950 }, { "epoch": 22.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9871358254013861, "eval_iou_background": 0.0, "eval_iou_crop": 0.9871358254013861, "eval_loss": 0.01550846267491579, "eval_mean_accuracy": 0.9871358254013861, "eval_mean_iou": 0.49356791270069306, "eval_overall_accuracy": 0.9871358254013861, "eval_runtime": 4.6526, "eval_samples_per_second": 68.348, "eval_steps_per_second": 8.597, "step": 4950 }, { "epoch": 22.044444444444444, "grad_norm": 0.23235675692558289, "learning_rate": 4.1160478511609445e-05, "loss": 0.011753221601247787, "step": 4960 }, { "epoch": 22.08888888888889, "grad_norm": 0.2998289167881012, "learning_rate": 4.1074021696166856e-05, "loss": 0.013770183920860291, "step": 4970 }, { "epoch": 22.133333333333333, "grad_norm": 0.13231034576892853, "learning_rate": 4.098745826661e-05, "loss": 0.012192551046609879, "step": 4980 }, { "epoch": 22.177777777777777, "grad_norm": 0.24910154938697815, "learning_rate": 4.090078905632024e-05, "loss": 0.014448168873786926, "step": 4990 }, { "epoch": 22.22222222222222, "grad_norm": 0.13580670952796936, "learning_rate": 4.0814014899697354e-05, "loss": 0.011927390843629837, "step": 5000 }, { "epoch": 22.266666666666666, "grad_norm": 0.21380552649497986, "learning_rate": 4.072713663215144e-05, "loss": 0.010641471296548844, "step": 5010 }, { "epoch": 22.31111111111111, "grad_norm": 0.09145312756299973, "learning_rate": 4.064015509009495e-05, "loss": 0.01175723373889923, "step": 5020 }, { "epoch": 22.355555555555554, "grad_norm": 0.37142959237098694, "learning_rate": 4.055307111093463e-05, "loss": 0.013820433616638183, "step": 5030 }, { "epoch": 22.4, "grad_norm": 0.2674047648906708, "learning_rate": 4.046588553306334e-05, "loss": 0.013798479735851289, "step": 5040 }, { "epoch": 22.444444444444443, "grad_norm": 0.11118604242801666, "learning_rate": 4.037859919585215e-05, "loss": 0.011561152338981629, "step": 5050 }, { "epoch": 22.488888888888887, "grad_norm": 0.24756036698818207, "learning_rate": 4.029121293964215e-05, "loss": 0.01610407531261444, "step": 5060 }, { "epoch": 22.533333333333335, "grad_norm": 0.09399569779634476, "learning_rate": 4.020372760573641e-05, "loss": 0.01333436816930771, "step": 5070 }, { "epoch": 22.57777777777778, "grad_norm": 0.3573289215564728, "learning_rate": 4.011614403639182e-05, "loss": 0.012633901834487916, "step": 5080 }, { "epoch": 22.622222222222224, "grad_norm": 0.42219462990760803, "learning_rate": 4.002846307481109e-05, "loss": 0.012138797342777253, "step": 5090 }, { "epoch": 22.666666666666668, "grad_norm": 0.07215817272663116, "learning_rate": 3.99406855651345e-05, "loss": 0.012292763590812683, "step": 5100 }, { "epoch": 22.711111111111112, "grad_norm": 0.30937665700912476, "learning_rate": 3.9852812352431854e-05, "loss": 0.013484591245651245, "step": 5110 }, { "epoch": 22.755555555555556, "grad_norm": 0.3903883695602417, "learning_rate": 3.9764844282694376e-05, "loss": 0.012490253150463104, "step": 5120 }, { "epoch": 22.8, "grad_norm": 0.19917690753936768, "learning_rate": 3.9676782202826434e-05, "loss": 0.016570541262626647, "step": 5130 }, { "epoch": 22.844444444444445, "grad_norm": 0.21992650628089905, "learning_rate": 3.9588626960637535e-05, "loss": 0.011049211025238037, "step": 5140 }, { "epoch": 22.88888888888889, "grad_norm": 0.42348355054855347, "learning_rate": 3.9500379404834086e-05, "loss": 0.010096324235200882, "step": 5150 }, { "epoch": 22.933333333333334, "grad_norm": 0.19451011717319489, "learning_rate": 3.9412040385011214e-05, "loss": 0.012554092705249787, "step": 5160 }, { "epoch": 22.977777777777778, "grad_norm": 0.14549313485622406, "learning_rate": 3.9323610751644615e-05, "loss": 0.011503917723894119, "step": 5170 }, { "epoch": 23.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9852042603759349, "eval_iou_background": 0.0, "eval_iou_crop": 0.9852042603759349, "eval_loss": 0.015733828768134117, "eval_mean_accuracy": 0.9852042603759349, "eval_mean_iou": 0.49260213018796745, "eval_overall_accuracy": 0.9852042603759349, "eval_runtime": 5.0158, "eval_samples_per_second": 63.399, "eval_steps_per_second": 7.975, "step": 5175 }, { "epoch": 23.022222222222222, "grad_norm": 0.1476505547761917, "learning_rate": 3.9235091356082367e-05, "loss": 0.011009421199560165, "step": 5180 }, { "epoch": 23.066666666666666, "grad_norm": 0.1859346628189087, "learning_rate": 3.914648305053674e-05, "loss": 0.011327420175075532, "step": 5190 }, { "epoch": 23.11111111111111, "grad_norm": 0.14264126121997833, "learning_rate": 3.905778668807591e-05, "loss": 0.01147976741194725, "step": 5200 }, { "epoch": 23.155555555555555, "grad_norm": 1.5061616897583008, "learning_rate": 3.8969003122615914e-05, "loss": 0.012967683374881744, "step": 5210 }, { "epoch": 23.2, "grad_norm": 0.16320443153381348, "learning_rate": 3.888013320891224e-05, "loss": 0.013108810782432556, "step": 5220 }, { "epoch": 23.244444444444444, "grad_norm": 1.5962873697280884, "learning_rate": 3.879117780255172e-05, "loss": 0.011633485555648804, "step": 5230 }, { "epoch": 23.288888888888888, "grad_norm": 0.21468575298786163, "learning_rate": 3.8702137759944284e-05, "loss": 0.010622628778219224, "step": 5240 }, { "epoch": 23.333333333333332, "grad_norm": 0.157609224319458, "learning_rate": 3.861301393831463e-05, "loss": 0.014727635681629181, "step": 5250 }, { "epoch": 23.377777777777776, "grad_norm": 0.23265589773654938, "learning_rate": 3.8523807195694085e-05, "loss": 0.011964748054742813, "step": 5260 }, { "epoch": 23.42222222222222, "grad_norm": 0.2714417278766632, "learning_rate": 3.843451839091227e-05, "loss": 0.011475460976362229, "step": 5270 }, { "epoch": 23.466666666666665, "grad_norm": 0.28275594115257263, "learning_rate": 3.834514838358885e-05, "loss": 0.011530306190252304, "step": 5280 }, { "epoch": 23.511111111111113, "grad_norm": 0.24730411171913147, "learning_rate": 3.825569803412525e-05, "loss": 0.010997382551431656, "step": 5290 }, { "epoch": 23.555555555555557, "grad_norm": 0.18561764061450958, "learning_rate": 3.816616820369641e-05, "loss": 0.009711622446775436, "step": 5300 }, { "epoch": 23.6, "grad_norm": 0.0866253450512886, "learning_rate": 3.807655975424243e-05, "loss": 0.010072186589241028, "step": 5310 }, { "epoch": 23.644444444444446, "grad_norm": 0.12349536269903183, "learning_rate": 3.798687354846034e-05, "loss": 0.014086106419563293, "step": 5320 }, { "epoch": 23.68888888888889, "grad_norm": 0.15099185705184937, "learning_rate": 3.789711044979573e-05, "loss": 0.011693022400140762, "step": 5330 }, { "epoch": 23.733333333333334, "grad_norm": 0.28846660256385803, "learning_rate": 3.780727132243452e-05, "loss": 0.011923646926879883, "step": 5340 }, { "epoch": 23.77777777777778, "grad_norm": 0.29731401801109314, "learning_rate": 3.7717357031294535e-05, "loss": 0.014544971287250519, "step": 5350 }, { "epoch": 23.822222222222223, "grad_norm": 0.37740805745124817, "learning_rate": 3.7627368442017236e-05, "loss": 0.01352475881576538, "step": 5360 }, { "epoch": 23.866666666666667, "grad_norm": 0.14040984213352203, "learning_rate": 3.7537306420959424e-05, "loss": 0.011473823338747025, "step": 5370 }, { "epoch": 23.91111111111111, "grad_norm": 0.17914456129074097, "learning_rate": 3.744717183518483e-05, "loss": 0.012021134793758392, "step": 5380 }, { "epoch": 23.955555555555556, "grad_norm": 0.20067499577999115, "learning_rate": 3.7356965552455785e-05, "loss": 0.016151851415634154, "step": 5390 }, { "epoch": 24.0, "grad_norm": 0.7884600162506104, "learning_rate": 3.7266688441224904e-05, "loss": 0.0123899906873703, "step": 5400 }, { "epoch": 24.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9866449768403388, "eval_iou_background": 0.0, "eval_iou_crop": 0.9866449768403388, "eval_loss": 0.015573155134916306, "eval_mean_accuracy": 0.9866449768403388, "eval_mean_iou": 0.4933224884201694, "eval_overall_accuracy": 0.9866449768403388, "eval_runtime": 4.264, "eval_samples_per_second": 74.579, "eval_steps_per_second": 9.381, "step": 5400 }, { "epoch": 24.044444444444444, "grad_norm": 0.10348880290985107, "learning_rate": 3.717634137062668e-05, "loss": 0.011656184494495393, "step": 5410 }, { "epoch": 24.08888888888889, "grad_norm": 0.5171974301338196, "learning_rate": 3.708592521046913e-05, "loss": 0.01098921000957489, "step": 5420 }, { "epoch": 24.133333333333333, "grad_norm": 0.3164861500263214, "learning_rate": 3.6995440831225426e-05, "loss": 0.01155562549829483, "step": 5430 }, { "epoch": 24.177777777777777, "grad_norm": 0.3504844307899475, "learning_rate": 3.690488910402553e-05, "loss": 0.010869145393371582, "step": 5440 }, { "epoch": 24.22222222222222, "grad_norm": 0.20645228028297424, "learning_rate": 3.681427090064776e-05, "loss": 0.01712305247783661, "step": 5450 }, { "epoch": 24.266666666666666, "grad_norm": 0.32779228687286377, "learning_rate": 3.672358709351045e-05, "loss": 0.014332300424575806, "step": 5460 }, { "epoch": 24.31111111111111, "grad_norm": 0.20337463915348053, "learning_rate": 3.663283855566353e-05, "loss": 0.01195482760667801, "step": 5470 }, { "epoch": 24.355555555555554, "grad_norm": 0.13555671274662018, "learning_rate": 3.65420261607801e-05, "loss": 0.011140601336956024, "step": 5480 }, { "epoch": 24.4, "grad_norm": 0.2225894033908844, "learning_rate": 3.645115078314805e-05, "loss": 0.011093582957983017, "step": 5490 }, { "epoch": 24.444444444444443, "grad_norm": 0.10018553584814072, "learning_rate": 3.636021329766165e-05, "loss": 0.01577068567276001, "step": 5500 }, { "epoch": 24.488888888888887, "grad_norm": 0.3362257182598114, "learning_rate": 3.6269214579813046e-05, "loss": 0.013499508798122405, "step": 5510 }, { "epoch": 24.533333333333335, "grad_norm": 0.2308507263660431, "learning_rate": 3.6178155505683964e-05, "loss": 0.011980080604553222, "step": 5520 }, { "epoch": 24.57777777777778, "grad_norm": 0.17472414672374725, "learning_rate": 3.6087036951937165e-05, "loss": 0.011762392520904542, "step": 5530 }, { "epoch": 24.622222222222224, "grad_norm": 0.23287011682987213, "learning_rate": 3.599585979580806e-05, "loss": 0.012690469622612, "step": 5540 }, { "epoch": 24.666666666666668, "grad_norm": 0.09947798401117325, "learning_rate": 3.5904624915096226e-05, "loss": 0.012333554029464722, "step": 5550 }, { "epoch": 24.711111111111112, "grad_norm": 0.14346957206726074, "learning_rate": 3.5813333188157014e-05, "loss": 0.01637963056564331, "step": 5560 }, { "epoch": 24.755555555555556, "grad_norm": 0.16500172019004822, "learning_rate": 3.5721985493893026e-05, "loss": 0.011947260797023773, "step": 5570 }, { "epoch": 24.8, "grad_norm": 0.2326505184173584, "learning_rate": 3.563058271174569e-05, "loss": 0.012176967412233352, "step": 5580 }, { "epoch": 24.844444444444445, "grad_norm": 0.16783250868320465, "learning_rate": 3.553912572168681e-05, "loss": 0.012898531556129456, "step": 5590 }, { "epoch": 24.88888888888889, "grad_norm": 0.3663642108440399, "learning_rate": 3.544761540421005e-05, "loss": 0.016441190242767335, "step": 5600 }, { "epoch": 24.933333333333334, "grad_norm": 0.2823609411716461, "learning_rate": 3.535605264032246e-05, "loss": 0.011934293806552887, "step": 5610 }, { "epoch": 24.977777777777778, "grad_norm": 0.09860006719827652, "learning_rate": 3.526443831153607e-05, "loss": 0.012221427261829376, "step": 5620 }, { "epoch": 25.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9867470349951758, "eval_iou_background": 0.0, "eval_iou_crop": 0.9867470349951758, "eval_loss": 0.014899875968694687, "eval_mean_accuracy": 0.9867470349951758, "eval_mean_iou": 0.4933735174975879, "eval_overall_accuracy": 0.9867470349951758, "eval_runtime": 5.0471, "eval_samples_per_second": 63.006, "eval_steps_per_second": 7.925, "step": 5625 }, { "epoch": 25.022222222222222, "grad_norm": 0.6275083422660828, "learning_rate": 3.517277329985929e-05, "loss": 0.01147039458155632, "step": 5630 }, { "epoch": 25.066666666666666, "grad_norm": 0.22475898265838623, "learning_rate": 3.508105848778851e-05, "loss": 0.010911081731319428, "step": 5640 }, { "epoch": 25.11111111111111, "grad_norm": 0.16361036896705627, "learning_rate": 3.498929475829955e-05, "loss": 0.010758935660123824, "step": 5650 }, { "epoch": 25.155555555555555, "grad_norm": 0.22789868712425232, "learning_rate": 3.489748299483919e-05, "loss": 0.014520451426506042, "step": 5660 }, { "epoch": 25.2, "grad_norm": 0.08977847546339035, "learning_rate": 3.480562408131663e-05, "loss": 0.01100596711039543, "step": 5670 }, { "epoch": 25.244444444444444, "grad_norm": 0.43810445070266724, "learning_rate": 3.471371890209504e-05, "loss": 0.020305152237415313, "step": 5680 }, { "epoch": 25.288888888888888, "grad_norm": 0.17655257880687714, "learning_rate": 3.462176834198297e-05, "loss": 0.014110589027404785, "step": 5690 }, { "epoch": 25.333333333333332, "grad_norm": 0.17637833952903748, "learning_rate": 3.45297732862259e-05, "loss": 0.01766664832830429, "step": 5700 }, { "epoch": 25.377777777777776, "grad_norm": 1.1034839153289795, "learning_rate": 3.443773462049767e-05, "loss": 0.0161713108420372, "step": 5710 }, { "epoch": 25.42222222222222, "grad_norm": 0.11659952998161316, "learning_rate": 3.434565323089199e-05, "loss": 0.01219017654657364, "step": 5720 }, { "epoch": 25.466666666666665, "grad_norm": 0.2809595763683319, "learning_rate": 3.4253530003913863e-05, "loss": 0.014115968346595764, "step": 5730 }, { "epoch": 25.511111111111113, "grad_norm": 0.33750391006469727, "learning_rate": 3.4161365826471086e-05, "loss": 0.013754937052726745, "step": 5740 }, { "epoch": 25.555555555555557, "grad_norm": 0.164851576089859, "learning_rate": 3.4069161585865736e-05, "loss": 0.010193625837564469, "step": 5750 }, { "epoch": 25.6, "grad_norm": 0.3351067900657654, "learning_rate": 3.397691816978553e-05, "loss": 0.010195306688547134, "step": 5760 }, { "epoch": 25.644444444444446, "grad_norm": 0.20620349049568176, "learning_rate": 3.388463646629541e-05, "loss": 0.010879864543676376, "step": 5770 }, { "epoch": 25.68888888888889, "grad_norm": 0.285849928855896, "learning_rate": 3.3792317363828886e-05, "loss": 0.011786533892154694, "step": 5780 }, { "epoch": 25.733333333333334, "grad_norm": 0.1767425388097763, "learning_rate": 3.369996175117953e-05, "loss": 0.011195920407772064, "step": 5790 }, { "epoch": 25.77777777777778, "grad_norm": 0.11831331998109818, "learning_rate": 3.360757051749242e-05, "loss": 0.011466329544782638, "step": 5800 }, { "epoch": 25.822222222222223, "grad_norm": 1.135332465171814, "learning_rate": 3.351514455225556e-05, "loss": 0.011681647598743438, "step": 5810 }, { "epoch": 25.866666666666667, "grad_norm": 0.2006159871816635, "learning_rate": 3.342268474529136e-05, "loss": 0.01074204444885254, "step": 5820 }, { "epoch": 25.91111111111111, "grad_norm": 0.15597520768642426, "learning_rate": 3.333019198674798e-05, "loss": 0.014154984056949616, "step": 5830 }, { "epoch": 25.955555555555556, "grad_norm": 0.20347462594509125, "learning_rate": 3.323766716709088e-05, "loss": 0.010158039629459381, "step": 5840 }, { "epoch": 26.0, "grad_norm": 0.24911624193191528, "learning_rate": 3.314511117709415e-05, "loss": 0.011566416174173356, "step": 5850 }, { "epoch": 26.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9844452600719147, "eval_iou_background": 0.0, "eval_iou_crop": 0.9844452600719147, "eval_loss": 0.016405673697590828, "eval_mean_accuracy": 0.9844452600719147, "eval_mean_iou": 0.49222263003595734, "eval_overall_accuracy": 0.9844452600719147, "eval_runtime": 4.8416, "eval_samples_per_second": 65.68, "eval_steps_per_second": 8.262, "step": 5850 }, { "epoch": 26.044444444444444, "grad_norm": 0.10023295879364014, "learning_rate": 3.305252490783199e-05, "loss": 0.011167434602975845, "step": 5860 }, { "epoch": 26.08888888888889, "grad_norm": 0.3265562951564789, "learning_rate": 3.2959909250670084e-05, "loss": 0.010879386961460114, "step": 5870 }, { "epoch": 26.133333333333333, "grad_norm": 0.2507272958755493, "learning_rate": 3.2867265097257055e-05, "loss": 0.010885369777679444, "step": 5880 }, { "epoch": 26.177777777777777, "grad_norm": 0.2532482445240021, "learning_rate": 3.27745933395159e-05, "loss": 0.01658028960227966, "step": 5890 }, { "epoch": 26.22222222222222, "grad_norm": 0.10449657589197159, "learning_rate": 3.268189486963532e-05, "loss": 0.009108587354421615, "step": 5900 }, { "epoch": 26.266666666666666, "grad_norm": 0.31126868724823, "learning_rate": 3.2589170580061255e-05, "loss": 0.011730895936489105, "step": 5910 }, { "epoch": 26.31111111111111, "grad_norm": 0.30979806184768677, "learning_rate": 3.249642136348814e-05, "loss": 0.012382631748914718, "step": 5920 }, { "epoch": 26.355555555555554, "grad_norm": 0.17805983126163483, "learning_rate": 3.240364811285046e-05, "loss": 0.011482105404138566, "step": 5930 }, { "epoch": 26.4, "grad_norm": 0.15789909660816193, "learning_rate": 3.2310851721314056e-05, "loss": 0.011602327227592468, "step": 5940 }, { "epoch": 26.444444444444443, "grad_norm": 0.28331345319747925, "learning_rate": 3.221803308226755e-05, "loss": 0.012444787472486497, "step": 5950 }, { "epoch": 26.488888888888887, "grad_norm": 0.4744703471660614, "learning_rate": 3.212519308931377e-05, "loss": 0.012493985146284104, "step": 5960 }, { "epoch": 26.533333333333335, "grad_norm": 0.11163220554590225, "learning_rate": 3.203233263626111e-05, "loss": 0.011258383095264436, "step": 5970 }, { "epoch": 26.57777777777778, "grad_norm": 0.13809651136398315, "learning_rate": 3.1939452617114965e-05, "loss": 0.016604061424732208, "step": 5980 }, { "epoch": 26.622222222222224, "grad_norm": 0.191380113363266, "learning_rate": 3.184655392606904e-05, "loss": 0.011605524271726609, "step": 5990 }, { "epoch": 26.666666666666668, "grad_norm": 0.330387145280838, "learning_rate": 3.17536374574969e-05, "loss": 0.010701074451208114, "step": 6000 }, { "epoch": 26.711111111111112, "grad_norm": 0.1112818568944931, "learning_rate": 3.166070410594317e-05, "loss": 0.010595397651195526, "step": 6010 }, { "epoch": 26.755555555555556, "grad_norm": 0.11170977354049683, "learning_rate": 3.156775476611508e-05, "loss": 0.015293391048908233, "step": 6020 }, { "epoch": 26.8, "grad_norm": 0.13096198439598083, "learning_rate": 3.147479033287373e-05, "loss": 0.00949217975139618, "step": 6030 }, { "epoch": 26.844444444444445, "grad_norm": 0.21226289868354797, "learning_rate": 3.138181170122557e-05, "loss": 0.012370071560144424, "step": 6040 }, { "epoch": 26.88888888888889, "grad_norm": 0.36949422955513, "learning_rate": 3.128881976631373e-05, "loss": 0.011191224306821823, "step": 6050 }, { "epoch": 26.933333333333334, "grad_norm": 0.19004829227924347, "learning_rate": 3.119581542340942e-05, "loss": 0.012466524541378022, "step": 6060 }, { "epoch": 26.977777777777778, "grad_norm": 0.08695580810308456, "learning_rate": 3.11027995679033e-05, "loss": 0.01224166750907898, "step": 6070 }, { "epoch": 27.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9880429312071487, "eval_iou_background": 0.0, "eval_iou_crop": 0.9880429312071487, "eval_loss": 0.01458834670484066, "eval_mean_accuracy": 0.9880429312071487, "eval_mean_iou": 0.49402146560357435, "eval_overall_accuracy": 0.9880429312071487, "eval_runtime": 4.2387, "eval_samples_per_second": 75.023, "eval_steps_per_second": 9.437, "step": 6075 }, { "epoch": 27.022222222222222, "grad_norm": 0.18274766206741333, "learning_rate": 3.1009773095296873e-05, "loss": 0.011431704461574554, "step": 6080 }, { "epoch": 27.066666666666666, "grad_norm": 0.15859104692935944, "learning_rate": 3.0916736901193854e-05, "loss": 0.0103001207113266, "step": 6090 }, { "epoch": 27.11111111111111, "grad_norm": 0.642759382724762, "learning_rate": 3.082369188129156e-05, "loss": 0.010660682618618012, "step": 6100 }, { "epoch": 27.155555555555555, "grad_norm": 0.14561355113983154, "learning_rate": 3.073063893137226e-05, "loss": 0.010623028129339218, "step": 6110 }, { "epoch": 27.2, "grad_norm": 0.0921848937869072, "learning_rate": 3.063757894729457e-05, "loss": 0.01016542837023735, "step": 6120 }, { "epoch": 27.244444444444444, "grad_norm": 0.1914316862821579, "learning_rate": 3.054451282498485e-05, "loss": 0.008079152554273605, "step": 6130 }, { "epoch": 27.288888888888888, "grad_norm": 0.2698880434036255, "learning_rate": 3.045144146042853e-05, "loss": 0.01516740620136261, "step": 6140 }, { "epoch": 27.333333333333332, "grad_norm": 0.6637910008430481, "learning_rate": 3.0358365749661517e-05, "loss": 0.010320000350475311, "step": 6150 }, { "epoch": 27.377777777777776, "grad_norm": 0.20076143741607666, "learning_rate": 3.0265286588761588e-05, "loss": 0.012548622488975526, "step": 6160 }, { "epoch": 27.42222222222222, "grad_norm": 0.7379605174064636, "learning_rate": 3.0172204873839676e-05, "loss": 0.013736668229103088, "step": 6170 }, { "epoch": 27.466666666666665, "grad_norm": 0.38915207982063293, "learning_rate": 3.0079121501031354e-05, "loss": 0.01312054693698883, "step": 6180 }, { "epoch": 27.511111111111113, "grad_norm": 0.1722690761089325, "learning_rate": 2.9986037366488142e-05, "loss": 0.014683559536933899, "step": 6190 }, { "epoch": 27.555555555555557, "grad_norm": 0.10579387843608856, "learning_rate": 2.989295336636888e-05, "loss": 0.010989271104335785, "step": 6200 }, { "epoch": 27.6, "grad_norm": 0.16910874843597412, "learning_rate": 2.979987039683113e-05, "loss": 0.009782166033983231, "step": 6210 }, { "epoch": 27.644444444444446, "grad_norm": 0.2963481545448303, "learning_rate": 2.9706789354022535e-05, "loss": 0.013343298435211181, "step": 6220 }, { "epoch": 27.68888888888889, "grad_norm": 0.3728535771369934, "learning_rate": 2.961371113407217e-05, "loss": 0.012581153213977814, "step": 6230 }, { "epoch": 27.733333333333334, "grad_norm": 0.11326458305120468, "learning_rate": 2.9520636633081944e-05, "loss": 0.01098373755812645, "step": 6240 }, { "epoch": 27.77777777777778, "grad_norm": 0.1970817893743515, "learning_rate": 2.9427566747117953e-05, "loss": 0.014856463670730591, "step": 6250 }, { "epoch": 27.822222222222223, "grad_norm": 0.11784834414720535, "learning_rate": 2.9334502372201907e-05, "loss": 0.011664532124996185, "step": 6260 }, { "epoch": 27.866666666666667, "grad_norm": 0.3700436055660248, "learning_rate": 2.9241444404302383e-05, "loss": 0.012449257820844651, "step": 6270 }, { "epoch": 27.91111111111111, "grad_norm": 0.12162601202726364, "learning_rate": 2.9148393739326323e-05, "loss": 0.011024379730224609, "step": 6280 }, { "epoch": 27.955555555555556, "grad_norm": 0.4037908911705017, "learning_rate": 2.9055351273110377e-05, "loss": 0.010775818675756454, "step": 6290 }, { "epoch": 28.0, "grad_norm": 0.12008745223283768, "learning_rate": 2.8962317901412207e-05, "loss": 0.008546200394630433, "step": 6300 }, { "epoch": 28.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9863816183299677, "eval_iou_background": 0.0, "eval_iou_crop": 0.9863816183299677, "eval_loss": 0.016118589788675308, "eval_mean_accuracy": 0.9863816183299677, "eval_mean_iou": 0.49319080916498387, "eval_overall_accuracy": 0.9863816183299677, "eval_runtime": 4.9918, "eval_samples_per_second": 63.705, "eval_steps_per_second": 8.013, "step": 6300 }, { "epoch": 28.044444444444444, "grad_norm": 0.3273818790912628, "learning_rate": 2.886929451990196e-05, "loss": 0.010573575645685196, "step": 6310 }, { "epoch": 28.08888888888889, "grad_norm": 0.13690316677093506, "learning_rate": 2.8776282024153604e-05, "loss": 0.010925211012363434, "step": 6320 }, { "epoch": 28.133333333333333, "grad_norm": 1.3951421976089478, "learning_rate": 2.8683281309636287e-05, "loss": 0.010952311009168625, "step": 6330 }, { "epoch": 28.177777777777777, "grad_norm": 0.17371580004692078, "learning_rate": 2.8590293271705737e-05, "loss": 0.015090391039848328, "step": 6340 }, { "epoch": 28.22222222222222, "grad_norm": 0.21769016981124878, "learning_rate": 2.8497318805595643e-05, "loss": 0.01143813282251358, "step": 6350 }, { "epoch": 28.266666666666666, "grad_norm": 0.3074902296066284, "learning_rate": 2.8404358806409034e-05, "loss": 0.01333291232585907, "step": 6360 }, { "epoch": 28.31111111111111, "grad_norm": 0.17221790552139282, "learning_rate": 2.831141416910967e-05, "loss": 0.01153416559100151, "step": 6370 }, { "epoch": 28.355555555555554, "grad_norm": 0.14881093800067902, "learning_rate": 2.821848578851339e-05, "loss": 0.010437451303005219, "step": 6380 }, { "epoch": 28.4, "grad_norm": 0.31512516736984253, "learning_rate": 2.8125574559279544e-05, "loss": 0.01140696331858635, "step": 6390 }, { "epoch": 28.444444444444443, "grad_norm": 0.19587089121341705, "learning_rate": 2.803268137590236e-05, "loss": 0.012051345407962799, "step": 6400 }, { "epoch": 28.488888888888887, "grad_norm": 0.393690824508667, "learning_rate": 2.7939807132702316e-05, "loss": 0.014799095690250397, "step": 6410 }, { "epoch": 28.533333333333335, "grad_norm": 0.1491280347108841, "learning_rate": 2.784695272381755e-05, "loss": 0.010019892454147339, "step": 6420 }, { "epoch": 28.57777777777778, "grad_norm": 0.11496465653181076, "learning_rate": 2.7754119043195256e-05, "loss": 0.01111874207854271, "step": 6430 }, { "epoch": 28.622222222222224, "grad_norm": 0.11041788756847382, "learning_rate": 2.7661306984583073e-05, "loss": 0.009301931411027909, "step": 6440 }, { "epoch": 28.666666666666668, "grad_norm": 0.08826632052659988, "learning_rate": 2.7568517441520442e-05, "loss": 0.010417788475751876, "step": 6450 }, { "epoch": 28.711111111111112, "grad_norm": 0.11172500997781754, "learning_rate": 2.747575130733008e-05, "loss": 0.010028854012489319, "step": 6460 }, { "epoch": 28.755555555555556, "grad_norm": 0.39798468351364136, "learning_rate": 2.738300947510932e-05, "loss": 0.01048857569694519, "step": 6470 }, { "epoch": 28.8, "grad_norm": 0.1887478232383728, "learning_rate": 2.729029283772152e-05, "loss": 0.00968843698501587, "step": 6480 }, { "epoch": 28.844444444444445, "grad_norm": 0.5798330307006836, "learning_rate": 2.7197602287787488e-05, "loss": 0.01351466476917267, "step": 6490 }, { "epoch": 28.88888888888889, "grad_norm": 0.4834788739681244, "learning_rate": 2.7104938717676867e-05, "loss": 0.011734419316053391, "step": 6500 }, { "epoch": 28.933333333333334, "grad_norm": 0.1687028706073761, "learning_rate": 2.7012303019499597e-05, "loss": 0.009863308817148208, "step": 6510 }, { "epoch": 28.977777777777778, "grad_norm": 0.0730297863483429, "learning_rate": 2.691969608509721e-05, "loss": 0.012214501202106477, "step": 6520 }, { "epoch": 29.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9850724734076571, "eval_iou_background": 0.0, "eval_iou_crop": 0.9850724734076571, "eval_loss": 0.015054170042276382, "eval_mean_accuracy": 0.9850724734076571, "eval_mean_iou": 0.49253623670382857, "eval_overall_accuracy": 0.9850724734076571, "eval_runtime": 5.2949, "eval_samples_per_second": 60.057, "eval_steps_per_second": 7.554, "step": 6525 }, { "epoch": 29.022222222222222, "grad_norm": 0.08802998811006546, "learning_rate": 2.6827118806034366e-05, "loss": 0.01121232882142067, "step": 6530 }, { "epoch": 29.066666666666666, "grad_norm": 0.13001635670661926, "learning_rate": 2.6734572073590236e-05, "loss": 0.013424272835254668, "step": 6540 }, { "epoch": 29.11111111111111, "grad_norm": 0.15384559333324432, "learning_rate": 2.6642056778749854e-05, "loss": 0.009384750574827194, "step": 6550 }, { "epoch": 29.155555555555555, "grad_norm": 0.39465025067329407, "learning_rate": 2.654957381219562e-05, "loss": 0.012998400628566742, "step": 6560 }, { "epoch": 29.2, "grad_norm": 0.18288381397724152, "learning_rate": 2.645712406429871e-05, "loss": 0.010790080577135087, "step": 6570 }, { "epoch": 29.244444444444444, "grad_norm": 0.10786467790603638, "learning_rate": 2.6364708425110492e-05, "loss": 0.009722784906625748, "step": 6580 }, { "epoch": 29.288888888888888, "grad_norm": 0.22115680575370789, "learning_rate": 2.6272327784353895e-05, "loss": 0.01283152997493744, "step": 6590 }, { "epoch": 29.333333333333332, "grad_norm": 0.12815697491168976, "learning_rate": 2.6179983031414982e-05, "loss": 0.008868549764156342, "step": 6600 }, { "epoch": 29.377777777777776, "grad_norm": 0.15104149281978607, "learning_rate": 2.6087675055334266e-05, "loss": 0.010656814277172088, "step": 6610 }, { "epoch": 29.42222222222222, "grad_norm": 0.16669240593910217, "learning_rate": 2.599540474479821e-05, "loss": 0.013940072059631348, "step": 6620 }, { "epoch": 29.466666666666665, "grad_norm": 0.316628098487854, "learning_rate": 2.5903172988130645e-05, "loss": 0.01218143329024315, "step": 6630 }, { "epoch": 29.511111111111113, "grad_norm": 0.11885285377502441, "learning_rate": 2.5810980673284232e-05, "loss": 0.011870156228542327, "step": 6640 }, { "epoch": 29.555555555555557, "grad_norm": 0.15962514281272888, "learning_rate": 2.5718828687831917e-05, "loss": 0.012683700025081634, "step": 6650 }, { "epoch": 29.6, "grad_norm": 0.22314725816249847, "learning_rate": 2.562671791895836e-05, "loss": 0.008866249024868012, "step": 6660 }, { "epoch": 29.644444444444446, "grad_norm": 0.25528484582901, "learning_rate": 2.5534649253451433e-05, "loss": 0.009602761268615723, "step": 6670 }, { "epoch": 29.68888888888889, "grad_norm": 0.10503140836954117, "learning_rate": 2.5442623577693654e-05, "loss": 0.013110527396202087, "step": 6680 }, { "epoch": 29.733333333333334, "grad_norm": 0.45969295501708984, "learning_rate": 2.5350641777653667e-05, "loss": 0.011281903088092803, "step": 6690 }, { "epoch": 29.77777777777778, "grad_norm": 0.11433500051498413, "learning_rate": 2.525870473887768e-05, "loss": 0.01127450168132782, "step": 6700 }, { "epoch": 29.822222222222223, "grad_norm": 0.06937149167060852, "learning_rate": 2.5166813346480995e-05, "loss": 0.00975840985774994, "step": 6710 }, { "epoch": 29.866666666666667, "grad_norm": 0.10273576527833939, "learning_rate": 2.507496848513946e-05, "loss": 0.011079522967338561, "step": 6720 }, { "epoch": 29.91111111111111, "grad_norm": 0.10626525431871414, "learning_rate": 2.4983171039080927e-05, "loss": 0.01035545915365219, "step": 6730 }, { "epoch": 29.955555555555556, "grad_norm": 0.6682873964309692, "learning_rate": 2.4891421892076768e-05, "loss": 0.009857004880905152, "step": 6740 }, { "epoch": 30.0, "grad_norm": 0.18725700676441193, "learning_rate": 2.479972192743337e-05, "loss": 0.011546111106872559, "step": 6750 }, { "epoch": 30.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9860615488765659, "eval_iou_background": 0.0, "eval_iou_crop": 0.9860615488765659, "eval_loss": 0.016514327377080917, "eval_mean_accuracy": 0.9860615488765659, "eval_mean_iou": 0.49303077443828297, "eval_overall_accuracy": 0.9860615488765659, "eval_runtime": 4.9455, "eval_samples_per_second": 64.301, "eval_steps_per_second": 8.088, "step": 6750 }, { "epoch": 30.044444444444444, "grad_norm": 0.09658083319664001, "learning_rate": 2.4708072027983636e-05, "loss": 0.010866087675094605, "step": 6760 }, { "epoch": 30.08888888888889, "grad_norm": 0.775265634059906, "learning_rate": 2.4616473076078426e-05, "loss": 0.011167645454406738, "step": 6770 }, { "epoch": 30.133333333333333, "grad_norm": 0.4111640751361847, "learning_rate": 2.452492595357813e-05, "loss": 0.010454432666301727, "step": 6780 }, { "epoch": 30.177777777777777, "grad_norm": 0.09661434590816498, "learning_rate": 2.4433431541844195e-05, "loss": 0.009932644665241241, "step": 6790 }, { "epoch": 30.22222222222222, "grad_norm": 0.1857939064502716, "learning_rate": 2.434199072173052e-05, "loss": 0.010906673967838287, "step": 6800 }, { "epoch": 30.266666666666666, "grad_norm": 0.17614109814167023, "learning_rate": 2.4250604373575115e-05, "loss": 0.010186655074357986, "step": 6810 }, { "epoch": 30.31111111111111, "grad_norm": 0.22867712378501892, "learning_rate": 2.4159273377191558e-05, "loss": 0.009553482383489608, "step": 6820 }, { "epoch": 30.355555555555554, "grad_norm": 1.5361841917037964, "learning_rate": 2.4067998611860533e-05, "loss": 0.009537860751152039, "step": 6830 }, { "epoch": 30.4, "grad_norm": 0.26202863454818726, "learning_rate": 2.3976780956321325e-05, "loss": 0.015572449564933777, "step": 6840 }, { "epoch": 30.444444444444443, "grad_norm": 0.37827956676483154, "learning_rate": 2.3885621288763457e-05, "loss": 0.009512580186128616, "step": 6850 }, { "epoch": 30.488888888888887, "grad_norm": 0.7923609614372253, "learning_rate": 2.3794520486818148e-05, "loss": 0.015737615525722504, "step": 6860 }, { "epoch": 30.533333333333335, "grad_norm": 0.20107302069664001, "learning_rate": 2.3703479427549902e-05, "loss": 0.01286223828792572, "step": 6870 }, { "epoch": 30.57777777777778, "grad_norm": 0.25387513637542725, "learning_rate": 2.3612498987448038e-05, "loss": 0.013643796741962432, "step": 6880 }, { "epoch": 30.622222222222224, "grad_norm": 0.1061081737279892, "learning_rate": 2.35215800424183e-05, "loss": 0.00965401455760002, "step": 6890 }, { "epoch": 30.666666666666668, "grad_norm": 0.5697869658470154, "learning_rate": 2.3430723467774374e-05, "loss": 0.010193152725696564, "step": 6900 }, { "epoch": 30.711111111111112, "grad_norm": 0.15205205976963043, "learning_rate": 2.3339930138229477e-05, "loss": 0.01098535880446434, "step": 6910 }, { "epoch": 30.755555555555556, "grad_norm": 0.14245957136154175, "learning_rate": 2.3249200927887952e-05, "loss": 0.01170566827058792, "step": 6920 }, { "epoch": 30.8, "grad_norm": 0.1448567509651184, "learning_rate": 2.3158536710236842e-05, "loss": 0.009716469794511795, "step": 6930 }, { "epoch": 30.844444444444445, "grad_norm": 0.7255468964576721, "learning_rate": 2.306793835813747e-05, "loss": 0.010287973284721374, "step": 6940 }, { "epoch": 30.88888888888889, "grad_norm": 0.6124976277351379, "learning_rate": 2.2977406743817044e-05, "loss": 0.01724327802658081, "step": 6950 }, { "epoch": 30.933333333333334, "grad_norm": 0.12847739458084106, "learning_rate": 2.288694273886026e-05, "loss": 0.008896269649267197, "step": 6960 }, { "epoch": 30.977777777777778, "grad_norm": 0.3263874053955078, "learning_rate": 2.279654721420093e-05, "loss": 0.011659268289804459, "step": 6970 }, { "epoch": 31.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9848313037942744, "eval_iou_background": 0.0, "eval_iou_crop": 0.9848313037942744, "eval_loss": 0.016041168943047523, "eval_mean_accuracy": 0.9848313037942744, "eval_mean_iou": 0.4924156518971372, "eval_overall_accuracy": 0.9848313037942744, "eval_runtime": 5.0684, "eval_samples_per_second": 62.742, "eval_steps_per_second": 7.892, "step": 6975 }, { "epoch": 31.022222222222222, "grad_norm": 0.16682875156402588, "learning_rate": 2.2706221040113546e-05, "loss": 0.00912664234638214, "step": 6980 }, { "epoch": 31.066666666666666, "grad_norm": 0.14082539081573486, "learning_rate": 2.2615965086204958e-05, "loss": 0.010323713719844817, "step": 6990 }, { "epoch": 31.11111111111111, "grad_norm": 0.17910431325435638, "learning_rate": 2.2525780221405975e-05, "loss": 0.010289929062128066, "step": 7000 }, { "epoch": 31.155555555555555, "grad_norm": 0.232297882437706, "learning_rate": 2.2435667313962997e-05, "loss": 0.011357175558805466, "step": 7010 }, { "epoch": 31.2, "grad_norm": 0.09302005171775818, "learning_rate": 2.2345627231429654e-05, "loss": 0.010168468952178955, "step": 7020 }, { "epoch": 31.244444444444444, "grad_norm": 0.2787386178970337, "learning_rate": 2.2255660840658474e-05, "loss": 0.00917961224913597, "step": 7030 }, { "epoch": 31.288888888888888, "grad_norm": 0.1925794631242752, "learning_rate": 2.216576900779251e-05, "loss": 0.013990086317062379, "step": 7040 }, { "epoch": 31.333333333333332, "grad_norm": 0.22789886593818665, "learning_rate": 2.2075952598257055e-05, "loss": 0.009609445929527283, "step": 7050 }, { "epoch": 31.377777777777776, "grad_norm": 0.24586650729179382, "learning_rate": 2.1986212476751206e-05, "loss": 0.01113196536898613, "step": 7060 }, { "epoch": 31.42222222222222, "grad_norm": 0.1293639838695526, "learning_rate": 2.1896549507239657e-05, "loss": 0.011127153784036637, "step": 7070 }, { "epoch": 31.466666666666665, "grad_norm": 2.9639546871185303, "learning_rate": 2.1806964552944326e-05, "loss": 0.01163620948791504, "step": 7080 }, { "epoch": 31.511111111111113, "grad_norm": 0.14920338988304138, "learning_rate": 2.171745847633599e-05, "loss": 0.013256612420082092, "step": 7090 }, { "epoch": 31.555555555555557, "grad_norm": 0.10384750366210938, "learning_rate": 2.162803213912611e-05, "loss": 0.011627873778343201, "step": 7100 }, { "epoch": 31.6, "grad_norm": 0.16100211441516876, "learning_rate": 2.1538686402258426e-05, "loss": 0.010562192648649216, "step": 7110 }, { "epoch": 31.644444444444446, "grad_norm": 0.19589664041996002, "learning_rate": 2.1449422125900716e-05, "loss": 0.010439652204513549, "step": 7120 }, { "epoch": 31.68888888888889, "grad_norm": 0.27025485038757324, "learning_rate": 2.13602401694365e-05, "loss": 0.010094983130693435, "step": 7130 }, { "epoch": 31.733333333333334, "grad_norm": 0.17635492980480194, "learning_rate": 2.1271141391456764e-05, "loss": 0.009413100033998489, "step": 7140 }, { "epoch": 31.77777777777778, "grad_norm": 0.3619304299354553, "learning_rate": 2.118212664975172e-05, "loss": 0.010358908772468567, "step": 7150 }, { "epoch": 31.822222222222223, "grad_norm": 0.2444721907377243, "learning_rate": 2.109319680130251e-05, "loss": 0.010250823199748993, "step": 7160 }, { "epoch": 31.866666666666667, "grad_norm": 0.13545142114162445, "learning_rate": 2.100435270227298e-05, "loss": 0.01089079976081848, "step": 7170 }, { "epoch": 31.91111111111111, "grad_norm": 0.1618206799030304, "learning_rate": 2.0915595208001442e-05, "loss": 0.009754135459661483, "step": 7180 }, { "epoch": 31.955555555555556, "grad_norm": 0.18217962980270386, "learning_rate": 2.0826925172992423e-05, "loss": 0.010863299667835235, "step": 7190 }, { "epoch": 32.0, "grad_norm": 0.17610441148281097, "learning_rate": 2.073834345090842e-05, "loss": 0.010512910783290863, "step": 7200 }, { "epoch": 32.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9882703674012789, "eval_iou_background": 0.0, "eval_iou_crop": 0.9882703674012789, "eval_loss": 0.01614859327673912, "eval_mean_accuracy": 0.9882703674012789, "eval_mean_iou": 0.49413518370063947, "eval_overall_accuracy": 0.9882703674012789, "eval_runtime": 4.3816, "eval_samples_per_second": 72.577, "eval_steps_per_second": 9.129, "step": 7200 }, { "epoch": 32.044444444444444, "grad_norm": 0.1752193421125412, "learning_rate": 2.0649850894561745e-05, "loss": 0.011098603904247283, "step": 7210 }, { "epoch": 32.08888888888889, "grad_norm": 0.12485916167497635, "learning_rate": 2.0561448355906257e-05, "loss": 0.009263231605291366, "step": 7220 }, { "epoch": 32.13333333333333, "grad_norm": 0.16271120309829712, "learning_rate": 2.0473136686029166e-05, "loss": 0.008045147359371185, "step": 7230 }, { "epoch": 32.17777777777778, "grad_norm": 0.13527393341064453, "learning_rate": 2.038491673514287e-05, "loss": 0.011750352382659913, "step": 7240 }, { "epoch": 32.22222222222222, "grad_norm": 0.11836022883653641, "learning_rate": 2.0296789352576738e-05, "loss": 0.010277514904737472, "step": 7250 }, { "epoch": 32.266666666666666, "grad_norm": 0.10061638802289963, "learning_rate": 2.0208755386768968e-05, "loss": 0.012383222579956055, "step": 7260 }, { "epoch": 32.31111111111111, "grad_norm": 0.5306994318962097, "learning_rate": 2.0120815685258365e-05, "loss": 0.012659221887588501, "step": 7270 }, { "epoch": 32.355555555555554, "grad_norm": 0.18847441673278809, "learning_rate": 2.003297109467623e-05, "loss": 0.010454923659563065, "step": 7280 }, { "epoch": 32.4, "grad_norm": 0.10300065577030182, "learning_rate": 1.994522246073819e-05, "loss": 0.009790068119764328, "step": 7290 }, { "epoch": 32.44444444444444, "grad_norm": 0.12303325533866882, "learning_rate": 1.985757062823609e-05, "loss": 0.010908884555101394, "step": 7300 }, { "epoch": 32.48888888888889, "grad_norm": 0.139863982796669, "learning_rate": 1.9770016441029753e-05, "loss": 0.009946569800376892, "step": 7310 }, { "epoch": 32.53333333333333, "grad_norm": 0.2760835587978363, "learning_rate": 1.9682560742038993e-05, "loss": 0.010641241073608398, "step": 7320 }, { "epoch": 32.577777777777776, "grad_norm": 0.164348766207695, "learning_rate": 1.9595204373235442e-05, "loss": 0.010138192772865295, "step": 7330 }, { "epoch": 32.62222222222222, "grad_norm": 0.20397959649562836, "learning_rate": 1.9507948175634384e-05, "loss": 0.011526837944984436, "step": 7340 }, { "epoch": 32.666666666666664, "grad_norm": 0.18409305810928345, "learning_rate": 1.9420792989286764e-05, "loss": 0.011180511116981507, "step": 7350 }, { "epoch": 32.71111111111111, "grad_norm": 0.1896786391735077, "learning_rate": 1.9333739653271044e-05, "loss": 0.01116919219493866, "step": 7360 }, { "epoch": 32.75555555555555, "grad_norm": 0.42628219723701477, "learning_rate": 1.9246789005685126e-05, "loss": 0.010931698232889175, "step": 7370 }, { "epoch": 32.8, "grad_norm": 0.1807331144809723, "learning_rate": 1.915994188363826e-05, "loss": 0.010138377547264099, "step": 7380 }, { "epoch": 32.84444444444444, "grad_norm": 0.47357308864593506, "learning_rate": 1.9073199123243053e-05, "loss": 0.009827225655317306, "step": 7390 }, { "epoch": 32.888888888888886, "grad_norm": 0.7533900141716003, "learning_rate": 1.8986561559607382e-05, "loss": 0.012663301825523377, "step": 7400 }, { "epoch": 32.93333333333333, "grad_norm": 0.13555842638015747, "learning_rate": 1.8900030026826303e-05, "loss": 0.010066298395395279, "step": 7410 }, { "epoch": 32.977777777777774, "grad_norm": 0.2096281498670578, "learning_rate": 1.881360535797412e-05, "loss": 0.011264577507972717, "step": 7420 }, { "epoch": 33.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9859489886952417, "eval_iou_background": 0.0, "eval_iou_crop": 0.9859489886952417, "eval_loss": 0.015504099428653717, "eval_mean_accuracy": 0.9859489886952417, "eval_mean_iou": 0.49297449434762086, "eval_overall_accuracy": 0.9859489886952417, "eval_runtime": 5.3018, "eval_samples_per_second": 59.979, "eval_steps_per_second": 7.545, "step": 7425 }, { "epoch": 33.022222222222226, "grad_norm": 0.2538856863975525, "learning_rate": 1.8727288385096306e-05, "loss": 0.010771843791007995, "step": 7430 }, { "epoch": 33.06666666666667, "grad_norm": 0.11803525686264038, "learning_rate": 1.8641079939201485e-05, "loss": 0.012811534106731415, "step": 7440 }, { "epoch": 33.111111111111114, "grad_norm": 0.4706506133079529, "learning_rate": 1.8554980850253448e-05, "loss": 0.011524637043476105, "step": 7450 }, { "epoch": 33.15555555555556, "grad_norm": 0.25968462228775024, "learning_rate": 1.8468991947163166e-05, "loss": 0.012441815435886383, "step": 7460 }, { "epoch": 33.2, "grad_norm": 0.8820908665657043, "learning_rate": 1.838311405778083e-05, "loss": 0.013223965466022492, "step": 7470 }, { "epoch": 33.24444444444445, "grad_norm": 0.36212411522865295, "learning_rate": 1.829734800888781e-05, "loss": 0.0092201828956604, "step": 7480 }, { "epoch": 33.28888888888889, "grad_norm": 0.4232669472694397, "learning_rate": 1.8211694626188785e-05, "loss": 0.012005984038114547, "step": 7490 }, { "epoch": 33.333333333333336, "grad_norm": 0.23899516463279724, "learning_rate": 1.8126154734303725e-05, "loss": 0.010467199236154556, "step": 7500 }, { "epoch": 33.37777777777778, "grad_norm": 0.5283910036087036, "learning_rate": 1.8040729156759992e-05, "loss": 0.010115320980548858, "step": 7510 }, { "epoch": 33.422222222222224, "grad_norm": 0.11861249059438705, "learning_rate": 1.7955418715984384e-05, "loss": 0.010419557243585587, "step": 7520 }, { "epoch": 33.46666666666667, "grad_norm": 1.8094379901885986, "learning_rate": 1.787022423329524e-05, "loss": 0.012799093127250671, "step": 7530 }, { "epoch": 33.51111111111111, "grad_norm": 0.09505440294742584, "learning_rate": 1.7785146528894517e-05, "loss": 0.011368632316589355, "step": 7540 }, { "epoch": 33.55555555555556, "grad_norm": 0.12374678254127502, "learning_rate": 1.7700186421859933e-05, "loss": 0.016125121712684633, "step": 7550 }, { "epoch": 33.6, "grad_norm": 0.17453926801681519, "learning_rate": 1.7615344730136974e-05, "loss": 0.008206681907176971, "step": 7560 }, { "epoch": 33.644444444444446, "grad_norm": 0.16836631298065186, "learning_rate": 1.7530622270531164e-05, "loss": 0.011044959723949432, "step": 7570 }, { "epoch": 33.68888888888889, "grad_norm": 0.12782208621501923, "learning_rate": 1.744601985870011e-05, "loss": 0.009859148412942886, "step": 7580 }, { "epoch": 33.733333333333334, "grad_norm": 0.1061973124742508, "learning_rate": 1.7361538309145654e-05, "loss": 0.010578135401010514, "step": 7590 }, { "epoch": 33.77777777777778, "grad_norm": 0.15195927023887634, "learning_rate": 1.7277178435206065e-05, "loss": 0.008789992332458496, "step": 7600 }, { "epoch": 33.82222222222222, "grad_norm": 0.19253112375736237, "learning_rate": 1.7192941049048186e-05, "loss": 0.008525656908750534, "step": 7610 }, { "epoch": 33.86666666666667, "grad_norm": 0.32572317123413086, "learning_rate": 1.7108826961659628e-05, "loss": 0.010634499043226242, "step": 7620 }, { "epoch": 33.91111111111111, "grad_norm": 0.17816489934921265, "learning_rate": 1.702483698284093e-05, "loss": 0.009241054207086563, "step": 7630 }, { "epoch": 33.955555555555556, "grad_norm": 0.15832415223121643, "learning_rate": 1.694097192119781e-05, "loss": 0.009616616368293762, "step": 7640 }, { "epoch": 34.0, "grad_norm": 0.16053107380867004, "learning_rate": 1.6857232584133354e-05, "loss": 0.00886504426598549, "step": 7650 }, { "epoch": 34.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.987349635889356, "eval_iou_background": 0.0, "eval_iou_crop": 0.987349635889356, "eval_loss": 0.016093412414193153, "eval_mean_accuracy": 0.987349635889356, "eval_mean_iou": 0.493674817944678, "eval_overall_accuracy": 0.987349635889356, "eval_runtime": 4.9331, "eval_samples_per_second": 64.463, "eval_steps_per_second": 8.109, "step": 7650 }, { "epoch": 34.044444444444444, "grad_norm": 0.10610102862119675, "learning_rate": 1.677361977784025e-05, "loss": 0.009546398371458053, "step": 7660 }, { "epoch": 34.08888888888889, "grad_norm": 0.22379638254642487, "learning_rate": 1.6690134307293e-05, "loss": 0.0101467065513134, "step": 7670 }, { "epoch": 34.13333333333333, "grad_norm": 0.343379944562912, "learning_rate": 1.660677697624023e-05, "loss": 0.008497150987386704, "step": 7680 }, { "epoch": 34.17777777777778, "grad_norm": 0.22120223939418793, "learning_rate": 1.652354858719689e-05, "loss": 0.010910794883966447, "step": 7690 }, { "epoch": 34.22222222222222, "grad_norm": 0.15080679953098297, "learning_rate": 1.6440449941436545e-05, "loss": 0.010526084899902343, "step": 7700 }, { "epoch": 34.266666666666666, "grad_norm": 0.30526238679885864, "learning_rate": 1.6357481838983673e-05, "loss": 0.011884907633066178, "step": 7710 }, { "epoch": 34.31111111111111, "grad_norm": 0.23559217154979706, "learning_rate": 1.6274645078606004e-05, "loss": 0.0159156933426857, "step": 7720 }, { "epoch": 34.355555555555554, "grad_norm": 0.14082294702529907, "learning_rate": 1.619194045780672e-05, "loss": 0.009219977259635925, "step": 7730 }, { "epoch": 34.4, "grad_norm": 0.2513488829135895, "learning_rate": 1.6109368772816867e-05, "loss": 0.009757281839847564, "step": 7740 }, { "epoch": 34.44444444444444, "grad_norm": 0.09470014274120331, "learning_rate": 1.6026930818587673e-05, "loss": 0.009167073667049408, "step": 7750 }, { "epoch": 34.48888888888889, "grad_norm": 0.13641005754470825, "learning_rate": 1.594462738878288e-05, "loss": 0.011327899992465973, "step": 7760 }, { "epoch": 34.53333333333333, "grad_norm": 0.3275153338909149, "learning_rate": 1.5862459275771085e-05, "loss": 0.009165005385875702, "step": 7770 }, { "epoch": 34.577777777777776, "grad_norm": 0.11175866425037384, "learning_rate": 1.5780427270618186e-05, "loss": 0.009274663031101226, "step": 7780 }, { "epoch": 34.62222222222222, "grad_norm": 0.14954638481140137, "learning_rate": 1.5698532163079673e-05, "loss": 0.009301595389842987, "step": 7790 }, { "epoch": 34.666666666666664, "grad_norm": 0.12754788994789124, "learning_rate": 1.5616774741593088e-05, "loss": 0.010568148642778396, "step": 7800 }, { "epoch": 34.71111111111111, "grad_norm": 0.09315014630556107, "learning_rate": 1.5535155793270387e-05, "loss": 0.011067824810743332, "step": 7810 }, { "epoch": 34.75555555555555, "grad_norm": 0.10851321369409561, "learning_rate": 1.5453676103890412e-05, "loss": 0.008293892443180084, "step": 7820 }, { "epoch": 34.8, "grad_norm": 0.1154833436012268, "learning_rate": 1.5372336457891304e-05, "loss": 0.008684559166431427, "step": 7830 }, { "epoch": 34.84444444444444, "grad_norm": 0.16019223630428314, "learning_rate": 1.529113763836294e-05, "loss": 0.01096649542450905, "step": 7840 }, { "epoch": 34.888888888888886, "grad_norm": 0.1327367126941681, "learning_rate": 1.52100804270394e-05, "loss": 0.013495345413684846, "step": 7850 }, { "epoch": 34.93333333333333, "grad_norm": 0.35757553577423096, "learning_rate": 1.512916560429146e-05, "loss": 0.010800091177225113, "step": 7860 }, { "epoch": 34.977777777777774, "grad_norm": 0.3380919098854065, "learning_rate": 1.5048393949119054e-05, "loss": 0.011361131072044372, "step": 7870 }, { "epoch": 35.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9877207613484494, "eval_iou_background": 0.0, "eval_iou_crop": 0.9877207613484494, "eval_loss": 0.015683069825172424, "eval_mean_accuracy": 0.9877207613484494, "eval_mean_iou": 0.4938603806742247, "eval_overall_accuracy": 0.9877207613484494, "eval_runtime": 4.1983, "eval_samples_per_second": 75.744, "eval_steps_per_second": 9.528, "step": 7875 }, { "epoch": 35.022222222222226, "grad_norm": 0.1441982537508011, "learning_rate": 1.4967766239143765e-05, "loss": 0.009061855077743531, "step": 7880 }, { "epoch": 35.06666666666667, "grad_norm": 0.19607199728488922, "learning_rate": 1.4887283250601386e-05, "loss": 0.009152691811323166, "step": 7890 }, { "epoch": 35.111111111111114, "grad_norm": 0.15149147808551788, "learning_rate": 1.4806945758334407e-05, "loss": 0.008919592201709747, "step": 7900 }, { "epoch": 35.15555555555556, "grad_norm": 0.11700580269098282, "learning_rate": 1.472675453578456e-05, "loss": 0.00888640359044075, "step": 7910 }, { "epoch": 35.2, "grad_norm": 0.24411945044994354, "learning_rate": 1.4646710354985393e-05, "loss": 0.011847062408924103, "step": 7920 }, { "epoch": 35.24444444444445, "grad_norm": 0.6391777992248535, "learning_rate": 1.4566813986554805e-05, "loss": 0.010287994146347046, "step": 7930 }, { "epoch": 35.28888888888889, "grad_norm": 0.2236059457063675, "learning_rate": 1.4487066199687673e-05, "loss": 0.011360323429107666, "step": 7940 }, { "epoch": 35.333333333333336, "grad_norm": 0.13868439197540283, "learning_rate": 1.4407467762148374e-05, "loss": 0.011205317825078965, "step": 7950 }, { "epoch": 35.37777777777778, "grad_norm": 0.20370614528656006, "learning_rate": 1.432801944026348e-05, "loss": 0.008879441767930984, "step": 7960 }, { "epoch": 35.422222222222224, "grad_norm": 1.2366740703582764, "learning_rate": 1.4248721998914309e-05, "loss": 0.012083116173744201, "step": 7970 }, { "epoch": 35.46666666666667, "grad_norm": 0.13267114758491516, "learning_rate": 1.4169576201529635e-05, "loss": 0.008464067429304122, "step": 7980 }, { "epoch": 35.51111111111111, "grad_norm": 0.15909196436405182, "learning_rate": 1.4090582810078239e-05, "loss": 0.010950255393981933, "step": 7990 }, { "epoch": 35.55555555555556, "grad_norm": 0.09778666496276855, "learning_rate": 1.4011742585061657e-05, "loss": 0.009682464599609374, "step": 8000 }, { "epoch": 35.6, "grad_norm": 0.13918869197368622, "learning_rate": 1.393305628550684e-05, "loss": 0.008658059686422349, "step": 8010 }, { "epoch": 35.644444444444446, "grad_norm": 0.15457627177238464, "learning_rate": 1.3854524668958783e-05, "loss": 0.009674222767353058, "step": 8020 }, { "epoch": 35.68888888888889, "grad_norm": 0.10907674580812454, "learning_rate": 1.3776148491473363e-05, "loss": 0.011147359758615494, "step": 8030 }, { "epoch": 35.733333333333334, "grad_norm": 0.32708513736724854, "learning_rate": 1.3697928507609923e-05, "loss": 0.01181158870458603, "step": 8040 }, { "epoch": 35.77777777777778, "grad_norm": 0.075588159263134, "learning_rate": 1.3619865470424104e-05, "loss": 0.008575809746980667, "step": 8050 }, { "epoch": 35.82222222222222, "grad_norm": 0.36726707220077515, "learning_rate": 1.3541960131460512e-05, "loss": 0.00925149917602539, "step": 8060 }, { "epoch": 35.86666666666667, "grad_norm": 0.2146628499031067, "learning_rate": 1.3464213240745564e-05, "loss": 0.011378446221351623, "step": 8070 }, { "epoch": 35.91111111111111, "grad_norm": 0.18562643229961395, "learning_rate": 1.3386625546780227e-05, "loss": 0.00802200585603714, "step": 8080 }, { "epoch": 35.955555555555556, "grad_norm": 0.2347923368215561, "learning_rate": 1.3309197796532805e-05, "loss": 0.009500047564506531, "step": 8090 }, { "epoch": 36.0, "grad_norm": 0.22689056396484375, "learning_rate": 1.323193073543177e-05, "loss": 0.009397213906049728, "step": 8100 }, { "epoch": 36.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9886972343855736, "eval_iou_background": 0.0, "eval_iou_crop": 0.9886972343855736, "eval_loss": 0.016109108924865723, "eval_mean_accuracy": 0.9886972343855736, "eval_mean_iou": 0.4943486171927868, "eval_overall_accuracy": 0.9886972343855736, "eval_runtime": 5.0256, "eval_samples_per_second": 63.276, "eval_steps_per_second": 7.959, "step": 8100 }, { "epoch": 36.044444444444444, "grad_norm": 0.17394810914993286, "learning_rate": 1.3154825107358568e-05, "loss": 0.00973832756280899, "step": 8110 }, { "epoch": 36.08888888888889, "grad_norm": 0.20927636325359344, "learning_rate": 1.307788165464047e-05, "loss": 0.010629218816757203, "step": 8120 }, { "epoch": 36.13333333333333, "grad_norm": 0.15015459060668945, "learning_rate": 1.3001101118043395e-05, "loss": 0.008879870921373368, "step": 8130 }, { "epoch": 36.17777777777778, "grad_norm": 0.1626884788274765, "learning_rate": 1.2924484236764836e-05, "loss": 0.010640408098697662, "step": 8140 }, { "epoch": 36.22222222222222, "grad_norm": 0.21271207928657532, "learning_rate": 1.2848031748426689e-05, "loss": 0.008810238540172577, "step": 8150 }, { "epoch": 36.266666666666666, "grad_norm": 0.2290344387292862, "learning_rate": 1.2771744389068174e-05, "loss": 0.00866846665740013, "step": 8160 }, { "epoch": 36.31111111111111, "grad_norm": 0.452323317527771, "learning_rate": 1.2695622893138756e-05, "loss": 0.010568013787269593, "step": 8170 }, { "epoch": 36.355555555555554, "grad_norm": 0.18893477320671082, "learning_rate": 1.2619667993491061e-05, "loss": 0.017853713035583495, "step": 8180 }, { "epoch": 36.4, "grad_norm": 0.1229911521077156, "learning_rate": 1.2543880421373826e-05, "loss": 0.009917914867401123, "step": 8190 }, { "epoch": 36.44444444444444, "grad_norm": 0.36613601446151733, "learning_rate": 1.246826090642484e-05, "loss": 0.010736520588397979, "step": 8200 }, { "epoch": 36.48888888888889, "grad_norm": 1.054783582687378, "learning_rate": 1.2392810176663964e-05, "loss": 0.010082517564296723, "step": 8210 }, { "epoch": 36.53333333333333, "grad_norm": 0.0944657102227211, "learning_rate": 1.2317528958486071e-05, "loss": 0.008532854914665221, "step": 8220 }, { "epoch": 36.577777777777776, "grad_norm": 0.20097963511943817, "learning_rate": 1.2242417976654123e-05, "loss": 0.010825511068105698, "step": 8230 }, { "epoch": 36.62222222222222, "grad_norm": 0.16960740089416504, "learning_rate": 1.216747795429208e-05, "loss": 0.009948232769966125, "step": 8240 }, { "epoch": 36.666666666666664, "grad_norm": 0.6997804641723633, "learning_rate": 1.209270961287805e-05, "loss": 0.01187824159860611, "step": 8250 }, { "epoch": 36.71111111111111, "grad_norm": 0.2355063408613205, "learning_rate": 1.2018113672237302e-05, "loss": 0.010560347139835358, "step": 8260 }, { "epoch": 36.75555555555555, "grad_norm": 0.14960607886314392, "learning_rate": 1.1943690850535296e-05, "loss": 0.009540726989507675, "step": 8270 }, { "epoch": 36.8, "grad_norm": 0.14744175970554352, "learning_rate": 1.1869441864270824e-05, "loss": 0.010541623830795288, "step": 8280 }, { "epoch": 36.84444444444444, "grad_norm": 0.14729435741901398, "learning_rate": 1.179536742826913e-05, "loss": 0.008599544316530228, "step": 8290 }, { "epoch": 36.888888888888886, "grad_norm": 0.30318766832351685, "learning_rate": 1.1721468255674949e-05, "loss": 0.011206484586000442, "step": 8300 }, { "epoch": 36.93333333333333, "grad_norm": 0.1659647673368454, "learning_rate": 1.164774505794568e-05, "loss": 0.009773840755224228, "step": 8310 }, { "epoch": 36.977777777777774, "grad_norm": 0.12480331212282181, "learning_rate": 1.1574198544844563e-05, "loss": 0.008205689489841461, "step": 8320 }, { "epoch": 37.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9871156830531491, "eval_iou_background": 0.0, "eval_iou_crop": 0.9871156830531491, "eval_loss": 0.016175413504242897, "eval_mean_accuracy": 0.9871156830531491, "eval_mean_iou": 0.49355784152657456, "eval_overall_accuracy": 0.9871156830531491, "eval_runtime": 4.3564, "eval_samples_per_second": 72.996, "eval_steps_per_second": 9.182, "step": 8325 }, { "epoch": 37.022222222222226, "grad_norm": 0.19714780151844025, "learning_rate": 1.1500829424433825e-05, "loss": 0.008260628581047058, "step": 8330 }, { "epoch": 37.06666666666667, "grad_norm": 0.34514838457107544, "learning_rate": 1.1427638403067817e-05, "loss": 0.010611176490783691, "step": 8340 }, { "epoch": 37.111111111111114, "grad_norm": 0.16801612079143524, "learning_rate": 1.135462618538633e-05, "loss": 0.0086660698056221, "step": 8350 }, { "epoch": 37.15555555555556, "grad_norm": 0.18599268794059753, "learning_rate": 1.1281793474307686e-05, "loss": 0.010147134959697723, "step": 8360 }, { "epoch": 37.2, "grad_norm": 0.09529401361942291, "learning_rate": 1.120914097102205e-05, "loss": 0.010002662241458894, "step": 8370 }, { "epoch": 37.24444444444445, "grad_norm": 0.08701646327972412, "learning_rate": 1.1136669374984623e-05, "loss": 0.008551066368818283, "step": 8380 }, { "epoch": 37.28888888888889, "grad_norm": 0.1116730123758316, "learning_rate": 1.1064379383908969e-05, "loss": 0.012113143503665925, "step": 8390 }, { "epoch": 37.333333333333336, "grad_norm": 0.36920425295829773, "learning_rate": 1.0992271693760256e-05, "loss": 0.009505388885736465, "step": 8400 }, { "epoch": 37.37777777777778, "grad_norm": 0.30732259154319763, "learning_rate": 1.0920346998748564e-05, "loss": 0.00952598825097084, "step": 8410 }, { "epoch": 37.422222222222224, "grad_norm": 0.11631600558757782, "learning_rate": 1.084860599132221e-05, "loss": 0.008099675923585892, "step": 8420 }, { "epoch": 37.46666666666667, "grad_norm": 0.19066797196865082, "learning_rate": 1.077704936216107e-05, "loss": 0.008108977973461152, "step": 8430 }, { "epoch": 37.51111111111111, "grad_norm": 0.19728882610797882, "learning_rate": 1.0705677800169954e-05, "loss": 0.00889047235250473, "step": 8440 }, { "epoch": 37.55555555555556, "grad_norm": 0.11411871016025543, "learning_rate": 1.0634491992471911e-05, "loss": 0.010507308691740037, "step": 8450 }, { "epoch": 37.6, "grad_norm": 0.18581266701221466, "learning_rate": 1.05634926244017e-05, "loss": 0.008106718957424163, "step": 8460 }, { "epoch": 37.644444444444446, "grad_norm": 0.06667740643024445, "learning_rate": 1.0492680379499128e-05, "loss": 0.008549075573682785, "step": 8470 }, { "epoch": 37.68888888888889, "grad_norm": 0.14750997722148895, "learning_rate": 1.0422055939502528e-05, "loss": 0.01161084696650505, "step": 8480 }, { "epoch": 37.733333333333334, "grad_norm": 0.3073539137840271, "learning_rate": 1.0351619984342099e-05, "loss": 0.008877433836460114, "step": 8490 }, { "epoch": 37.77777777777778, "grad_norm": 0.14369788765907288, "learning_rate": 1.028137319213346e-05, "loss": 0.012289269268512726, "step": 8500 }, { "epoch": 37.82222222222222, "grad_norm": 0.1440463364124298, "learning_rate": 1.0211316239171081e-05, "loss": 0.008424662053585052, "step": 8510 }, { "epoch": 37.86666666666667, "grad_norm": 0.17496487498283386, "learning_rate": 1.0141449799921745e-05, "loss": 0.011977940052747726, "step": 8520 }, { "epoch": 37.91111111111111, "grad_norm": 0.15452471375465393, "learning_rate": 1.0071774547018097e-05, "loss": 0.010050833225250244, "step": 8530 }, { "epoch": 37.955555555555556, "grad_norm": 0.2379625290632248, "learning_rate": 1.0002291151252183e-05, "loss": 0.009011054039001464, "step": 8540 }, { "epoch": 38.0, "grad_norm": 0.3319093883037567, "learning_rate": 9.933000281568927e-06, "loss": 0.008132915943861008, "step": 8550 }, { "epoch": 38.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9853259761700941, "eval_iou_background": 0.0, "eval_iou_crop": 0.9853259761700941, "eval_loss": 0.016127141192555428, "eval_mean_accuracy": 0.9853259761700941, "eval_mean_iou": 0.49266298808504705, "eval_overall_accuracy": 0.9853259761700941, "eval_runtime": 4.9914, "eval_samples_per_second": 63.709, "eval_steps_per_second": 8.014, "step": 8550 }, { "epoch": 38.044444444444444, "grad_norm": 0.08342853933572769, "learning_rate": 9.863902605059723e-06, "loss": 0.009858573228120804, "step": 8560 }, { "epoch": 38.08888888888889, "grad_norm": 0.13003942370414734, "learning_rate": 9.794998786956029e-06, "loss": 0.008732558786869049, "step": 8570 }, { "epoch": 38.13333333333333, "grad_norm": 0.16534218192100525, "learning_rate": 9.726289490622964e-06, "loss": 0.008687300235033035, "step": 8580 }, { "epoch": 38.17777777777778, "grad_norm": 0.33109521865844727, "learning_rate": 9.657775377552857e-06, "loss": 0.0142244353890419, "step": 8590 }, { "epoch": 38.22222222222222, "grad_norm": 0.14419220387935638, "learning_rate": 9.589457107358991e-06, "loss": 0.008839359134435653, "step": 8600 }, { "epoch": 38.266666666666666, "grad_norm": 0.1888597309589386, "learning_rate": 9.521335337769154e-06, "loss": 0.014219576120376587, "step": 8610 }, { "epoch": 38.31111111111111, "grad_norm": 0.32233986258506775, "learning_rate": 9.453410724619353e-06, "loss": 0.010401470214128494, "step": 8620 }, { "epoch": 38.355555555555554, "grad_norm": 0.17485755681991577, "learning_rate": 9.38568392184747e-06, "loss": 0.008073202520608901, "step": 8630 }, { "epoch": 38.4, "grad_norm": 0.19004598259925842, "learning_rate": 9.318155581487014e-06, "loss": 0.009592197090387344, "step": 8640 }, { "epoch": 38.44444444444444, "grad_norm": 0.4857015907764435, "learning_rate": 9.2508263536608e-06, "loss": 0.009050561487674713, "step": 8650 }, { "epoch": 38.48888888888889, "grad_norm": 0.16593524813652039, "learning_rate": 9.183696886574706e-06, "loss": 0.010384495556354522, "step": 8660 }, { "epoch": 38.53333333333333, "grad_norm": 0.08969233930110931, "learning_rate": 9.116767826511442e-06, "loss": 0.01090916246175766, "step": 8670 }, { "epoch": 38.577777777777776, "grad_norm": 0.17988525331020355, "learning_rate": 9.050039817824303e-06, "loss": 0.009622099995613097, "step": 8680 }, { "epoch": 38.62222222222222, "grad_norm": 0.12048563361167908, "learning_rate": 8.983513502931007e-06, "loss": 0.008557760715484619, "step": 8690 }, { "epoch": 38.666666666666664, "grad_norm": 0.38834285736083984, "learning_rate": 8.917189522307442e-06, "loss": 0.010668180137872695, "step": 8700 }, { "epoch": 38.71111111111111, "grad_norm": 0.1947161853313446, "learning_rate": 8.851068514481573e-06, "loss": 0.0088848777115345, "step": 8710 }, { "epoch": 38.75555555555555, "grad_norm": 0.16620716452598572, "learning_rate": 8.785151116027257e-06, "loss": 0.009028815478086472, "step": 8720 }, { "epoch": 38.8, "grad_norm": 0.14173457026481628, "learning_rate": 8.719437961558115e-06, "loss": 0.009423910081386567, "step": 8730 }, { "epoch": 38.84444444444444, "grad_norm": 0.2560481131076813, "learning_rate": 8.65392968372144e-06, "loss": 0.009656582772731782, "step": 8740 }, { "epoch": 38.888888888888886, "grad_norm": 0.2174036055803299, "learning_rate": 8.588626913192082e-06, "loss": 0.009034762531518937, "step": 8750 }, { "epoch": 38.93333333333333, "grad_norm": 0.09497933089733124, "learning_rate": 8.523530278666399e-06, "loss": 0.007124392688274384, "step": 8760 }, { "epoch": 38.977777777777774, "grad_norm": 0.31073257327079773, "learning_rate": 8.458640406856172e-06, "loss": 0.008978623151779174, "step": 8770 }, { "epoch": 39.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9862346438156933, "eval_iou_background": 0.0, "eval_iou_crop": 0.9862346438156933, "eval_loss": 0.016855206340551376, "eval_mean_accuracy": 0.9862346438156933, "eval_mean_iou": 0.49311732190784663, "eval_overall_accuracy": 0.9862346438156933, "eval_runtime": 4.9795, "eval_samples_per_second": 63.862, "eval_steps_per_second": 8.033, "step": 8775 }, { "epoch": 39.022222222222226, "grad_norm": 0.27861523628234863, "learning_rate": 8.39395792248261e-06, "loss": 0.009674544632434844, "step": 8780 }, { "epoch": 39.06666666666667, "grad_norm": 0.2110968381166458, "learning_rate": 8.329483448270335e-06, "loss": 0.010200072079896927, "step": 8790 }, { "epoch": 39.111111111111114, "grad_norm": 0.11281915009021759, "learning_rate": 8.265217604941353e-06, "loss": 0.007965505868196488, "step": 8800 }, { "epoch": 39.15555555555556, "grad_norm": 0.34016016125679016, "learning_rate": 8.201161011209072e-06, "loss": 0.010503782331943512, "step": 8810 }, { "epoch": 39.2, "grad_norm": 0.09845948219299316, "learning_rate": 8.13731428377241e-06, "loss": 0.011164815723896026, "step": 8820 }, { "epoch": 39.24444444444445, "grad_norm": 0.1427334100008011, "learning_rate": 8.073678037309802e-06, "loss": 0.008042615652084351, "step": 8830 }, { "epoch": 39.28888888888889, "grad_norm": 0.711721658706665, "learning_rate": 8.010252884473273e-06, "loss": 0.01185576617717743, "step": 8840 }, { "epoch": 39.333333333333336, "grad_norm": 3.748128652572632, "learning_rate": 7.947039435882604e-06, "loss": 0.010901518166065216, "step": 8850 }, { "epoch": 39.37777777777778, "grad_norm": 0.44545602798461914, "learning_rate": 7.884038300119394e-06, "loss": 0.009559103101491929, "step": 8860 }, { "epoch": 39.422222222222224, "grad_norm": 0.08467259258031845, "learning_rate": 7.82125008372122e-06, "loss": 0.0094651959836483, "step": 8870 }, { "epoch": 39.46666666666667, "grad_norm": 0.42417973279953003, "learning_rate": 7.758675391175787e-06, "loss": 0.010829713940620423, "step": 8880 }, { "epoch": 39.51111111111111, "grad_norm": 0.16081629693508148, "learning_rate": 7.696314824915136e-06, "loss": 0.010946983098983764, "step": 8890 }, { "epoch": 39.55555555555556, "grad_norm": 0.14074282348155975, "learning_rate": 7.63416898530982e-06, "loss": 0.009233842045068741, "step": 8900 }, { "epoch": 39.6, "grad_norm": 0.15290798246860504, "learning_rate": 7.5722384706631354e-06, "loss": 0.008949696272611617, "step": 8910 }, { "epoch": 39.644444444444446, "grad_norm": 0.12808571755886078, "learning_rate": 7.510523877205348e-06, "loss": 0.009515069425106049, "step": 8920 }, { "epoch": 39.68888888888889, "grad_norm": 0.09376636892557144, "learning_rate": 7.449025799087971e-06, "loss": 0.009142509847879409, "step": 8930 }, { "epoch": 39.733333333333334, "grad_norm": 0.08920039981603622, "learning_rate": 7.3877448283780435e-06, "loss": 0.009481516480445863, "step": 8940 }, { "epoch": 39.77777777777778, "grad_norm": 0.18315701186656952, "learning_rate": 7.326681555052395e-06, "loss": 0.009099499881267547, "step": 8950 }, { "epoch": 39.82222222222222, "grad_norm": 0.20228026807308197, "learning_rate": 7.265836566992019e-06, "loss": 0.008513420820236206, "step": 8960 }, { "epoch": 39.86666666666667, "grad_norm": 0.1185707300901413, "learning_rate": 7.205210449976385e-06, "loss": 0.009149493277072906, "step": 8970 }, { "epoch": 39.91111111111111, "grad_norm": 0.1808559149503708, "learning_rate": 7.144803787677796e-06, "loss": 0.01176646426320076, "step": 8980 }, { "epoch": 39.955555555555556, "grad_norm": 0.13035795092582703, "learning_rate": 7.084617161655776e-06, "loss": 0.008845588564872742, "step": 8990 }, { "epoch": 40.0, "grad_norm": 0.14816752076148987, "learning_rate": 7.024651151351474e-06, "loss": 0.008386646956205368, "step": 9000 }, { "epoch": 40.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9867986834228744, "eval_iou_background": 0.0, "eval_iou_crop": 0.9867986834228744, "eval_loss": 0.016107862815260887, "eval_mean_accuracy": 0.9867986834228744, "eval_mean_iou": 0.4933993417114372, "eval_overall_accuracy": 0.9867986834228744, "eval_runtime": 4.2491, "eval_samples_per_second": 74.839, "eval_steps_per_second": 9.414, "step": 9000 }, { "epoch": 40.044444444444444, "grad_norm": 0.11442097276449203, "learning_rate": 6.964906334082084e-06, "loss": 0.010162974148988724, "step": 9010 }, { "epoch": 40.08888888888889, "grad_norm": 0.12665948271751404, "learning_rate": 6.905383285035263e-06, "loss": 0.011018770933151244, "step": 9020 }, { "epoch": 40.13333333333333, "grad_norm": 0.30260199308395386, "learning_rate": 6.846082577263643e-06, "loss": 0.00993640273809433, "step": 9030 }, { "epoch": 40.17777777777778, "grad_norm": 0.23481261730194092, "learning_rate": 6.787004781679261e-06, "loss": 0.011438509821891785, "step": 9040 }, { "epoch": 40.22222222222222, "grad_norm": 0.6293283700942993, "learning_rate": 6.7281504670481295e-06, "loss": 0.009909652173519135, "step": 9050 }, { "epoch": 40.266666666666666, "grad_norm": 0.1908373236656189, "learning_rate": 6.669520199984667e-06, "loss": 0.008559158444404602, "step": 9060 }, { "epoch": 40.31111111111111, "grad_norm": 0.2800517976284027, "learning_rate": 6.611114544946326e-06, "loss": 0.010904067754745483, "step": 9070 }, { "epoch": 40.355555555555554, "grad_norm": 0.1679239124059677, "learning_rate": 6.552934064228126e-06, "loss": 0.008476626873016358, "step": 9080 }, { "epoch": 40.4, "grad_norm": 0.3395392894744873, "learning_rate": 6.4949793179572225e-06, "loss": 0.00960720032453537, "step": 9090 }, { "epoch": 40.44444444444444, "grad_norm": 0.15560856461524963, "learning_rate": 6.437250864087544e-06, "loss": 0.010442525893449784, "step": 9100 }, { "epoch": 40.48888888888889, "grad_norm": 0.19684119522571564, "learning_rate": 6.379749258394428e-06, "loss": 0.009402762353420257, "step": 9110 }, { "epoch": 40.53333333333333, "grad_norm": 0.10310734808444977, "learning_rate": 6.322475054469242e-06, "loss": 0.00812251791357994, "step": 9120 }, { "epoch": 40.577777777777776, "grad_norm": 0.3024386465549469, "learning_rate": 6.265428803714043e-06, "loss": 0.009917283803224564, "step": 9130 }, { "epoch": 40.62222222222222, "grad_norm": 0.1136888936161995, "learning_rate": 6.2086110553363095e-06, "loss": 0.009009785205125808, "step": 9140 }, { "epoch": 40.666666666666664, "grad_norm": 0.10895899683237076, "learning_rate": 6.152022356343635e-06, "loss": 0.009647868573665619, "step": 9150 }, { "epoch": 40.71111111111111, "grad_norm": 0.19797876477241516, "learning_rate": 6.095663251538453e-06, "loss": 0.011397708952426911, "step": 9160 }, { "epoch": 40.75555555555555, "grad_norm": 0.09987834841012955, "learning_rate": 6.039534283512813e-06, "loss": 0.00788293182849884, "step": 9170 }, { "epoch": 40.8, "grad_norm": 0.0898575559258461, "learning_rate": 5.9836359926431274e-06, "loss": 0.008983664959669114, "step": 9180 }, { "epoch": 40.84444444444444, "grad_norm": 0.17771229147911072, "learning_rate": 5.927968917085008e-06, "loss": 0.009258570522069931, "step": 9190 }, { "epoch": 40.888888888888886, "grad_norm": 0.1653849333524704, "learning_rate": 5.8725335927680336e-06, "loss": 0.011366803944110871, "step": 9200 }, { "epoch": 40.93333333333333, "grad_norm": 0.1255594789981842, "learning_rate": 5.817330553390638e-06, "loss": 0.010289539396762849, "step": 9210 }, { "epoch": 40.977777777777774, "grad_norm": 0.1295168399810791, "learning_rate": 5.762360330414957e-06, "loss": 0.011482463777065277, "step": 9220 }, { "epoch": 41.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9870389374749735, "eval_iou_background": 0.0, "eval_iou_crop": 0.9870389374749735, "eval_loss": 0.01579268090426922, "eval_mean_accuracy": 0.9870389374749735, "eval_mean_iou": 0.49351946873748676, "eval_overall_accuracy": 0.9870389374749735, "eval_runtime": 4.9573, "eval_samples_per_second": 64.148, "eval_steps_per_second": 8.069, "step": 9225 }, { "epoch": 41.022222222222226, "grad_norm": 0.5648945569992065, "learning_rate": 5.707623453061694e-06, "loss": 0.010472696274518967, "step": 9230 }, { "epoch": 41.06666666666667, "grad_norm": 0.24583551287651062, "learning_rate": 5.653120448305054e-06, "loss": 0.008899197727441788, "step": 9240 }, { "epoch": 41.111111111111114, "grad_norm": 0.17115260660648346, "learning_rate": 5.59885184086764e-06, "loss": 0.008308984339237213, "step": 9250 }, { "epoch": 41.15555555555556, "grad_norm": 0.13256648182868958, "learning_rate": 5.5448181532154385e-06, "loss": 0.008741877973079681, "step": 9260 }, { "epoch": 41.2, "grad_norm": 0.22882330417633057, "learning_rate": 5.491019905552737e-06, "loss": 0.010008525103330612, "step": 9270 }, { "epoch": 41.24444444444445, "grad_norm": 0.14104101061820984, "learning_rate": 5.4374576158171675e-06, "loss": 0.010174065083265304, "step": 9280 }, { "epoch": 41.28888888888889, "grad_norm": 0.13034752011299133, "learning_rate": 5.384131799674691e-06, "loss": 0.009599237143993378, "step": 9290 }, { "epoch": 41.333333333333336, "grad_norm": 0.21091969311237335, "learning_rate": 5.331042970514666e-06, "loss": 0.010817769169807433, "step": 9300 }, { "epoch": 41.37777777777778, "grad_norm": 0.3192712366580963, "learning_rate": 5.278191639444832e-06, "loss": 0.011463935673236846, "step": 9310 }, { "epoch": 41.422222222222224, "grad_norm": 0.13509511947631836, "learning_rate": 5.22557831528648e-06, "loss": 0.008219669759273528, "step": 9320 }, { "epoch": 41.46666666666667, "grad_norm": 0.30441412329673767, "learning_rate": 5.173203504569499e-06, "loss": 0.009334265440702438, "step": 9330 }, { "epoch": 41.51111111111111, "grad_norm": 0.15208688378334045, "learning_rate": 5.121067711527498e-06, "loss": 0.008971913158893586, "step": 9340 }, { "epoch": 41.55555555555556, "grad_norm": 0.1834406554698944, "learning_rate": 5.069171438092973e-06, "loss": 0.009166532754898071, "step": 9350 }, { "epoch": 41.6, "grad_norm": 0.09260621666908264, "learning_rate": 5.017515183892487e-06, "loss": 0.009075510501861572, "step": 9360 }, { "epoch": 41.644444444444446, "grad_norm": 0.12908564507961273, "learning_rate": 4.966099446241831e-06, "loss": 0.00834164097905159, "step": 9370 }, { "epoch": 41.68888888888889, "grad_norm": 0.3206913471221924, "learning_rate": 4.914924720141215e-06, "loss": 0.010787234455347062, "step": 9380 }, { "epoch": 41.733333333333334, "grad_norm": 0.20668160915374756, "learning_rate": 4.86399149827057e-06, "loss": 0.008846065402030945, "step": 9390 }, { "epoch": 41.77777777777778, "grad_norm": 0.44397252798080444, "learning_rate": 4.8133002709847525e-06, "loss": 0.01097593829035759, "step": 9400 }, { "epoch": 41.82222222222222, "grad_norm": 0.20189468562602997, "learning_rate": 4.76285152630884e-06, "loss": 0.00869334414601326, "step": 9410 }, { "epoch": 41.86666666666667, "grad_norm": 0.3745025396347046, "learning_rate": 4.712645749933433e-06, "loss": 0.00862944796681404, "step": 9420 }, { "epoch": 41.91111111111111, "grad_norm": 0.12419744580984116, "learning_rate": 4.662683425209971e-06, "loss": 0.010759425908327102, "step": 9430 }, { "epoch": 41.955555555555556, "grad_norm": 1.051476001739502, "learning_rate": 4.612965033146102e-06, "loss": 0.009813901036977768, "step": 9440 }, { "epoch": 42.0, "grad_norm": 0.2857818901538849, "learning_rate": 4.5634910524010055e-06, "loss": 0.00800687149167061, "step": 9450 }, { "epoch": 42.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9870036075807397, "eval_iou_background": 0.0, "eval_iou_crop": 0.9870036075807397, "eval_loss": 0.016197478398680687, "eval_mean_accuracy": 0.9870036075807397, "eval_mean_iou": 0.49350180379036984, "eval_overall_accuracy": 0.9870036075807397, "eval_runtime": 5.2, "eval_samples_per_second": 61.153, "eval_steps_per_second": 7.692, "step": 9450 }, { "epoch": 42.044444444444444, "grad_norm": 0.0808783769607544, "learning_rate": 4.514261959280843e-06, "loss": 0.00937308594584465, "step": 9460 }, { "epoch": 42.08888888888889, "grad_norm": 0.2844408452510834, "learning_rate": 4.465278227734123e-06, "loss": 0.010046932101249694, "step": 9470 }, { "epoch": 42.13333333333333, "grad_norm": 0.4044899642467499, "learning_rate": 4.416540329347175e-06, "loss": 0.009509791433811188, "step": 9480 }, { "epoch": 42.17777777777778, "grad_norm": 0.16986887156963348, "learning_rate": 4.368048733339582e-06, "loss": 0.009389126300811767, "step": 9490 }, { "epoch": 42.22222222222222, "grad_norm": 0.12908174097537994, "learning_rate": 4.3198039065596754e-06, "loss": 0.009671323001384735, "step": 9500 }, { "epoch": 42.266666666666666, "grad_norm": 0.19733834266662598, "learning_rate": 4.271806313480043e-06, "loss": 0.009784835577011108, "step": 9510 }, { "epoch": 42.31111111111111, "grad_norm": 0.06883057951927185, "learning_rate": 4.2240564161930416e-06, "loss": 0.008562954515218735, "step": 9520 }, { "epoch": 42.355555555555554, "grad_norm": 0.15110228955745697, "learning_rate": 4.176554674406372e-06, "loss": 0.009358204901218414, "step": 9530 }, { "epoch": 42.4, "grad_norm": 0.12839378416538239, "learning_rate": 4.129301545438637e-06, "loss": 0.010094927251338958, "step": 9540 }, { "epoch": 42.44444444444444, "grad_norm": 0.08893191069364548, "learning_rate": 4.082297484214942e-06, "loss": 0.009588159620761871, "step": 9550 }, { "epoch": 42.48888888888889, "grad_norm": 0.3865722119808197, "learning_rate": 4.035542943262518e-06, "loss": 0.00966174602508545, "step": 9560 }, { "epoch": 42.53333333333333, "grad_norm": 0.15124055743217468, "learning_rate": 3.989038372706356e-06, "loss": 0.009892082214355469, "step": 9570 }, { "epoch": 42.577777777777776, "grad_norm": 0.2203996628522873, "learning_rate": 3.942784220264892e-06, "loss": 0.00922955572605133, "step": 9580 }, { "epoch": 42.62222222222222, "grad_norm": 0.1409890204668045, "learning_rate": 3.89678093124568e-06, "loss": 0.008969445526599885, "step": 9590 }, { "epoch": 42.666666666666664, "grad_norm": 0.10689610242843628, "learning_rate": 3.85102894854109e-06, "loss": 0.008726874738931656, "step": 9600 }, { "epoch": 42.71111111111111, "grad_norm": 0.610434889793396, "learning_rate": 3.805528712624102e-06, "loss": 0.01204061508178711, "step": 9610 }, { "epoch": 42.75555555555555, "grad_norm": 0.25447696447372437, "learning_rate": 3.7602806615440042e-06, "loss": 0.00919174700975418, "step": 9620 }, { "epoch": 42.8, "grad_norm": 0.14492172002792358, "learning_rate": 3.7152852309221917e-06, "loss": 0.008265383541584015, "step": 9630 }, { "epoch": 42.84444444444444, "grad_norm": 0.14401572942733765, "learning_rate": 3.6705428539479923e-06, "loss": 0.009117917716503143, "step": 9640 }, { "epoch": 42.888888888888886, "grad_norm": 0.08602733910083771, "learning_rate": 3.6260539613744827e-06, "loss": 0.011313943564891816, "step": 9650 }, { "epoch": 42.93333333333333, "grad_norm": 0.12237777560949326, "learning_rate": 3.581818981514341e-06, "loss": 0.007242021709680557, "step": 9660 }, { "epoch": 42.977777777777774, "grad_norm": 0.07774618268013, "learning_rate": 3.5378383402357216e-06, "loss": 0.009667984396219253, "step": 9670 }, { "epoch": 43.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9873696705245009, "eval_iou_background": 0.0, "eval_iou_crop": 0.9873696705245009, "eval_loss": 0.016740724444389343, "eval_mean_accuracy": 0.9873696705245009, "eval_mean_iou": 0.49368483526225043, "eval_overall_accuracy": 0.9873696705245009, "eval_runtime": 5.002, "eval_samples_per_second": 63.574, "eval_steps_per_second": 7.997, "step": 9675 }, { "epoch": 43.022222222222226, "grad_norm": 0.2042597085237503, "learning_rate": 3.4941124609581578e-06, "loss": 0.014802937209606171, "step": 9680 }, { "epoch": 43.06666666666667, "grad_norm": 0.15077997744083405, "learning_rate": 3.4506417646484934e-06, "loss": 0.008730484545230866, "step": 9690 }, { "epoch": 43.111111111111114, "grad_norm": 0.0969257801771164, "learning_rate": 3.4074266698168056e-06, "loss": 0.008107737451791764, "step": 9700 }, { "epoch": 43.15555555555556, "grad_norm": 0.12220139801502228, "learning_rate": 3.364467592512409e-06, "loss": 0.010306209325790405, "step": 9710 }, { "epoch": 43.2, "grad_norm": 0.1910788118839264, "learning_rate": 3.321764946319821e-06, "loss": 0.010331282764673233, "step": 9720 }, { "epoch": 43.24444444444445, "grad_norm": 0.21679209172725677, "learning_rate": 3.279319142354802e-06, "loss": 0.009432458877563476, "step": 9730 }, { "epoch": 43.28888888888889, "grad_norm": 0.24441024661064148, "learning_rate": 3.237130589260382e-06, "loss": 0.010894263535737992, "step": 9740 }, { "epoch": 43.333333333333336, "grad_norm": 0.09884672611951828, "learning_rate": 3.1951996932029313e-06, "loss": 0.007973553240299225, "step": 9750 }, { "epoch": 43.37777777777778, "grad_norm": 1.3102566003799438, "learning_rate": 3.153526857868262e-06, "loss": 0.010812371224164962, "step": 9760 }, { "epoch": 43.422222222222224, "grad_norm": 0.44917213916778564, "learning_rate": 3.112112484457709e-06, "loss": 0.00949961319565773, "step": 9770 }, { "epoch": 43.46666666666667, "grad_norm": 0.15101133286952972, "learning_rate": 3.070956971684308e-06, "loss": 0.010940992087125779, "step": 9780 }, { "epoch": 43.51111111111111, "grad_norm": 0.2391185164451599, "learning_rate": 3.0300607157689318e-06, "loss": 0.00914691761136055, "step": 9790 }, { "epoch": 43.55555555555556, "grad_norm": 0.1306968331336975, "learning_rate": 2.9894241104364804e-06, "loss": 0.008083894848823547, "step": 9800 }, { "epoch": 43.6, "grad_norm": 0.18575072288513184, "learning_rate": 2.9490475469120926e-06, "loss": 0.009058014303445817, "step": 9810 }, { "epoch": 43.644444444444446, "grad_norm": 0.23239481449127197, "learning_rate": 2.908931413917386e-06, "loss": 0.0093460813164711, "step": 9820 }, { "epoch": 43.68888888888889, "grad_norm": 0.7371838092803955, "learning_rate": 2.8690760976666918e-06, "loss": 0.011135801672935486, "step": 9830 }, { "epoch": 43.733333333333334, "grad_norm": 0.15142948925495148, "learning_rate": 2.8294819818633755e-06, "loss": 0.010835631936788558, "step": 9840 }, { "epoch": 43.77777777777778, "grad_norm": 0.3591817319393158, "learning_rate": 2.790149447696091e-06, "loss": 0.008295612037181854, "step": 9850 }, { "epoch": 43.82222222222222, "grad_norm": 0.14152100682258606, "learning_rate": 2.751078873835157e-06, "loss": 0.009266762435436249, "step": 9860 }, { "epoch": 43.86666666666667, "grad_norm": 0.6529484987258911, "learning_rate": 2.712270636428902e-06, "loss": 0.011058161407709122, "step": 9870 }, { "epoch": 43.91111111111111, "grad_norm": 0.09463955461978912, "learning_rate": 2.673725109100009e-06, "loss": 0.007944537699222565, "step": 9880 }, { "epoch": 43.955555555555556, "grad_norm": 0.5518578886985779, "learning_rate": 2.6354426629419648e-06, "loss": 0.008981087803840637, "step": 9890 }, { "epoch": 44.0, "grad_norm": 0.2325361669063568, "learning_rate": 2.5974236665154606e-06, "loss": 0.008235058933496475, "step": 9900 }, { "epoch": 44.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9867232842583509, "eval_iou_background": 0.0, "eval_iou_crop": 0.9867232842583509, "eval_loss": 0.016649842262268066, "eval_mean_accuracy": 0.9867232842583509, "eval_mean_iou": 0.49336164212917544, "eval_overall_accuracy": 0.9867232842583509, "eval_runtime": 5.033, "eval_samples_per_second": 63.183, "eval_steps_per_second": 7.948, "step": 9900 }, { "epoch": 44.044444444444444, "grad_norm": 0.1768428534269333, "learning_rate": 2.5596684858448503e-06, "loss": 0.009393288940191268, "step": 9910 }, { "epoch": 44.08888888888889, "grad_norm": 0.0958385318517685, "learning_rate": 2.5221774844146237e-06, "loss": 0.009489041566848756, "step": 9920 }, { "epoch": 44.13333333333333, "grad_norm": 0.1517782062292099, "learning_rate": 2.4849510231659145e-06, "loss": 0.008564892411231994, "step": 9930 }, { "epoch": 44.17777777777778, "grad_norm": 0.22501669824123383, "learning_rate": 2.4479894604930198e-06, "loss": 0.009396791458129883, "step": 9940 }, { "epoch": 44.22222222222222, "grad_norm": 0.16278569400310516, "learning_rate": 2.411293152239937e-06, "loss": 0.008301478624343873, "step": 9950 }, { "epoch": 44.266666666666666, "grad_norm": 0.30498072504997253, "learning_rate": 2.3748624516969673e-06, "loss": 0.009221111238002778, "step": 9960 }, { "epoch": 44.31111111111111, "grad_norm": 0.21526700258255005, "learning_rate": 2.338697709597296e-06, "loss": 0.009778054803609848, "step": 9970 }, { "epoch": 44.355555555555554, "grad_norm": 0.7358174324035645, "learning_rate": 2.3027992741136107e-06, "loss": 0.008685538172721862, "step": 9980 }, { "epoch": 44.4, "grad_norm": 0.10848166793584824, "learning_rate": 2.2671674908547622e-06, "loss": 0.008999171108007431, "step": 9990 }, { "epoch": 44.44444444444444, "grad_norm": 0.18759377300739288, "learning_rate": 2.2318027028624365e-06, "loss": 0.008966409415006638, "step": 10000 }, { "epoch": 44.48888888888889, "grad_norm": 0.2606959640979767, "learning_rate": 2.1967052506078413e-06, "loss": 0.01044531911611557, "step": 10010 }, { "epoch": 44.53333333333333, "grad_norm": 0.4822573959827423, "learning_rate": 2.161875471988426e-06, "loss": 0.008816277980804444, "step": 10020 }, { "epoch": 44.577777777777776, "grad_norm": 0.1541290283203125, "learning_rate": 2.127313702324649e-06, "loss": 0.009886687248945236, "step": 10030 }, { "epoch": 44.62222222222222, "grad_norm": 0.09918457269668579, "learning_rate": 2.0930202743567395e-06, "loss": 0.008372654020786286, "step": 10040 }, { "epoch": 44.666666666666664, "grad_norm": 0.23362848162651062, "learning_rate": 2.0589955182414854e-06, "loss": 0.00953168272972107, "step": 10050 }, { "epoch": 44.71111111111111, "grad_norm": 0.18845488131046295, "learning_rate": 2.025239761549058e-06, "loss": 0.00930858999490738, "step": 10060 }, { "epoch": 44.75555555555555, "grad_norm": 0.13237494230270386, "learning_rate": 1.9917533292598732e-06, "loss": 0.009608256071805954, "step": 10070 }, { "epoch": 44.8, "grad_norm": 0.14511226117610931, "learning_rate": 1.958536543761441e-06, "loss": 0.008183569461107255, "step": 10080 }, { "epoch": 44.84444444444444, "grad_norm": 0.23729798197746277, "learning_rate": 1.925589724845278e-06, "loss": 0.009363599121570587, "step": 10090 }, { "epoch": 44.888888888888886, "grad_norm": 0.15703774988651276, "learning_rate": 1.8929131897038132e-06, "loss": 0.012626522779464721, "step": 10100 }, { "epoch": 44.93333333333333, "grad_norm": 0.12241744995117188, "learning_rate": 1.8605072529273538e-06, "loss": 0.007926612347364425, "step": 10110 }, { "epoch": 44.977777777777774, "grad_norm": 0.15030965209007263, "learning_rate": 1.8283722265010505e-06, "loss": 0.00966208428144455, "step": 10120 }, { "epoch": 45.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9872344367372735, "eval_iou_background": 0.0, "eval_iou_crop": 0.9872344367372735, "eval_loss": 0.01683403179049492, "eval_mean_accuracy": 0.9872344367372735, "eval_mean_iou": 0.49361721836863676, "eval_overall_accuracy": 0.9872344367372735, "eval_runtime": 4.3468, "eval_samples_per_second": 73.157, "eval_steps_per_second": 9.202, "step": 10125 }, { "epoch": 45.022222222222226, "grad_norm": 0.14358478784561157, "learning_rate": 1.796508419801871e-06, "loss": 0.00744950920343399, "step": 10130 }, { "epoch": 45.06666666666667, "grad_norm": 0.09707742184400558, "learning_rate": 1.7649161395956615e-06, "loss": 0.008669641613960267, "step": 10140 }, { "epoch": 45.111111111111114, "grad_norm": 0.13448195159435272, "learning_rate": 1.733595690034152e-06, "loss": 0.008796460181474685, "step": 10150 }, { "epoch": 45.15555555555556, "grad_norm": 0.1172659695148468, "learning_rate": 1.7025473726520736e-06, "loss": 0.00899576097726822, "step": 10160 }, { "epoch": 45.2, "grad_norm": 0.07522806525230408, "learning_rate": 1.6717714863641953e-06, "loss": 0.0095244862139225, "step": 10170 }, { "epoch": 45.24444444444445, "grad_norm": 0.324351966381073, "learning_rate": 1.6412683274625184e-06, "loss": 0.008086130768060685, "step": 10180 }, { "epoch": 45.28888888888889, "grad_norm": 0.11212663352489471, "learning_rate": 1.6110381896133641e-06, "loss": 0.008968541026115417, "step": 10190 }, { "epoch": 45.333333333333336, "grad_norm": 0.14548514783382416, "learning_rate": 1.5810813638545729e-06, "loss": 0.00902319848537445, "step": 10200 }, { "epoch": 45.37777777777778, "grad_norm": 0.1800372451543808, "learning_rate": 1.5513981385926934e-06, "loss": 0.00901309996843338, "step": 10210 }, { "epoch": 45.422222222222224, "grad_norm": 0.15941272675991058, "learning_rate": 1.521988799600228e-06, "loss": 0.00824701264500618, "step": 10220 }, { "epoch": 45.46666666666667, "grad_norm": 0.21419650316238403, "learning_rate": 1.492853630012845e-06, "loss": 0.009132985025644302, "step": 10230 }, { "epoch": 45.51111111111111, "grad_norm": 0.5608541965484619, "learning_rate": 1.4639929103266837e-06, "loss": 0.010330894589424133, "step": 10240 }, { "epoch": 45.55555555555556, "grad_norm": 0.10819529742002487, "learning_rate": 1.4354069183956408e-06, "loss": 0.009353923052549363, "step": 10250 }, { "epoch": 45.6, "grad_norm": 0.12354094535112381, "learning_rate": 1.4070959294286988e-06, "loss": 0.009289486706256867, "step": 10260 }, { "epoch": 45.644444444444446, "grad_norm": 0.2384805828332901, "learning_rate": 1.3790602159872646e-06, "loss": 0.01224862113595009, "step": 10270 }, { "epoch": 45.68888888888889, "grad_norm": 0.12412340193986893, "learning_rate": 1.3513000479825643e-06, "loss": 0.009660492837429046, "step": 10280 }, { "epoch": 45.733333333333334, "grad_norm": 0.1056385263800621, "learning_rate": 1.3238156926730372e-06, "loss": 0.01012292355298996, "step": 10290 }, { "epoch": 45.77777777777778, "grad_norm": 0.36509162187576294, "learning_rate": 1.296607414661759e-06, "loss": 0.00964486375451088, "step": 10300 }, { "epoch": 45.82222222222222, "grad_norm": 0.46307435631752014, "learning_rate": 1.2696754758938923e-06, "loss": 0.009910552948713302, "step": 10310 }, { "epoch": 45.86666666666667, "grad_norm": 0.2353232055902481, "learning_rate": 1.243020135654177e-06, "loss": 0.009340450167655945, "step": 10320 }, { "epoch": 45.91111111111111, "grad_norm": 0.2194313257932663, "learning_rate": 1.216641650564424e-06, "loss": 0.011595599353313446, "step": 10330 }, { "epoch": 45.955555555555556, "grad_norm": 0.15788255631923676, "learning_rate": 1.1905402745810456e-06, "loss": 0.0078891322016716, "step": 10340 }, { "epoch": 46.0, "grad_norm": 0.31992077827453613, "learning_rate": 1.1647162589926086e-06, "loss": 0.0076288096606731415, "step": 10350 }, { "epoch": 46.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9866115857817641, "eval_iou_background": 0.0, "eval_iou_crop": 0.9866115857817641, "eval_loss": 0.016716444864869118, "eval_mean_accuracy": 0.9866115857817641, "eval_mean_iou": 0.49330579289088206, "eval_overall_accuracy": 0.9866115857817641, "eval_runtime": 4.8983, "eval_samples_per_second": 64.921, "eval_steps_per_second": 8.166, "step": 10350 }, { "epoch": 46.044444444444444, "grad_norm": 0.09923288971185684, "learning_rate": 1.139169852417422e-06, "loss": 0.010118656605482102, "step": 10360 }, { "epoch": 46.08888888888889, "grad_norm": 0.06966205686330795, "learning_rate": 1.1139013008011467e-06, "loss": 0.009804841876029969, "step": 10370 }, { "epoch": 46.13333333333333, "grad_norm": 0.1781655251979828, "learning_rate": 1.0889108474144093e-06, "loss": 0.008346140384674072, "step": 10380 }, { "epoch": 46.17777777777778, "grad_norm": 0.08700993657112122, "learning_rate": 1.0641987328504755e-06, "loss": 0.009656400978565216, "step": 10390 }, { "epoch": 46.22222222222222, "grad_norm": 0.8780359029769897, "learning_rate": 1.0397651950229303e-06, "loss": 0.009275934845209121, "step": 10400 }, { "epoch": 46.266666666666666, "grad_norm": 0.1944754421710968, "learning_rate": 1.015610469163395e-06, "loss": 0.01210482120513916, "step": 10410 }, { "epoch": 46.31111111111111, "grad_norm": 0.14198417961597443, "learning_rate": 9.91734787819234e-07, "loss": 0.01035802736878395, "step": 10420 }, { "epoch": 46.355555555555554, "grad_norm": 0.32631927728652954, "learning_rate": 9.681383808513577e-07, "loss": 0.009440983831882476, "step": 10430 }, { "epoch": 46.4, "grad_norm": 0.12522903084754944, "learning_rate": 9.448214754319872e-07, "loss": 0.010252082347869873, "step": 10440 }, { "epoch": 46.44444444444444, "grad_norm": 0.13451677560806274, "learning_rate": 9.217842960424461e-07, "loss": 0.008742202818393708, "step": 10450 }, { "epoch": 46.48888888888889, "grad_norm": 0.15418018400669098, "learning_rate": 8.990270644710452e-07, "loss": 0.01160300001502037, "step": 10460 }, { "epoch": 46.53333333333333, "grad_norm": 0.12472720444202423, "learning_rate": 8.76549999810915e-07, "loss": 0.008368405699729919, "step": 10470 }, { "epoch": 46.577777777777776, "grad_norm": 0.8126120567321777, "learning_rate": 8.543533184579066e-07, "loss": 0.008904006332159042, "step": 10480 }, { "epoch": 46.62222222222222, "grad_norm": 0.11290091276168823, "learning_rate": 8.32437234108504e-07, "loss": 0.008595921099185944, "step": 10490 }, { "epoch": 46.666666666666664, "grad_norm": 0.1591264307498932, "learning_rate": 8.108019577577752e-07, "loss": 0.008525626361370086, "step": 10500 }, { "epoch": 46.71111111111111, "grad_norm": 0.2693161964416504, "learning_rate": 7.894476976973275e-07, "loss": 0.009313904494047166, "step": 10510 }, { "epoch": 46.75555555555555, "grad_norm": 0.13790342211723328, "learning_rate": 7.68374659513319e-07, "loss": 0.010252352058887481, "step": 10520 }, { "epoch": 46.8, "grad_norm": 0.09542079269886017, "learning_rate": 7.475830460844569e-07, "loss": 0.00888388156890869, "step": 10530 }, { "epoch": 46.84444444444444, "grad_norm": 0.22087839245796204, "learning_rate": 7.270730575800755e-07, "loss": 0.010214171558618545, "step": 10540 }, { "epoch": 46.888888888888886, "grad_norm": 0.3877478241920471, "learning_rate": 7.068448914581782e-07, "loss": 0.013484404981136322, "step": 10550 }, { "epoch": 46.93333333333333, "grad_norm": 0.3369724452495575, "learning_rate": 6.86898742463552e-07, "loss": 0.009100593626499176, "step": 10560 }, { "epoch": 46.977777777777774, "grad_norm": 0.13118089735507965, "learning_rate": 6.672348026258956e-07, "loss": 0.008454833179712296, "step": 10570 }, { "epoch": 47.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9872791376705267, "eval_iou_background": 0.0, "eval_iou_crop": 0.9872791376705267, "eval_loss": 0.016381528228521347, "eval_mean_accuracy": 0.9872791376705267, "eval_mean_iou": 0.49363956883526333, "eval_overall_accuracy": 0.9872791376705267, "eval_runtime": 4.9764, "eval_samples_per_second": 63.902, "eval_steps_per_second": 8.038, "step": 10575 }, { "epoch": 47.022222222222226, "grad_norm": 0.19740988314151764, "learning_rate": 6.47853261257958e-07, "loss": 0.00867820680141449, "step": 10580 }, { "epoch": 47.06666666666667, "grad_norm": 0.22520901262760162, "learning_rate": 6.287543049537359e-07, "loss": 0.01020711213350296, "step": 10590 }, { "epoch": 47.111111111111114, "grad_norm": 0.13782790303230286, "learning_rate": 6.099381175866392e-07, "loss": 0.00893133580684662, "step": 10600 }, { "epoch": 47.15555555555556, "grad_norm": 0.2860639989376068, "learning_rate": 5.914048803077754e-07, "loss": 0.008915774524211884, "step": 10610 }, { "epoch": 47.2, "grad_norm": 0.12642888724803925, "learning_rate": 5.731547715441576e-07, "loss": 0.009402428567409516, "step": 10620 }, { "epoch": 47.24444444444445, "grad_norm": 0.21845339238643646, "learning_rate": 5.551879669970128e-07, "loss": 0.009370029717683793, "step": 10630 }, { "epoch": 47.28888888888889, "grad_norm": 0.14646980166435242, "learning_rate": 5.375046396400829e-07, "loss": 0.009276290982961654, "step": 10640 }, { "epoch": 47.333333333333336, "grad_norm": 0.182325541973114, "learning_rate": 5.201049597179531e-07, "loss": 0.008968330919742584, "step": 10650 }, { "epoch": 47.37777777777778, "grad_norm": 0.6320025324821472, "learning_rate": 5.029890947444326e-07, "loss": 0.008211261034011841, "step": 10660 }, { "epoch": 47.422222222222224, "grad_norm": 0.44681885838508606, "learning_rate": 4.861572095009104e-07, "loss": 0.008349771052598954, "step": 10670 }, { "epoch": 47.46666666666667, "grad_norm": 0.12262383103370667, "learning_rate": 4.696094660347983e-07, "loss": 0.00871931090950966, "step": 10680 }, { "epoch": 47.51111111111111, "grad_norm": 0.16453778743743896, "learning_rate": 4.533460236579667e-07, "loss": 0.010838456451892853, "step": 10690 }, { "epoch": 47.55555555555556, "grad_norm": 0.213692769408226, "learning_rate": 4.373670389451856e-07, "loss": 0.009841958433389664, "step": 10700 }, { "epoch": 47.6, "grad_norm": 0.16784067451953888, "learning_rate": 4.2167266573264863e-07, "loss": 0.010410427302122115, "step": 10710 }, { "epoch": 47.644444444444446, "grad_norm": 0.23046283423900604, "learning_rate": 4.0626305511647476e-07, "loss": 0.009905047714710236, "step": 10720 }, { "epoch": 47.68888888888889, "grad_norm": 0.19466808438301086, "learning_rate": 3.9113835545125596e-07, "loss": 0.010098429769277573, "step": 10730 }, { "epoch": 47.733333333333334, "grad_norm": 0.10770225524902344, "learning_rate": 3.7629871234863165e-07, "loss": 0.008399660140275956, "step": 10740 }, { "epoch": 47.77777777777778, "grad_norm": 0.11249899119138718, "learning_rate": 3.617442686758898e-07, "loss": 0.008788956701755524, "step": 10750 }, { "epoch": 47.82222222222222, "grad_norm": 0.17780113220214844, "learning_rate": 3.4747516455457817e-07, "loss": 0.008843215554952622, "step": 10760 }, { "epoch": 47.86666666666667, "grad_norm": 0.20773084461688995, "learning_rate": 3.3349153735917847e-07, "loss": 0.008698216080665589, "step": 10770 }, { "epoch": 47.91111111111111, "grad_norm": 0.1742016077041626, "learning_rate": 3.1979352171575104e-07, "loss": 0.0082418791949749, "step": 10780 }, { "epoch": 47.955555555555556, "grad_norm": 0.34049326181411743, "learning_rate": 3.063812495006757e-07, "loss": 0.009095329046249389, "step": 10790 }, { "epoch": 48.0, "grad_norm": 0.1760391891002655, "learning_rate": 2.932548498393528e-07, "loss": 0.009018873423337936, "step": 10800 }, { "epoch": 48.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9870146481726878, "eval_iou_background": 0.0, "eval_iou_crop": 0.9870146481726878, "eval_loss": 0.016443083062767982, "eval_mean_accuracy": 0.9870146481726878, "eval_mean_iou": 0.4935073240863439, "eval_overall_accuracy": 0.9870146481726878, "eval_runtime": 4.896, "eval_samples_per_second": 64.951, "eval_steps_per_second": 8.17, "step": 10800 }, { "epoch": 48.044444444444444, "grad_norm": 0.1465587615966797, "learning_rate": 2.804144491049743e-07, "loss": 0.00973241925239563, "step": 10810 }, { "epoch": 48.08888888888889, "grad_norm": 0.9095686078071594, "learning_rate": 2.6786017091730455e-07, "loss": 0.009360039234161377, "step": 10820 }, { "epoch": 48.13333333333333, "grad_norm": 0.13800445199012756, "learning_rate": 2.5559213614149145e-07, "loss": 0.007514572888612747, "step": 10830 }, { "epoch": 48.17777777777778, "grad_norm": 0.14943262934684753, "learning_rate": 2.4361046288689737e-07, "loss": 0.00918971598148346, "step": 10840 }, { "epoch": 48.22222222222222, "grad_norm": 0.08516086637973785, "learning_rate": 2.3191526650596984e-07, "loss": 0.008401509374380112, "step": 10850 }, { "epoch": 48.266666666666666, "grad_norm": 0.1355172097682953, "learning_rate": 2.2050665959312266e-07, "loss": 0.00966365858912468, "step": 10860 }, { "epoch": 48.31111111111111, "grad_norm": 0.08837186545133591, "learning_rate": 2.093847519836567e-07, "loss": 0.009702187776565552, "step": 10870 }, { "epoch": 48.355555555555554, "grad_norm": 0.3552602231502533, "learning_rate": 1.9854965075270737e-07, "loss": 0.009125810861587525, "step": 10880 }, { "epoch": 48.4, "grad_norm": 0.1358860582113266, "learning_rate": 1.8800146021420218e-07, "loss": 0.008950908482074738, "step": 10890 }, { "epoch": 48.44444444444444, "grad_norm": 0.11094136536121368, "learning_rate": 1.7774028191986146e-07, "loss": 0.008135451376438141, "step": 10900 }, { "epoch": 48.48888888888889, "grad_norm": 0.140141561627388, "learning_rate": 1.6776621465823262e-07, "loss": 0.010136932134628296, "step": 10910 }, { "epoch": 48.53333333333333, "grad_norm": 0.1148114949464798, "learning_rate": 1.5807935445371736e-07, "loss": 0.009019139409065246, "step": 10920 }, { "epoch": 48.577777777777776, "grad_norm": 0.30004918575286865, "learning_rate": 1.4867979456565927e-07, "loss": 0.01003163531422615, "step": 10930 }, { "epoch": 48.62222222222222, "grad_norm": 0.13797500729560852, "learning_rate": 1.3956762548745117e-07, "loss": 0.009001925587654114, "step": 10940 }, { "epoch": 48.666666666666664, "grad_norm": 0.2995701730251312, "learning_rate": 1.3074293494564904e-07, "loss": 0.01100575104355812, "step": 10950 }, { "epoch": 48.71111111111111, "grad_norm": 0.09669066220521927, "learning_rate": 1.2220580789914614e-07, "loss": 0.010369318723678588, "step": 10960 }, { "epoch": 48.75555555555555, "grad_norm": 0.1455744057893753, "learning_rate": 1.1395632653833365e-07, "loss": 0.010063523054122924, "step": 10970 }, { "epoch": 48.8, "grad_norm": 0.10979176312685013, "learning_rate": 1.0599457028433124e-07, "loss": 0.009410152584314347, "step": 10980 }, { "epoch": 48.84444444444444, "grad_norm": 0.16523246467113495, "learning_rate": 9.83206157882044e-08, "loss": 0.008906940370798111, "step": 10990 }, { "epoch": 48.888888888888886, "grad_norm": 0.32376399636268616, "learning_rate": 9.0934536930235e-08, "loss": 0.010732753574848175, "step": 11000 }, { "epoch": 48.93333333333333, "grad_norm": 0.13908307254314423, "learning_rate": 8.383640481921528e-08, "loss": 0.007664051651954651, "step": 11010 }, { "epoch": 48.977777777777774, "grad_norm": 0.11137203872203827, "learning_rate": 7.702628779175158e-08, "loss": 0.008112792670726777, "step": 11020 }, { "epoch": 49.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9869244384579902, "eval_iou_background": 0.0, "eval_iou_crop": 0.9869244384579902, "eval_loss": 0.016392750665545464, "eval_mean_accuracy": 0.9869244384579902, "eval_mean_iou": 0.4934622192289951, "eval_overall_accuracy": 0.9869244384579902, "eval_runtime": 4.8664, "eval_samples_per_second": 65.346, "eval_steps_per_second": 8.22, "step": 11025 }, { "epoch": 49.022222222222226, "grad_norm": 0.09480363875627518, "learning_rate": 7.0504251411605e-08, "loss": 0.008777632564306258, "step": 11030 }, { "epoch": 49.06666666666667, "grad_norm": 0.47448936104774475, "learning_rate": 6.427035846908513e-08, "loss": 0.009276943653821946, "step": 11040 }, { "epoch": 49.111111111111114, "grad_norm": 0.22424659132957458, "learning_rate": 5.832466898040734e-08, "loss": 0.009609420597553254, "step": 11050 }, { "epoch": 49.15555555555556, "grad_norm": 0.3686755299568176, "learning_rate": 5.266724018714975e-08, "loss": 0.01045949086546898, "step": 11060 }, { "epoch": 49.2, "grad_norm": 0.16207093000411987, "learning_rate": 4.7298126555680445e-08, "loss": 0.009542020410299301, "step": 11070 }, { "epoch": 49.24444444444445, "grad_norm": 0.5662288069725037, "learning_rate": 4.221737977664453e-08, "loss": 0.00915139690041542, "step": 11080 }, { "epoch": 49.28888888888889, "grad_norm": 0.08856440335512161, "learning_rate": 3.7425048764454515e-08, "loss": 0.009465672820806504, "step": 11090 }, { "epoch": 49.333333333333336, "grad_norm": 0.1319837123155594, "learning_rate": 3.2921179656834056e-08, "loss": 0.008519663661718368, "step": 11100 }, { "epoch": 49.37777777777778, "grad_norm": 0.14947937428951263, "learning_rate": 2.8705815814364934e-08, "loss": 0.008964132517576218, "step": 11110 }, { "epoch": 49.422222222222224, "grad_norm": 0.22050626575946808, "learning_rate": 2.4778997820067427e-08, "loss": 0.008268860727548599, "step": 11120 }, { "epoch": 49.46666666666667, "grad_norm": 1.0557682514190674, "learning_rate": 2.1140763479020608e-08, "loss": 0.01003037840127945, "step": 11130 }, { "epoch": 49.51111111111111, "grad_norm": 0.10059035569429398, "learning_rate": 1.7791147817985965e-08, "loss": 0.008557784557342529, "step": 11140 }, { "epoch": 49.55555555555556, "grad_norm": 0.09918154776096344, "learning_rate": 1.4730183085074345e-08, "loss": 0.009109391272068024, "step": 11150 }, { "epoch": 49.6, "grad_norm": 0.13343732059001923, "learning_rate": 1.1957898749442864e-08, "loss": 0.008451895415782928, "step": 11160 }, { "epoch": 49.644444444444446, "grad_norm": 0.10850129276514053, "learning_rate": 9.474321501001804e-09, "loss": 0.008390432596206665, "step": 11170 }, { "epoch": 49.68888888888889, "grad_norm": 0.1959400326013565, "learning_rate": 7.279475250154821e-09, "loss": 0.009005936235189438, "step": 11180 }, { "epoch": 49.733333333333334, "grad_norm": 0.13622809946537018, "learning_rate": 5.3733811275857855e-09, "loss": 0.008410344272851944, "step": 11190 }, { "epoch": 49.77777777777778, "grad_norm": 0.16483131051063538, "learning_rate": 3.756057484035624e-09, "loss": 0.009318667650222778, "step": 11200 }, { "epoch": 49.82222222222222, "grad_norm": 0.2793676555156708, "learning_rate": 2.4275198901357875e-09, "loss": 0.007837989926338195, "step": 11210 }, { "epoch": 49.86666666666667, "grad_norm": 0.13267335295677185, "learning_rate": 1.387781136261701e-09, "loss": 0.008356810361146928, "step": 11220 }, { "epoch": 49.91111111111111, "grad_norm": 0.18488381803035736, "learning_rate": 6.368512324028686e-10, "loss": 0.01021805927157402, "step": 11230 }, { "epoch": 49.955555555555556, "grad_norm": 0.39978551864624023, "learning_rate": 1.747374080629527e-10, "loss": 0.008328566700220108, "step": 11240 }, { "epoch": 50.0, "grad_norm": 0.5280951857566833, "learning_rate": 1.4441121998221007e-12, "loss": 0.009911158680915832, "step": 11250 }, { "epoch": 50.0, "eval_accuracy_background": NaN, "eval_accuracy_crop": 0.9869486200471838, "eval_iou_background": 0.0, "eval_iou_crop": 0.9869486200471838, "eval_loss": 0.016488609835505486, "eval_mean_accuracy": 0.9869486200471838, "eval_mean_iou": 0.4934743100235919, "eval_overall_accuracy": 0.9869486200471838, "eval_runtime": 4.3646, "eval_samples_per_second": 72.858, "eval_steps_per_second": 9.165, "step": 11250 }, { "epoch": 50.0, "step": 11250, "total_flos": 1.5748868036100096e+18, "train_loss": 0.026947463490565617, "train_runtime": 1401.3412, "train_samples_per_second": 64.117, "train_steps_per_second": 8.028 } ], "logging_steps": 10, "max_steps": 11250, "num_input_tokens_seen": 0, "num_train_epochs": 50, "save_steps": 500, "stateful_callbacks": { "TrainerControl": { "args": { "should_epoch_stop": false, "should_evaluate": false, "should_log": false, "should_save": true, "should_training_stop": true }, "attributes": {} } }, "total_flos": 1.5748868036100096e+18, "train_batch_size": 8, "trial_name": null, "trial_params": null }