autocrop-bilder / trainer_state.json
Rolv-Arild's picture
End of training
3e34390 verified
Invalid JSON: Unexpected token 'N', ..."kground": NaN, "... is not valid JSON
{
"best_global_step": 3696,
"best_metric": 0.04337907209992409,
"best_model_checkpoint": "./models/autocrop-bilder/checkpoint-3696",
"epoch": 50.0,
"eval_steps": 500,
"global_step": 5600,
"is_hyper_param_search": false,
"is_local_process_zero": true,
"is_world_process_zero": true,
"log_history": [
{
"epoch": 0.08928571428571429,
"grad_norm": 3.270373582839966,
"learning_rate": 9.642857142857142e-07,
"loss": 0.6841774940490722,
"step": 10
},
{
"epoch": 0.17857142857142858,
"grad_norm": 3.1556570529937744,
"learning_rate": 2.0357142857142854e-06,
"loss": 0.6719733715057373,
"step": 20
},
{
"epoch": 0.26785714285714285,
"grad_norm": 3.7284576892852783,
"learning_rate": 3.1071428571428574e-06,
"loss": 0.6568694114685059,
"step": 30
},
{
"epoch": 0.35714285714285715,
"grad_norm": 3.3195960521698,
"learning_rate": 4.178571428571429e-06,
"loss": 0.6387552738189697,
"step": 40
},
{
"epoch": 0.44642857142857145,
"grad_norm": 4.566788673400879,
"learning_rate": 5.25e-06,
"loss": 0.6023201465606689,
"step": 50
},
{
"epoch": 0.5357142857142857,
"grad_norm": 3.4431145191192627,
"learning_rate": 6.321428571428571e-06,
"loss": 0.5654563903808594,
"step": 60
},
{
"epoch": 0.625,
"grad_norm": 4.218961715698242,
"learning_rate": 7.392857142857144e-06,
"loss": 0.5167044162750244,
"step": 70
},
{
"epoch": 0.7142857142857143,
"grad_norm": 4.118458271026611,
"learning_rate": 8.464285714285714e-06,
"loss": 0.4801907539367676,
"step": 80
},
{
"epoch": 0.8035714285714286,
"grad_norm": 3.0397183895111084,
"learning_rate": 9.535714285714285e-06,
"loss": 0.4150387763977051,
"step": 90
},
{
"epoch": 0.8928571428571429,
"grad_norm": 6.0887651443481445,
"learning_rate": 1.0607142857142858e-05,
"loss": 0.36455488204956055,
"step": 100
},
{
"epoch": 0.9821428571428571,
"grad_norm": 5.4721360206604,
"learning_rate": 1.1678571428571428e-05,
"loss": 0.32769825458526614,
"step": 110
},
{
"epoch": 1.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.8947501785580725,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.8947501785580725,
"eval_loss": 0.3303993046283722,
"eval_mean_accuracy": 0.8947501785580725,
"eval_mean_iou": 0.44737508927903624,
"eval_overall_accuracy": 0.8947501785580725,
"eval_runtime": 3.069,
"eval_samples_per_second": 51.483,
"eval_steps_per_second": 6.517,
"step": 112
},
{
"epoch": 1.0714285714285714,
"grad_norm": 5.009084701538086,
"learning_rate": 1.275e-05,
"loss": 0.29956760406494143,
"step": 120
},
{
"epoch": 1.1607142857142858,
"grad_norm": 4.929739952087402,
"learning_rate": 1.3821428571428571e-05,
"loss": 0.2776294231414795,
"step": 130
},
{
"epoch": 1.25,
"grad_norm": 2.2742035388946533,
"learning_rate": 1.4892857142857143e-05,
"loss": 0.25046911239624026,
"step": 140
},
{
"epoch": 1.3392857142857144,
"grad_norm": 2.3090789318084717,
"learning_rate": 1.5964285714285715e-05,
"loss": 0.262372350692749,
"step": 150
},
{
"epoch": 1.4285714285714286,
"grad_norm": 1.8420805931091309,
"learning_rate": 1.7035714285714285e-05,
"loss": 0.2225811719894409,
"step": 160
},
{
"epoch": 1.5178571428571428,
"grad_norm": 2.4408090114593506,
"learning_rate": 1.8107142857142858e-05,
"loss": 0.22525691986083984,
"step": 170
},
{
"epoch": 1.6071428571428572,
"grad_norm": 1.8533332347869873,
"learning_rate": 1.9178571428571428e-05,
"loss": 0.22061917781829835,
"step": 180
},
{
"epoch": 1.6964285714285714,
"grad_norm": 2.3673174381256104,
"learning_rate": 2.025e-05,
"loss": 0.1996947169303894,
"step": 190
},
{
"epoch": 1.7857142857142856,
"grad_norm": 2.2984402179718018,
"learning_rate": 2.1321428571428574e-05,
"loss": 0.19175281524658203,
"step": 200
},
{
"epoch": 1.875,
"grad_norm": 5.28623628616333,
"learning_rate": 2.2392857142857144e-05,
"loss": 0.19550073146820068,
"step": 210
},
{
"epoch": 1.9642857142857144,
"grad_norm": 1.4293358325958252,
"learning_rate": 2.3464285714285714e-05,
"loss": 0.18344916105270387,
"step": 220
},
{
"epoch": 2.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9449638670840851,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9449638670840851,
"eval_loss": 0.17327815294265747,
"eval_mean_accuracy": 0.9449638670840851,
"eval_mean_iou": 0.47248193354204254,
"eval_overall_accuracy": 0.9449638670840851,
"eval_runtime": 3.0436,
"eval_samples_per_second": 51.912,
"eval_steps_per_second": 6.571,
"step": 224
},
{
"epoch": 2.0535714285714284,
"grad_norm": 1.0139216184616089,
"learning_rate": 2.4535714285714287e-05,
"loss": 0.18806995153427125,
"step": 230
},
{
"epoch": 2.142857142857143,
"grad_norm": 1.6520318984985352,
"learning_rate": 2.5607142857142857e-05,
"loss": 0.16265342235565186,
"step": 240
},
{
"epoch": 2.232142857142857,
"grad_norm": 3.5133588314056396,
"learning_rate": 2.6678571428571427e-05,
"loss": 0.1572718858718872,
"step": 250
},
{
"epoch": 2.3214285714285716,
"grad_norm": 1.2140995264053345,
"learning_rate": 2.7750000000000004e-05,
"loss": 0.15668554306030275,
"step": 260
},
{
"epoch": 2.4107142857142856,
"grad_norm": 2.7298743724823,
"learning_rate": 2.8821428571428574e-05,
"loss": 0.14472755193710327,
"step": 270
},
{
"epoch": 2.5,
"grad_norm": 0.6985360980033875,
"learning_rate": 2.9892857142857143e-05,
"loss": 0.14720585346221923,
"step": 280
},
{
"epoch": 2.5892857142857144,
"grad_norm": 0.8003563284873962,
"learning_rate": 3.096428571428572e-05,
"loss": 0.14043016433715821,
"step": 290
},
{
"epoch": 2.678571428571429,
"grad_norm": 1.7715791463851929,
"learning_rate": 3.203571428571428e-05,
"loss": 0.129607629776001,
"step": 300
},
{
"epoch": 2.767857142857143,
"grad_norm": 0.7600429058074951,
"learning_rate": 3.310714285714286e-05,
"loss": 0.1326908826828003,
"step": 310
},
{
"epoch": 2.857142857142857,
"grad_norm": 1.411843180656433,
"learning_rate": 3.417857142857143e-05,
"loss": 0.1340739369392395,
"step": 320
},
{
"epoch": 2.946428571428571,
"grad_norm": 1.2389501333236694,
"learning_rate": 3.525e-05,
"loss": 0.1279363751411438,
"step": 330
},
{
"epoch": 3.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9813412891527392,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9813412891527392,
"eval_loss": 0.1177222803235054,
"eval_mean_accuracy": 0.9813412891527392,
"eval_mean_iou": 0.4906706445763696,
"eval_overall_accuracy": 0.9813412891527392,
"eval_runtime": 3.0843,
"eval_samples_per_second": 51.227,
"eval_steps_per_second": 6.484,
"step": 336
},
{
"epoch": 3.0357142857142856,
"grad_norm": 4.182790756225586,
"learning_rate": 3.632142857142857e-05,
"loss": 0.11685030460357666,
"step": 340
},
{
"epoch": 3.125,
"grad_norm": 1.452004313468933,
"learning_rate": 3.739285714285714e-05,
"loss": 0.1146626591682434,
"step": 350
},
{
"epoch": 3.2142857142857144,
"grad_norm": 0.737139105796814,
"learning_rate": 3.8464285714285716e-05,
"loss": 0.1056035041809082,
"step": 360
},
{
"epoch": 3.3035714285714284,
"grad_norm": 0.5500335693359375,
"learning_rate": 3.953571428571429e-05,
"loss": 0.12782689332962036,
"step": 370
},
{
"epoch": 3.392857142857143,
"grad_norm": 0.8951995968818665,
"learning_rate": 4.060714285714286e-05,
"loss": 0.10672543048858643,
"step": 380
},
{
"epoch": 3.482142857142857,
"grad_norm": 1.5596611499786377,
"learning_rate": 4.167857142857143e-05,
"loss": 0.10761728286743164,
"step": 390
},
{
"epoch": 3.571428571428571,
"grad_norm": 1.7340526580810547,
"learning_rate": 4.275e-05,
"loss": 0.12569416761398317,
"step": 400
},
{
"epoch": 3.6607142857142856,
"grad_norm": 0.8778754472732544,
"learning_rate": 4.382142857142857e-05,
"loss": 0.0940355658531189,
"step": 410
},
{
"epoch": 3.75,
"grad_norm": 2.6315760612487793,
"learning_rate": 4.489285714285714e-05,
"loss": 0.10828475952148438,
"step": 420
},
{
"epoch": 3.8392857142857144,
"grad_norm": 0.5823694467544556,
"learning_rate": 4.5964285714285715e-05,
"loss": 0.09212335348129272,
"step": 430
},
{
"epoch": 3.928571428571429,
"grad_norm": 1.48265540599823,
"learning_rate": 4.703571428571429e-05,
"loss": 0.08791649341583252,
"step": 440
},
{
"epoch": 4.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9857982300059793,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9857982300059793,
"eval_loss": 0.08414151519536972,
"eval_mean_accuracy": 0.9857982300059793,
"eval_mean_iou": 0.49289911500298966,
"eval_overall_accuracy": 0.9857982300059793,
"eval_runtime": 2.8965,
"eval_samples_per_second": 54.549,
"eval_steps_per_second": 6.905,
"step": 448
},
{
"epoch": 4.017857142857143,
"grad_norm": 7.7965288162231445,
"learning_rate": 4.810714285714286e-05,
"loss": 0.09109385013580322,
"step": 450
},
{
"epoch": 4.107142857142857,
"grad_norm": 0.60382080078125,
"learning_rate": 4.917857142857143e-05,
"loss": 0.08951844573020935,
"step": 460
},
{
"epoch": 4.196428571428571,
"grad_norm": 28.733182907104492,
"learning_rate": 5.025e-05,
"loss": 0.08306971788406373,
"step": 470
},
{
"epoch": 4.285714285714286,
"grad_norm": 3.4891135692596436,
"learning_rate": 5.132142857142857e-05,
"loss": 0.08310299515724182,
"step": 480
},
{
"epoch": 4.375,
"grad_norm": 0.517422080039978,
"learning_rate": 5.239285714285714e-05,
"loss": 0.08568280935287476,
"step": 490
},
{
"epoch": 4.464285714285714,
"grad_norm": 0.7893465161323547,
"learning_rate": 5.346428571428572e-05,
"loss": 0.09003521800041199,
"step": 500
},
{
"epoch": 4.553571428571429,
"grad_norm": 4.526234149932861,
"learning_rate": 5.453571428571429e-05,
"loss": 0.09423142075538635,
"step": 510
},
{
"epoch": 4.642857142857143,
"grad_norm": 0.7713887691497803,
"learning_rate": 5.560714285714286e-05,
"loss": 0.07021326422691346,
"step": 520
},
{
"epoch": 4.732142857142857,
"grad_norm": 0.3963504135608673,
"learning_rate": 5.667857142857143e-05,
"loss": 0.08367589712142945,
"step": 530
},
{
"epoch": 4.821428571428571,
"grad_norm": 1.0999394655227661,
"learning_rate": 5.775e-05,
"loss": 0.08009102344512939,
"step": 540
},
{
"epoch": 4.910714285714286,
"grad_norm": 0.7939938306808472,
"learning_rate": 5.882142857142857e-05,
"loss": 0.09382905960083007,
"step": 550
},
{
"epoch": 5.0,
"grad_norm": 2.131338357925415,
"learning_rate": 5.989285714285715e-05,
"loss": 0.0795985221862793,
"step": 560
},
{
"epoch": 5.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9741688295995273,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9741688295995273,
"eval_loss": 0.08404607325792313,
"eval_mean_accuracy": 0.9741688295995273,
"eval_mean_iou": 0.48708441479976367,
"eval_overall_accuracy": 0.9741688295995273,
"eval_runtime": 3.1074,
"eval_samples_per_second": 50.846,
"eval_steps_per_second": 6.436,
"step": 560
},
{
"epoch": 5.089285714285714,
"grad_norm": 0.9680992364883423,
"learning_rate": 5.999952792194596e-05,
"loss": 0.07798992395401001,
"step": 570
},
{
"epoch": 5.178571428571429,
"grad_norm": 0.8994519710540771,
"learning_rate": 5.999789606626562e-05,
"loss": 0.06749414801597595,
"step": 580
},
{
"epoch": 5.267857142857143,
"grad_norm": 0.986232340335846,
"learning_rate": 5.99950986682241e-05,
"loss": 0.0746770441532135,
"step": 590
},
{
"epoch": 5.357142857142857,
"grad_norm": 0.6977314352989197,
"learning_rate": 5.999113583651189e-05,
"loss": 0.07597554922103882,
"step": 600
},
{
"epoch": 5.446428571428571,
"grad_norm": 0.9763554930686951,
"learning_rate": 5.9986007725101386e-05,
"loss": 0.07884644269943238,
"step": 610
},
{
"epoch": 5.535714285714286,
"grad_norm": 0.4131947457790375,
"learning_rate": 5.997971453324095e-05,
"loss": 0.07100933790206909,
"step": 620
},
{
"epoch": 5.625,
"grad_norm": 4.289861679077148,
"learning_rate": 5.99722565054471e-05,
"loss": 0.07310172915458679,
"step": 630
},
{
"epoch": 5.714285714285714,
"grad_norm": 1.0220744609832764,
"learning_rate": 5.996363393149509e-05,
"loss": 0.07721139788627625,
"step": 640
},
{
"epoch": 5.803571428571429,
"grad_norm": 0.3010362684726715,
"learning_rate": 5.995384714640757e-05,
"loss": 0.059419333934783936,
"step": 650
},
{
"epoch": 5.892857142857143,
"grad_norm": 3.465324640274048,
"learning_rate": 5.994289653044164e-05,
"loss": 0.07689496874809265,
"step": 660
},
{
"epoch": 5.982142857142857,
"grad_norm": 0.6869708895683289,
"learning_rate": 5.993078250907403e-05,
"loss": 0.06406612396240234,
"step": 670
},
{
"epoch": 6.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9859818189036227,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9859818189036227,
"eval_loss": 0.07088413834571838,
"eval_mean_accuracy": 0.9859818189036227,
"eval_mean_iou": 0.49299090945181134,
"eval_overall_accuracy": 0.9859818189036227,
"eval_runtime": 3.1076,
"eval_samples_per_second": 50.843,
"eval_steps_per_second": 6.436,
"step": 672
},
{
"epoch": 6.071428571428571,
"grad_norm": 1.3824396133422852,
"learning_rate": 5.9917505552984576e-05,
"loss": 0.06562145948410034,
"step": 680
},
{
"epoch": 6.160714285714286,
"grad_norm": 0.8862974047660828,
"learning_rate": 5.990306617803795e-05,
"loss": 0.07552834749221801,
"step": 690
},
{
"epoch": 6.25,
"grad_norm": 1.8890525102615356,
"learning_rate": 5.9887464945263616e-05,
"loss": 0.06953117251396179,
"step": 700
},
{
"epoch": 6.339285714285714,
"grad_norm": 1.3064137697219849,
"learning_rate": 5.9870702460833996e-05,
"loss": 0.05875499844551087,
"step": 710
},
{
"epoch": 6.428571428571429,
"grad_norm": 5.315647125244141,
"learning_rate": 5.985277937604096e-05,
"loss": 0.06155696511268616,
"step": 720
},
{
"epoch": 6.517857142857143,
"grad_norm": 0.5886704921722412,
"learning_rate": 5.98336963872705e-05,
"loss": 0.06854590773582458,
"step": 730
},
{
"epoch": 6.607142857142857,
"grad_norm": 0.36860746145248413,
"learning_rate": 5.981345423597567e-05,
"loss": 0.05901351571083069,
"step": 740
},
{
"epoch": 6.696428571428571,
"grad_norm": 0.5009424090385437,
"learning_rate": 5.979205370864779e-05,
"loss": 0.055243945121765135,
"step": 750
},
{
"epoch": 6.785714285714286,
"grad_norm": 0.5251625180244446,
"learning_rate": 5.976949563678588e-05,
"loss": 0.07381758689880372,
"step": 760
},
{
"epoch": 6.875,
"grad_norm": 0.5076754093170166,
"learning_rate": 5.9745780896864355e-05,
"loss": 0.05926129817962646,
"step": 770
},
{
"epoch": 6.964285714285714,
"grad_norm": 0.5567944645881653,
"learning_rate": 5.972091041029896e-05,
"loss": 0.05233304500579834,
"step": 780
},
{
"epoch": 7.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9894160453154839,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9894160453154839,
"eval_loss": 0.06326749175786972,
"eval_mean_accuracy": 0.9894160453154839,
"eval_mean_iou": 0.49470802265774194,
"eval_overall_accuracy": 0.9894160453154839,
"eval_runtime": 3.1323,
"eval_samples_per_second": 50.443,
"eval_steps_per_second": 6.385,
"step": 784
},
{
"epoch": 7.053571428571429,
"grad_norm": 0.860552191734314,
"learning_rate": 5.969488514341099e-05,
"loss": 0.0780815064907074,
"step": 790
},
{
"epoch": 7.142857142857143,
"grad_norm": 1.0587300062179565,
"learning_rate": 5.966770610738974e-05,
"loss": 0.056760483980178834,
"step": 800
},
{
"epoch": 7.232142857142857,
"grad_norm": 0.7505276799201965,
"learning_rate": 5.963937435825317e-05,
"loss": 0.059036099910736085,
"step": 810
},
{
"epoch": 7.321428571428571,
"grad_norm": 1.0296212434768677,
"learning_rate": 5.960989099680696e-05,
"loss": 0.05659686326980591,
"step": 820
},
{
"epoch": 7.410714285714286,
"grad_norm": 0.46932515501976013,
"learning_rate": 5.957925716860167e-05,
"loss": 0.05175484418869018,
"step": 830
},
{
"epoch": 7.5,
"grad_norm": 0.718617856502533,
"learning_rate": 5.954747406388824e-05,
"loss": 0.055910295248031615,
"step": 840
},
{
"epoch": 7.589285714285714,
"grad_norm": 0.7998201251029968,
"learning_rate": 5.951454291757181e-05,
"loss": 0.06455008387565613,
"step": 850
},
{
"epoch": 7.678571428571429,
"grad_norm": 0.37768468260765076,
"learning_rate": 5.948046500916361e-05,
"loss": 0.05296936631202698,
"step": 860
},
{
"epoch": 7.767857142857143,
"grad_norm": 1.0487741231918335,
"learning_rate": 5.944524166273137e-05,
"loss": 0.056065672636032106,
"step": 870
},
{
"epoch": 7.857142857142857,
"grad_norm": 0.7201439142227173,
"learning_rate": 5.940887424684782e-05,
"loss": 0.0546242892742157,
"step": 880
},
{
"epoch": 7.946428571428571,
"grad_norm": 0.7990844249725342,
"learning_rate": 5.9371364174537516e-05,
"loss": 0.057676571607589724,
"step": 890
},
{
"epoch": 8.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9807289934553552,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9807289934553552,
"eval_loss": 0.06055007502436638,
"eval_mean_accuracy": 0.9807289934553552,
"eval_mean_iou": 0.4903644967276776,
"eval_overall_accuracy": 0.9807289934553552,
"eval_runtime": 2.976,
"eval_samples_per_second": 53.092,
"eval_steps_per_second": 6.72,
"step": 896
},
{
"epoch": 8.035714285714286,
"grad_norm": 0.49310821294784546,
"learning_rate": 5.933271290322194e-05,
"loss": 0.051748812198638916,
"step": 900
},
{
"epoch": 8.125,
"grad_norm": 0.9782583117485046,
"learning_rate": 5.929292193466289e-05,
"loss": 0.052764898538589476,
"step": 910
},
{
"epoch": 8.214285714285714,
"grad_norm": 0.4996137022972107,
"learning_rate": 5.925199281490409e-05,
"loss": 0.04635877311229706,
"step": 920
},
{
"epoch": 8.303571428571429,
"grad_norm": 0.7325310111045837,
"learning_rate": 5.920992713421118e-05,
"loss": 0.0518154501914978,
"step": 930
},
{
"epoch": 8.392857142857142,
"grad_norm": 0.6661192178726196,
"learning_rate": 5.916672652700986e-05,
"loss": 0.05230782628059387,
"step": 940
},
{
"epoch": 8.482142857142858,
"grad_norm": 0.6793703436851501,
"learning_rate": 5.9122392671822454e-05,
"loss": 0.061950719356536864,
"step": 950
},
{
"epoch": 8.571428571428571,
"grad_norm": 0.5158465504646301,
"learning_rate": 5.907692729120263e-05,
"loss": 0.052070868015289304,
"step": 960
},
{
"epoch": 8.660714285714286,
"grad_norm": 1.4337759017944336,
"learning_rate": 5.903033215166852e-05,
"loss": 0.05228162407875061,
"step": 970
},
{
"epoch": 8.75,
"grad_norm": 1.1488945484161377,
"learning_rate": 5.898260906363405e-05,
"loss": 0.05639091730117798,
"step": 980
},
{
"epoch": 8.839285714285714,
"grad_norm": 3.3319473266601562,
"learning_rate": 5.8933759881338625e-05,
"loss": 0.06053876280784607,
"step": 990
},
{
"epoch": 8.928571428571429,
"grad_norm": 0.47250106930732727,
"learning_rate": 5.888378650277505e-05,
"loss": 0.05278565287590027,
"step": 1000
},
{
"epoch": 9.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9903641264589433,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9903641264589433,
"eval_loss": 0.05963556095957756,
"eval_mean_accuracy": 0.9903641264589433,
"eval_mean_iou": 0.49518206322947167,
"eval_overall_accuracy": 0.9903641264589433,
"eval_runtime": 3.041,
"eval_samples_per_second": 51.957,
"eval_steps_per_second": 6.577,
"step": 1008
},
{
"epoch": 9.017857142857142,
"grad_norm": 0.806399405002594,
"learning_rate": 5.8832690869615824e-05,
"loss": 0.05292539000511169,
"step": 1010
},
{
"epoch": 9.107142857142858,
"grad_norm": 3.02130126953125,
"learning_rate": 5.878047496713768e-05,
"loss": 0.04778439402580261,
"step": 1020
},
{
"epoch": 9.196428571428571,
"grad_norm": 2.86051082611084,
"learning_rate": 5.8727140824144435e-05,
"loss": 0.05619266629219055,
"step": 1030
},
{
"epoch": 9.285714285714286,
"grad_norm": 0.7149938344955444,
"learning_rate": 5.8672690512888185e-05,
"loss": 0.047925320267677304,
"step": 1040
},
{
"epoch": 9.375,
"grad_norm": 0.7016188502311707,
"learning_rate": 5.8617126148988775e-05,
"loss": 0.046968936920166016,
"step": 1050
},
{
"epoch": 9.464285714285714,
"grad_norm": 0.4471415579319,
"learning_rate": 5.856044989135162e-05,
"loss": 0.0487202912569046,
"step": 1060
},
{
"epoch": 9.553571428571429,
"grad_norm": 0.589865505695343,
"learning_rate": 5.850266394208378e-05,
"loss": 0.05116734504699707,
"step": 1070
},
{
"epoch": 9.642857142857142,
"grad_norm": 0.477340966463089,
"learning_rate": 5.844377054640846e-05,
"loss": 0.058660686016082764,
"step": 1080
},
{
"epoch": 9.732142857142858,
"grad_norm": 0.38238945603370667,
"learning_rate": 5.83837719925777e-05,
"loss": 0.046440258622169495,
"step": 1090
},
{
"epoch": 9.821428571428571,
"grad_norm": 1.1571301221847534,
"learning_rate": 5.8322670611783533e-05,
"loss": 0.05035667419433594,
"step": 1100
},
{
"epoch": 9.910714285714286,
"grad_norm": 0.7370873689651489,
"learning_rate": 5.826046877806737e-05,
"loss": 0.05174518227577209,
"step": 1110
},
{
"epoch": 10.0,
"grad_norm": 0.7022402882575989,
"learning_rate": 5.819716890822778e-05,
"loss": 0.04487786293029785,
"step": 1120
},
{
"epoch": 10.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9849750743137399,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9849750743137399,
"eval_loss": 0.056510768830776215,
"eval_mean_accuracy": 0.9849750743137399,
"eval_mean_iou": 0.49248753715686994,
"eval_overall_accuracy": 0.9849750743137399,
"eval_runtime": 2.8666,
"eval_samples_per_second": 55.118,
"eval_steps_per_second": 6.977,
"step": 1120
},
{
"epoch": 10.089285714285714,
"grad_norm": 1.81419837474823,
"learning_rate": 5.813277346172658e-05,
"loss": 0.054458075761795045,
"step": 1130
},
{
"epoch": 10.178571428571429,
"grad_norm": 0.6672200560569763,
"learning_rate": 5.806728494059325e-05,
"loss": 0.04975816011428833,
"step": 1140
},
{
"epoch": 10.267857142857142,
"grad_norm": 0.6396266222000122,
"learning_rate": 5.8000705889327764e-05,
"loss": 0.05723657608032227,
"step": 1150
},
{
"epoch": 10.357142857142858,
"grad_norm": 1.1310316324234009,
"learning_rate": 5.79330388948017e-05,
"loss": 0.04499860405921936,
"step": 1160
},
{
"epoch": 10.446428571428571,
"grad_norm": 0.5163964629173279,
"learning_rate": 5.7864286586157726e-05,
"loss": 0.04683603048324585,
"step": 1170
},
{
"epoch": 10.535714285714286,
"grad_norm": 1.1878842115402222,
"learning_rate": 5.779445163470746e-05,
"loss": 0.053842353820800784,
"step": 1180
},
{
"epoch": 10.625,
"grad_norm": 0.9575569033622742,
"learning_rate": 5.772353675382766e-05,
"loss": 0.050610685348510744,
"step": 1190
},
{
"epoch": 10.714285714285714,
"grad_norm": 0.46333664655685425,
"learning_rate": 5.765154469885482e-05,
"loss": 0.04571016728878021,
"step": 1200
},
{
"epoch": 10.803571428571429,
"grad_norm": 0.5651761293411255,
"learning_rate": 5.75784782669781e-05,
"loss": 0.05275800824165344,
"step": 1210
},
{
"epoch": 10.892857142857142,
"grad_norm": 1.1750099658966064,
"learning_rate": 5.7504340297130654e-05,
"loss": 0.04366275668144226,
"step": 1220
},
{
"epoch": 10.982142857142858,
"grad_norm": 1.4780343770980835,
"learning_rate": 5.742913366987931e-05,
"loss": 0.04656153619289398,
"step": 1230
},
{
"epoch": 11.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9852730923489182,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9852730923489182,
"eval_loss": 0.05328800156712532,
"eval_mean_accuracy": 0.9852730923489182,
"eval_mean_iou": 0.4926365461744591,
"eval_overall_accuracy": 0.9852730923489182,
"eval_runtime": 3.133,
"eval_samples_per_second": 50.431,
"eval_steps_per_second": 6.384,
"step": 1232
},
{
"epoch": 11.071428571428571,
"grad_norm": 0.8470721244812012,
"learning_rate": 5.735286130731266e-05,
"loss": 0.049132627248764035,
"step": 1240
},
{
"epoch": 11.160714285714286,
"grad_norm": 0.8392991423606873,
"learning_rate": 5.7275526172927524e-05,
"loss": 0.045812690258026124,
"step": 1250
},
{
"epoch": 11.25,
"grad_norm": 0.7748396396636963,
"learning_rate": 5.71971312715138e-05,
"loss": 0.05167960524559021,
"step": 1260
},
{
"epoch": 11.339285714285714,
"grad_norm": 1.7050870656967163,
"learning_rate": 5.711767964903773e-05,
"loss": 0.05110126733779907,
"step": 1270
},
{
"epoch": 11.428571428571429,
"grad_norm": 0.4576941430568695,
"learning_rate": 5.7037174392523523e-05,
"loss": 0.04657388925552368,
"step": 1280
},
{
"epoch": 11.517857142857142,
"grad_norm": 7.09236478805542,
"learning_rate": 5.695561862993344e-05,
"loss": 0.055950915813446044,
"step": 1290
},
{
"epoch": 11.607142857142858,
"grad_norm": 0.43980512022972107,
"learning_rate": 5.687301553004625e-05,
"loss": 0.04865770637989044,
"step": 1300
},
{
"epoch": 11.696428571428571,
"grad_norm": 0.4581732153892517,
"learning_rate": 5.6789368302334114e-05,
"loss": 0.04953811764717102,
"step": 1310
},
{
"epoch": 11.785714285714286,
"grad_norm": 0.4522385001182556,
"learning_rate": 5.670468019683786e-05,
"loss": 0.04517539143562317,
"step": 1320
},
{
"epoch": 11.875,
"grad_norm": 5.039539813995361,
"learning_rate": 5.661895450404073e-05,
"loss": 0.04825035333633423,
"step": 1330
},
{
"epoch": 11.964285714285714,
"grad_norm": 0.7777697443962097,
"learning_rate": 5.653219455474054e-05,
"loss": 0.04639602601528168,
"step": 1340
},
{
"epoch": 12.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9873568681936357,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9873568681936357,
"eval_loss": 0.05003076419234276,
"eval_mean_accuracy": 0.9873568681936357,
"eval_mean_iou": 0.49367843409681783,
"eval_overall_accuracy": 0.9873568681936357,
"eval_runtime": 3.1124,
"eval_samples_per_second": 50.764,
"eval_steps_per_second": 6.426,
"step": 1344
},
{
"epoch": 12.053571428571429,
"grad_norm": 0.48987045884132385,
"learning_rate": 5.6444403719920244e-05,
"loss": 0.0484184205532074,
"step": 1350
},
{
"epoch": 12.142857142857142,
"grad_norm": 0.774320662021637,
"learning_rate": 5.6355585410616946e-05,
"loss": 0.04041492640972137,
"step": 1360
},
{
"epoch": 12.232142857142858,
"grad_norm": 1.0305246114730835,
"learning_rate": 5.62657430777894e-05,
"loss": 0.04853481948375702,
"step": 1370
},
{
"epoch": 12.321428571428571,
"grad_norm": 1.1221197843551636,
"learning_rate": 5.617488021218392e-05,
"loss": 0.04230141043663025,
"step": 1380
},
{
"epoch": 12.410714285714286,
"grad_norm": 0.3958747088909149,
"learning_rate": 5.608300034419871e-05,
"loss": 0.04070273339748383,
"step": 1390
},
{
"epoch": 12.5,
"grad_norm": 0.6378204822540283,
"learning_rate": 5.599010704374675e-05,
"loss": 0.040793830156326295,
"step": 1400
},
{
"epoch": 12.589285714285714,
"grad_norm": 0.2917404770851135,
"learning_rate": 5.589620392011705e-05,
"loss": 0.04370662868022919,
"step": 1410
},
{
"epoch": 12.678571428571429,
"grad_norm": 0.3751641511917114,
"learning_rate": 5.580129462183444e-05,
"loss": 0.04144810438156128,
"step": 1420
},
{
"epoch": 12.767857142857142,
"grad_norm": 0.8122061491012573,
"learning_rate": 5.570538283651778e-05,
"loss": 0.043512603640556334,
"step": 1430
},
{
"epoch": 12.857142857142858,
"grad_norm": 0.7271958589553833,
"learning_rate": 5.560847229073673e-05,
"loss": 0.04332651495933533,
"step": 1440
},
{
"epoch": 12.946428571428571,
"grad_norm": 0.5666247010231018,
"learning_rate": 5.551056674986689e-05,
"loss": 0.04556152820587158,
"step": 1450
},
{
"epoch": 13.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9913747025252939,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9913747025252939,
"eval_loss": 0.050282228738069534,
"eval_mean_accuracy": 0.9913747025252939,
"eval_mean_iou": 0.49568735126264696,
"eval_overall_accuracy": 0.9913747025252939,
"eval_runtime": 3.1533,
"eval_samples_per_second": 50.106,
"eval_steps_per_second": 6.343,
"step": 1456
},
{
"epoch": 13.035714285714286,
"grad_norm": 1.259560227394104,
"learning_rate": 5.541167001794355e-05,
"loss": 0.044156748056411746,
"step": 1460
},
{
"epoch": 13.125,
"grad_norm": 0.8817604184150696,
"learning_rate": 5.5311785937513874e-05,
"loss": 0.05123854279518127,
"step": 1470
},
{
"epoch": 13.214285714285714,
"grad_norm": 0.5233781337738037,
"learning_rate": 5.52109183894876e-05,
"loss": 0.04295460879802704,
"step": 1480
},
{
"epoch": 13.303571428571429,
"grad_norm": 0.4079657793045044,
"learning_rate": 5.5109071292986255e-05,
"loss": 0.0446503072977066,
"step": 1490
},
{
"epoch": 13.392857142857142,
"grad_norm": 0.3609340190887451,
"learning_rate": 5.5006248605190865e-05,
"loss": 0.04136324226856232,
"step": 1500
},
{
"epoch": 13.482142857142858,
"grad_norm": 0.6312282681465149,
"learning_rate": 5.4902454321188225e-05,
"loss": 0.04388892650604248,
"step": 1510
},
{
"epoch": 13.571428571428571,
"grad_norm": 0.9294518232345581,
"learning_rate": 5.479769247381566e-05,
"loss": 0.04297168850898743,
"step": 1520
},
{
"epoch": 13.660714285714286,
"grad_norm": 0.7301751375198364,
"learning_rate": 5.4691967133504326e-05,
"loss": 0.041097778081893924,
"step": 1530
},
{
"epoch": 13.75,
"grad_norm": 0.588044285774231,
"learning_rate": 5.458528240812107e-05,
"loss": 0.036137142777442934,
"step": 1540
},
{
"epoch": 13.839285714285714,
"grad_norm": 0.49514254927635193,
"learning_rate": 5.447764244280884e-05,
"loss": 0.04436479806900025,
"step": 1550
},
{
"epoch": 13.928571428571429,
"grad_norm": 0.8887337446212769,
"learning_rate": 5.436905141982555e-05,
"loss": 0.039365378022193906,
"step": 1560
},
{
"epoch": 14.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9875765824408328,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9875765824408328,
"eval_loss": 0.04912761226296425,
"eval_mean_accuracy": 0.9875765824408328,
"eval_mean_iou": 0.4937882912204164,
"eval_overall_accuracy": 0.9875765824408328,
"eval_runtime": 3.1041,
"eval_samples_per_second": 50.9,
"eval_steps_per_second": 6.443,
"step": 1568
},
{
"epoch": 14.017857142857142,
"grad_norm": 0.6825718879699707,
"learning_rate": 5.425951355838171e-05,
"loss": 0.04728492200374603,
"step": 1570
},
{
"epoch": 14.107142857142858,
"grad_norm": 0.6529393196105957,
"learning_rate": 5.4149033114476364e-05,
"loss": 0.04193180501461029,
"step": 1580
},
{
"epoch": 14.196428571428571,
"grad_norm": 1.142166256904602,
"learning_rate": 5.403761438073182e-05,
"loss": 0.05213127732276916,
"step": 1590
},
{
"epoch": 14.285714285714286,
"grad_norm": 0.2536723017692566,
"learning_rate": 5.3925261686226815e-05,
"loss": 0.040300771594047546,
"step": 1600
},
{
"epoch": 14.375,
"grad_norm": 0.5792322754859924,
"learning_rate": 5.381197939632832e-05,
"loss": 0.04092682600021362,
"step": 1610
},
{
"epoch": 14.464285714285714,
"grad_norm": 0.41399243474006653,
"learning_rate": 5.369777191252192e-05,
"loss": 0.037803399562835696,
"step": 1620
},
{
"epoch": 14.553571428571429,
"grad_norm": 0.633029043674469,
"learning_rate": 5.358264367224087e-05,
"loss": 0.03901064395904541,
"step": 1630
},
{
"epoch": 14.642857142857142,
"grad_norm": 0.44275617599487305,
"learning_rate": 5.3466599148693555e-05,
"loss": 0.04518336057662964,
"step": 1640
},
{
"epoch": 14.732142857142858,
"grad_norm": 0.5145997405052185,
"learning_rate": 5.334964285068978e-05,
"loss": 0.04450685381889343,
"step": 1650
},
{
"epoch": 14.821428571428571,
"grad_norm": 0.7258153557777405,
"learning_rate": 5.323177932246557e-05,
"loss": 0.03933931291103363,
"step": 1660
},
{
"epoch": 14.910714285714286,
"grad_norm": 1.4203119277954102,
"learning_rate": 5.3113013143506585e-05,
"loss": 0.043070229887962344,
"step": 1670
},
{
"epoch": 15.0,
"grad_norm": 0.701845109462738,
"learning_rate": 5.2993348928370205e-05,
"loss": 0.04021662771701813,
"step": 1680
},
{
"epoch": 15.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9920743816439693,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9920743816439693,
"eval_loss": 0.05143989622592926,
"eval_mean_accuracy": 0.9920743816439693,
"eval_mean_iou": 0.49603719082198466,
"eval_overall_accuracy": 0.9920743816439693,
"eval_runtime": 2.9833,
"eval_samples_per_second": 52.962,
"eval_steps_per_second": 6.704,
"step": 1680
},
{
"epoch": 15.089285714285714,
"grad_norm": 1.7581926584243774,
"learning_rate": 5.287279132650623e-05,
"loss": 0.04302600026130676,
"step": 1690
},
{
"epoch": 15.178571428571429,
"grad_norm": 0.6842783689498901,
"learning_rate": 5.2751345022076234e-05,
"loss": 0.045688962936401366,
"step": 1700
},
{
"epoch": 15.267857142857142,
"grad_norm": 5.589493274688721,
"learning_rate": 5.2629014733771556e-05,
"loss": 0.040783023834228514,
"step": 1710
},
{
"epoch": 15.357142857142858,
"grad_norm": 0.9302808046340942,
"learning_rate": 5.2505805214629965e-05,
"loss": 0.04296206533908844,
"step": 1720
},
{
"epoch": 15.446428571428571,
"grad_norm": 0.5288134813308716,
"learning_rate": 5.238172125185099e-05,
"loss": 0.03719891309738159,
"step": 1730
},
{
"epoch": 15.535714285714286,
"grad_norm": 0.38548046350479126,
"learning_rate": 5.225676766660991e-05,
"loss": 0.0392879843711853,
"step": 1740
},
{
"epoch": 15.625,
"grad_norm": 0.40487754344940186,
"learning_rate": 5.213094931387043e-05,
"loss": 0.042755302786827085,
"step": 1750
},
{
"epoch": 15.714285714285714,
"grad_norm": 0.6676396727561951,
"learning_rate": 5.2004271082196064e-05,
"loss": 0.04512317776679993,
"step": 1760
},
{
"epoch": 15.803571428571429,
"grad_norm": 0.6934312582015991,
"learning_rate": 5.187673789356017e-05,
"loss": 0.04026437401771545,
"step": 1770
},
{
"epoch": 15.892857142857142,
"grad_norm": 1.3655362129211426,
"learning_rate": 5.1748354703154706e-05,
"loss": 0.045592480897903444,
"step": 1780
},
{
"epoch": 15.982142857142858,
"grad_norm": 2.6899712085723877,
"learning_rate": 5.1619126499197756e-05,
"loss": 0.04209406077861786,
"step": 1790
},
{
"epoch": 16.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9909822820615134,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9909822820615134,
"eval_loss": 0.048930149525403976,
"eval_mean_accuracy": 0.9909822820615134,
"eval_mean_iou": 0.4954911410307567,
"eval_overall_accuracy": 0.9909822820615134,
"eval_runtime": 3.199,
"eval_samples_per_second": 49.39,
"eval_steps_per_second": 6.252,
"step": 1792
},
{
"epoch": 16.071428571428573,
"grad_norm": 3.0663135051727295,
"learning_rate": 5.148905830273964e-05,
"loss": 0.044573307037353516,
"step": 1800
},
{
"epoch": 16.160714285714285,
"grad_norm": 0.4636627435684204,
"learning_rate": 5.1358155167467856e-05,
"loss": 0.03752498030662536,
"step": 1810
},
{
"epoch": 16.25,
"grad_norm": 0.47981229424476624,
"learning_rate": 5.1226422179510766e-05,
"loss": 0.03836653232574463,
"step": 1820
},
{
"epoch": 16.339285714285715,
"grad_norm": 0.5740169286727905,
"learning_rate": 5.1093864457239915e-05,
"loss": 0.04181548357009888,
"step": 1830
},
{
"epoch": 16.428571428571427,
"grad_norm": 0.5714458227157593,
"learning_rate": 5.09604871510712e-05,
"loss": 0.04018245935440064,
"step": 1840
},
{
"epoch": 16.517857142857142,
"grad_norm": 0.8310384750366211,
"learning_rate": 5.082629544326473e-05,
"loss": 0.038782325387001035,
"step": 1850
},
{
"epoch": 16.607142857142858,
"grad_norm": 1.200546383857727,
"learning_rate": 5.06912945477235e-05,
"loss": 0.044720190763473514,
"step": 1860
},
{
"epoch": 16.696428571428573,
"grad_norm": 0.4382542371749878,
"learning_rate": 5.055548970979077e-05,
"loss": 0.041479668021202086,
"step": 1870
},
{
"epoch": 16.785714285714285,
"grad_norm": 0.41013088822364807,
"learning_rate": 5.041888620604634e-05,
"loss": 0.035242030024528505,
"step": 1880
},
{
"epoch": 16.875,
"grad_norm": 2.843520164489746,
"learning_rate": 5.0281489344101436e-05,
"loss": 0.0387931764125824,
"step": 1890
},
{
"epoch": 16.964285714285715,
"grad_norm": 0.6174224615097046,
"learning_rate": 5.014330446239254e-05,
"loss": 0.04532441198825836,
"step": 1900
},
{
"epoch": 17.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9893786642719616,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9893786642719616,
"eval_loss": 0.046091217547655106,
"eval_mean_accuracy": 0.9893786642719616,
"eval_mean_iou": 0.4946893321359808,
"eval_overall_accuracy": 0.9893786642719616,
"eval_runtime": 3.0874,
"eval_samples_per_second": 51.176,
"eval_steps_per_second": 6.478,
"step": 1904
},
{
"epoch": 17.053571428571427,
"grad_norm": 0.4036897122859955,
"learning_rate": 5.0004336929973956e-05,
"loss": 0.03707077205181122,
"step": 1910
},
{
"epoch": 17.142857142857142,
"grad_norm": 0.5742233991622925,
"learning_rate": 4.9864592146309236e-05,
"loss": 0.03820139169692993,
"step": 1920
},
{
"epoch": 17.232142857142858,
"grad_norm": 0.7360264658927917,
"learning_rate": 4.972407554106134e-05,
"loss": 0.0436991274356842,
"step": 1930
},
{
"epoch": 17.321428571428573,
"grad_norm": 0.5104629397392273,
"learning_rate": 4.9582792573881675e-05,
"loss": 0.033945232629776,
"step": 1940
},
{
"epoch": 17.410714285714285,
"grad_norm": 1.295369267463684,
"learning_rate": 4.9440748734197995e-05,
"loss": 0.04245510697364807,
"step": 1950
},
{
"epoch": 17.5,
"grad_norm": 0.3614010214805603,
"learning_rate": 4.929794954100111e-05,
"loss": 0.039192336797714236,
"step": 1960
},
{
"epoch": 17.589285714285715,
"grad_norm": 0.3201848268508911,
"learning_rate": 4.9154400542630405e-05,
"loss": 0.0368089109659195,
"step": 1970
},
{
"epoch": 17.678571428571427,
"grad_norm": 0.3553301692008972,
"learning_rate": 4.901010731655833e-05,
"loss": 0.04043708443641662,
"step": 1980
},
{
"epoch": 17.767857142857142,
"grad_norm": 0.4751736521720886,
"learning_rate": 4.886507546917364e-05,
"loss": 0.033682060241699216,
"step": 1990
},
{
"epoch": 17.857142857142858,
"grad_norm": 0.19512499868869781,
"learning_rate": 4.871931063556361e-05,
"loss": 0.03278649747371674,
"step": 2000
},
{
"epoch": 17.946428571428573,
"grad_norm": 0.5196254849433899,
"learning_rate": 4.857281847929503e-05,
"loss": 0.04488261938095093,
"step": 2010
},
{
"epoch": 18.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9857635535340814,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9857635535340814,
"eval_loss": 0.04853605851531029,
"eval_mean_accuracy": 0.9857635535340814,
"eval_mean_iou": 0.4928817767670407,
"eval_overall_accuracy": 0.9857635535340814,
"eval_runtime": 3.1354,
"eval_samples_per_second": 50.393,
"eval_steps_per_second": 6.379,
"step": 2016
},
{
"epoch": 18.035714285714285,
"grad_norm": 0.30406859517097473,
"learning_rate": 4.842560469219418e-05,
"loss": 0.03401051759719849,
"step": 2020
},
{
"epoch": 18.125,
"grad_norm": 0.5000826716423035,
"learning_rate": 4.827767499412573e-05,
"loss": 0.034174400568008426,
"step": 2030
},
{
"epoch": 18.214285714285715,
"grad_norm": 0.4069335460662842,
"learning_rate": 4.8129035132770424e-05,
"loss": 0.03663274347782135,
"step": 2040
},
{
"epoch": 18.303571428571427,
"grad_norm": 0.28684502840042114,
"learning_rate": 4.797969088340177e-05,
"loss": 0.0345532089471817,
"step": 2050
},
{
"epoch": 18.392857142857142,
"grad_norm": 0.4621877074241638,
"learning_rate": 4.782964804866168e-05,
"loss": 0.034203451871871945,
"step": 2060
},
{
"epoch": 18.482142857142858,
"grad_norm": 0.274502694606781,
"learning_rate": 4.7678912458335025e-05,
"loss": 0.033478057384490965,
"step": 2070
},
{
"epoch": 18.571428571428573,
"grad_norm": 2.0716018676757812,
"learning_rate": 4.7527489969123035e-05,
"loss": 0.03838878571987152,
"step": 2080
},
{
"epoch": 18.660714285714285,
"grad_norm": 0.5928405523300171,
"learning_rate": 4.737538646441587e-05,
"loss": 0.04016884863376617,
"step": 2090
},
{
"epoch": 18.75,
"grad_norm": 0.3344573974609375,
"learning_rate": 4.722260785406391e-05,
"loss": 0.034842535853385925,
"step": 2100
},
{
"epoch": 18.839285714285715,
"grad_norm": 0.31821951270103455,
"learning_rate": 4.706916007414821e-05,
"loss": 0.03510299324989319,
"step": 2110
},
{
"epoch": 18.928571428571427,
"grad_norm": 1.2290804386138916,
"learning_rate": 4.691504908674982e-05,
"loss": 0.034851866960525515,
"step": 2120
},
{
"epoch": 19.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9924935580484623,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9924935580484623,
"eval_loss": 0.04678338021039963,
"eval_mean_accuracy": 0.9924935580484623,
"eval_mean_iou": 0.49624677902423114,
"eval_overall_accuracy": 0.9924935580484623,
"eval_runtime": 3.1887,
"eval_samples_per_second": 49.55,
"eval_steps_per_second": 6.272,
"step": 2128
},
{
"epoch": 19.017857142857142,
"grad_norm": 0.8945170640945435,
"learning_rate": 4.6760280879718145e-05,
"loss": 0.03648801743984222,
"step": 2130
},
{
"epoch": 19.107142857142858,
"grad_norm": 0.7037824988365173,
"learning_rate": 4.660486146643829e-05,
"loss": 0.036881595849990845,
"step": 2140
},
{
"epoch": 19.196428571428573,
"grad_norm": 0.6412319540977478,
"learning_rate": 4.644879688559742e-05,
"loss": 0.03466321229934692,
"step": 2150
},
{
"epoch": 19.285714285714285,
"grad_norm": 0.5471871495246887,
"learning_rate": 4.629209320095013e-05,
"loss": 0.031432312726974485,
"step": 2160
},
{
"epoch": 19.375,
"grad_norm": 0.4182012379169464,
"learning_rate": 4.613475650108284e-05,
"loss": 0.03879809677600861,
"step": 2170
},
{
"epoch": 19.464285714285715,
"grad_norm": 0.7332907319068909,
"learning_rate": 4.5976792899177225e-05,
"loss": 0.03283085525035858,
"step": 2180
},
{
"epoch": 19.553571428571427,
"grad_norm": 0.7331687808036804,
"learning_rate": 4.58182085327727e-05,
"loss": 0.03797485828399658,
"step": 2190
},
{
"epoch": 19.642857142857142,
"grad_norm": 1.1568264961242676,
"learning_rate": 4.5659009563527966e-05,
"loss": 0.040525627136230466,
"step": 2200
},
{
"epoch": 19.732142857142858,
"grad_norm": 1.1485722064971924,
"learning_rate": 4.549920217698156e-05,
"loss": 0.03370160162448883,
"step": 2210
},
{
"epoch": 19.821428571428573,
"grad_norm": 1.1431678533554077,
"learning_rate": 4.533879258231156e-05,
"loss": 0.03664481043815613,
"step": 2220
},
{
"epoch": 19.910714285714285,
"grad_norm": 0.6225838661193848,
"learning_rate": 4.5177787012094334e-05,
"loss": 0.035591110587120056,
"step": 2230
},
{
"epoch": 20.0,
"grad_norm": 1.3148231506347656,
"learning_rate": 4.5016191722062336e-05,
"loss": 0.03507326543331146,
"step": 2240
},
{
"epoch": 20.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9924366332552259,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9924366332552259,
"eval_loss": 0.04701998829841614,
"eval_mean_accuracy": 0.9924366332552259,
"eval_mean_iou": 0.49621831662761295,
"eval_overall_accuracy": 0.9924366332552259,
"eval_runtime": 3.013,
"eval_samples_per_second": 52.44,
"eval_steps_per_second": 6.638,
"step": 2240
},
{
"epoch": 20.089285714285715,
"grad_norm": 0.6287689208984375,
"learning_rate": 4.48540129908611e-05,
"loss": 0.03255096971988678,
"step": 2250
},
{
"epoch": 20.178571428571427,
"grad_norm": 0.7971874475479126,
"learning_rate": 4.469125711980525e-05,
"loss": 0.0385926216840744,
"step": 2260
},
{
"epoch": 20.267857142857142,
"grad_norm": 0.4999794065952301,
"learning_rate": 4.452793043263369e-05,
"loss": 0.0330315887928009,
"step": 2270
},
{
"epoch": 20.357142857142858,
"grad_norm": 1.0392268896102905,
"learning_rate": 4.4364039275263886e-05,
"loss": 0.03553598821163177,
"step": 2280
},
{
"epoch": 20.446428571428573,
"grad_norm": 0.748245120048523,
"learning_rate": 4.4199590015545306e-05,
"loss": 0.03817463517189026,
"step": 2290
},
{
"epoch": 20.535714285714285,
"grad_norm": 3.1416192054748535,
"learning_rate": 4.4034589043012e-05,
"loss": 0.03555123507976532,
"step": 2300
},
{
"epoch": 20.625,
"grad_norm": 1.6041500568389893,
"learning_rate": 4.386904276863435e-05,
"loss": 0.04191716015338898,
"step": 2310
},
{
"epoch": 20.714285714285715,
"grad_norm": 0.3397618234157562,
"learning_rate": 4.370295762456997e-05,
"loss": 0.03920762240886688,
"step": 2320
},
{
"epoch": 20.803571428571427,
"grad_norm": 0.47967231273651123,
"learning_rate": 4.3536340063913794e-05,
"loss": 0.03428833186626434,
"step": 2330
},
{
"epoch": 20.892857142857142,
"grad_norm": 0.504014253616333,
"learning_rate": 4.336919656044731e-05,
"loss": 0.03250396251678467,
"step": 2340
},
{
"epoch": 20.982142857142858,
"grad_norm": 0.3230708837509155,
"learning_rate": 4.320153360838713e-05,
"loss": 0.032353276014328004,
"step": 2350
},
{
"epoch": 21.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9897066901732577,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9897066901732577,
"eval_loss": 0.04517462104558945,
"eval_mean_accuracy": 0.9897066901732577,
"eval_mean_iou": 0.49485334508662887,
"eval_overall_accuracy": 0.9897066901732577,
"eval_runtime": 3.124,
"eval_samples_per_second": 50.576,
"eval_steps_per_second": 6.402,
"step": 2352
},
{
"epoch": 21.071428571428573,
"grad_norm": 1.0374712944030762,
"learning_rate": 4.3033357722132514e-05,
"loss": 0.03456159830093384,
"step": 2360
},
{
"epoch": 21.160714285714285,
"grad_norm": 0.5611382126808167,
"learning_rate": 4.28646754360124e-05,
"loss": 0.03961513936519623,
"step": 2370
},
{
"epoch": 21.25,
"grad_norm": 1.1374410390853882,
"learning_rate": 4.26954933040314e-05,
"loss": 0.03642260730266571,
"step": 2380
},
{
"epoch": 21.339285714285715,
"grad_norm": 1.065623164176941,
"learning_rate": 4.252581789961527e-05,
"loss": 0.0321618914604187,
"step": 2390
},
{
"epoch": 21.428571428571427,
"grad_norm": 0.344766229391098,
"learning_rate": 4.235565581535539e-05,
"loss": 0.03374730050563812,
"step": 2400
},
{
"epoch": 21.517857142857142,
"grad_norm": 0.6901429295539856,
"learning_rate": 4.218501366275267e-05,
"loss": 0.037382254004478456,
"step": 2410
},
{
"epoch": 21.607142857142858,
"grad_norm": 0.6230500340461731,
"learning_rate": 4.2013898071960676e-05,
"loss": 0.03607453107833862,
"step": 2420
},
{
"epoch": 21.696428571428573,
"grad_norm": 0.33789336681365967,
"learning_rate": 4.184231569152802e-05,
"loss": 0.03156797885894776,
"step": 2430
},
{
"epoch": 21.785714285714285,
"grad_norm": 0.6263316869735718,
"learning_rate": 4.167027318813999e-05,
"loss": 0.02936406135559082,
"step": 2440
},
{
"epoch": 21.875,
"grad_norm": 0.3787066638469696,
"learning_rate": 4.149777724635957e-05,
"loss": 0.03306094706058502,
"step": 2450
},
{
"epoch": 21.964285714285715,
"grad_norm": 1.0717002153396606,
"learning_rate": 4.132483456836771e-05,
"loss": 0.03666483759880066,
"step": 2460
},
{
"epoch": 22.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9897153834391932,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9897153834391932,
"eval_loss": 0.04611481726169586,
"eval_mean_accuracy": 0.9897153834391932,
"eval_mean_iou": 0.4948576917195966,
"eval_overall_accuracy": 0.9897153834391932,
"eval_runtime": 3.1604,
"eval_samples_per_second": 49.994,
"eval_steps_per_second": 6.328,
"step": 2464
},
{
"epoch": 22.053571428571427,
"grad_norm": 0.26346009969711304,
"learning_rate": 4.1151451873702884e-05,
"loss": 0.036768025159835814,
"step": 2470
},
{
"epoch": 22.142857142857142,
"grad_norm": 0.3978211581707001,
"learning_rate": 4.0977635899000066e-05,
"loss": 0.037500059604644774,
"step": 2480
},
{
"epoch": 22.232142857142858,
"grad_norm": 0.6863635778427124,
"learning_rate": 4.080339339772893e-05,
"loss": 0.03716857135295868,
"step": 2490
},
{
"epoch": 22.321428571428573,
"grad_norm": 0.8167490363121033,
"learning_rate": 4.0628731139931474e-05,
"loss": 0.031910479068756104,
"step": 2500
},
{
"epoch": 22.410714285714285,
"grad_norm": 0.6655036807060242,
"learning_rate": 4.045365591195899e-05,
"loss": 0.03525538444519043,
"step": 2510
},
{
"epoch": 22.5,
"grad_norm": 0.6085823774337769,
"learning_rate": 4.027817451620835e-05,
"loss": 0.03340524137020111,
"step": 2520
},
{
"epoch": 22.589285714285715,
"grad_norm": 0.8327236771583557,
"learning_rate": 4.0102293770857734e-05,
"loss": 0.03699168860912323,
"step": 2530
},
{
"epoch": 22.678571428571427,
"grad_norm": 0.6012502312660217,
"learning_rate": 3.99260205096017e-05,
"loss": 0.0321900874376297,
"step": 2540
},
{
"epoch": 22.767857142857142,
"grad_norm": 0.9624703526496887,
"learning_rate": 3.974936158138568e-05,
"loss": 0.032026082277297974,
"step": 2550
},
{
"epoch": 22.857142857142858,
"grad_norm": 0.4007648229598999,
"learning_rate": 3.957232385013986e-05,
"loss": 0.03329742252826691,
"step": 2560
},
{
"epoch": 22.946428571428573,
"grad_norm": 0.48390379548072815,
"learning_rate": 3.9394914194512486e-05,
"loss": 0.03496589064598084,
"step": 2570
},
{
"epoch": 23.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9903151865914551,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9903151865914551,
"eval_loss": 0.04514744132757187,
"eval_mean_accuracy": 0.9903151865914551,
"eval_mean_iou": 0.49515759329572756,
"eval_overall_accuracy": 0.9903151865914551,
"eval_runtime": 3.1477,
"eval_samples_per_second": 50.196,
"eval_steps_per_second": 6.354,
"step": 2576
},
{
"epoch": 23.035714285714285,
"grad_norm": 0.40391215682029724,
"learning_rate": 3.9217139507602614e-05,
"loss": 0.03333309590816498,
"step": 2580
},
{
"epoch": 23.125,
"grad_norm": 0.3738088309764862,
"learning_rate": 3.9039006696692276e-05,
"loss": 0.03630165755748749,
"step": 2590
},
{
"epoch": 23.214285714285715,
"grad_norm": 0.8210233449935913,
"learning_rate": 3.886052268297809e-05,
"loss": 0.033744516968727115,
"step": 2600
},
{
"epoch": 23.303571428571427,
"grad_norm": 0.362053245306015,
"learning_rate": 3.868169440130236e-05,
"loss": 0.03140257894992828,
"step": 2610
},
{
"epoch": 23.392857142857142,
"grad_norm": 0.5485966205596924,
"learning_rate": 3.850252879988364e-05,
"loss": 0.0314506471157074,
"step": 2620
},
{
"epoch": 23.482142857142858,
"grad_norm": 0.5351651906967163,
"learning_rate": 3.8323032840046734e-05,
"loss": 0.030066084861755372,
"step": 2630
},
{
"epoch": 23.571428571428573,
"grad_norm": 0.49327391386032104,
"learning_rate": 3.8143213495952224e-05,
"loss": 0.031948789954185486,
"step": 2640
},
{
"epoch": 23.660714285714285,
"grad_norm": 0.554222822189331,
"learning_rate": 3.7963077754325563e-05,
"loss": 0.0361316055059433,
"step": 2650
},
{
"epoch": 23.75,
"grad_norm": 0.4138738811016083,
"learning_rate": 3.7782632614185495e-05,
"loss": 0.03466886579990387,
"step": 2660
},
{
"epoch": 23.839285714285715,
"grad_norm": 0.34648677706718445,
"learning_rate": 3.760188508657221e-05,
"loss": 0.028808239102363586,
"step": 2670
},
{
"epoch": 23.928571428571427,
"grad_norm": 1.9430650472640991,
"learning_rate": 3.742084219427489e-05,
"loss": 0.03538582324981689,
"step": 2680
},
{
"epoch": 24.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9913732214503568,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9913732214503568,
"eval_loss": 0.04687141999602318,
"eval_mean_accuracy": 0.9913732214503568,
"eval_mean_iou": 0.4956866107251784,
"eval_overall_accuracy": 0.9913732214503568,
"eval_runtime": 2.9475,
"eval_samples_per_second": 53.605,
"eval_steps_per_second": 6.785,
"step": 2688
},
{
"epoch": 24.017857142857142,
"grad_norm": 0.3821694850921631,
"learning_rate": 3.7239510971558875e-05,
"loss": 0.029324138164520265,
"step": 2690
},
{
"epoch": 24.107142857142858,
"grad_norm": 0.4301556348800659,
"learning_rate": 3.705789846389231e-05,
"loss": 0.03461351692676544,
"step": 2700
},
{
"epoch": 24.196428571428573,
"grad_norm": 0.4085342586040497,
"learning_rate": 3.687601172767243e-05,
"loss": 0.033036014437675475,
"step": 2710
},
{
"epoch": 24.285714285714285,
"grad_norm": 0.4198435842990875,
"learning_rate": 3.6693857829951396e-05,
"loss": 0.028960457444190978,
"step": 2720
},
{
"epoch": 24.375,
"grad_norm": 0.3448272943496704,
"learning_rate": 3.6511443848161685e-05,
"loss": 0.033338889479637146,
"step": 2730
},
{
"epoch": 24.464285714285715,
"grad_norm": 0.700137734413147,
"learning_rate": 3.632877686984114e-05,
"loss": 0.03215117454528808,
"step": 2740
},
{
"epoch": 24.553571428571427,
"grad_norm": 0.5219758152961731,
"learning_rate": 3.6145863992357524e-05,
"loss": 0.030151611566543578,
"step": 2750
},
{
"epoch": 24.642857142857142,
"grad_norm": 1.1105842590332031,
"learning_rate": 3.5962712322632844e-05,
"loss": 0.032877811789512636,
"step": 2760
},
{
"epoch": 24.732142857142858,
"grad_norm": 0.5468029379844666,
"learning_rate": 3.577932897686714e-05,
"loss": 0.03059898316860199,
"step": 2770
},
{
"epoch": 24.821428571428573,
"grad_norm": 0.43046024441719055,
"learning_rate": 3.559572108026204e-05,
"loss": 0.02730157971382141,
"step": 2780
},
{
"epoch": 24.910714285714285,
"grad_norm": 0.7536216378211975,
"learning_rate": 3.541189576674391e-05,
"loss": 0.03176028728485107,
"step": 2790
},
{
"epoch": 25.0,
"grad_norm": 1.3762458562850952,
"learning_rate": 3.522786017868663e-05,
"loss": 0.0352538138628006,
"step": 2800
},
{
"epoch": 25.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9889600030239687,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9889600030239687,
"eval_loss": 0.045154131948947906,
"eval_mean_accuracy": 0.9889600030239687,
"eval_mean_iou": 0.49448000151198435,
"eval_overall_accuracy": 0.9889600030239687,
"eval_runtime": 2.8182,
"eval_samples_per_second": 56.065,
"eval_steps_per_second": 7.097,
"step": 2800
},
{
"epoch": 25.089285714285715,
"grad_norm": 0.3534994125366211,
"learning_rate": 3.504362146663416e-05,
"loss": 0.03126908540725708,
"step": 2810
},
{
"epoch": 25.178571428571427,
"grad_norm": 0.5898330807685852,
"learning_rate": 3.485918678902263e-05,
"loss": 0.03366010189056397,
"step": 2820
},
{
"epoch": 25.267857142857142,
"grad_norm": 0.7023333311080933,
"learning_rate": 3.4674563311902265e-05,
"loss": 0.030235046148300172,
"step": 2830
},
{
"epoch": 25.357142857142858,
"grad_norm": 0.40369901061058044,
"learning_rate": 3.448975820865892e-05,
"loss": 0.02650986909866333,
"step": 2840
},
{
"epoch": 25.446428571428573,
"grad_norm": 0.47843503952026367,
"learning_rate": 3.430477865973538e-05,
"loss": 0.0322486013174057,
"step": 2850
},
{
"epoch": 25.535714285714285,
"grad_norm": 1.224301815032959,
"learning_rate": 3.411963185235238e-05,
"loss": 0.03207373321056366,
"step": 2860
},
{
"epoch": 25.625,
"grad_norm": 0.9510029554367065,
"learning_rate": 3.39343249802293e-05,
"loss": 0.031137165427207947,
"step": 2870
},
{
"epoch": 25.714285714285715,
"grad_norm": 0.4742358326911926,
"learning_rate": 3.374886524330474e-05,
"loss": 0.032748347520828246,
"step": 2880
},
{
"epoch": 25.803571428571427,
"grad_norm": 0.48148679733276367,
"learning_rate": 3.3563259847456706e-05,
"loss": 0.02805485725402832,
"step": 2890
},
{
"epoch": 25.892857142857142,
"grad_norm": 0.4079000949859619,
"learning_rate": 3.337751600422267e-05,
"loss": 0.03277623355388641,
"step": 2900
},
{
"epoch": 25.982142857142858,
"grad_norm": 0.502567708492279,
"learning_rate": 3.319164093051934e-05,
"loss": 0.03339660167694092,
"step": 2910
},
{
"epoch": 26.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9923893676463623,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9923893676463623,
"eval_loss": 0.04475132003426552,
"eval_mean_accuracy": 0.9923893676463623,
"eval_mean_iou": 0.49619468382318116,
"eval_overall_accuracy": 0.9923893676463623,
"eval_runtime": 3.0957,
"eval_samples_per_second": 51.038,
"eval_steps_per_second": 6.461,
"step": 2912
},
{
"epoch": 26.071428571428573,
"grad_norm": 0.7227765917778015,
"learning_rate": 3.300564184836229e-05,
"loss": 0.029735544323921205,
"step": 2920
},
{
"epoch": 26.160714285714285,
"grad_norm": 1.2855943441390991,
"learning_rate": 3.281952598458532e-05,
"loss": 0.0299568772315979,
"step": 2930
},
{
"epoch": 26.25,
"grad_norm": 0.6255515813827515,
"learning_rate": 3.263330057055968e-05,
"loss": 0.030430236458778383,
"step": 2940
},
{
"epoch": 26.339285714285715,
"grad_norm": 1.8101065158843994,
"learning_rate": 3.244697284191312e-05,
"loss": 0.03257070183753967,
"step": 2950
},
{
"epoch": 26.428571428571427,
"grad_norm": 0.7128406167030334,
"learning_rate": 3.2260550038248705e-05,
"loss": 0.029836279153823853,
"step": 2960
},
{
"epoch": 26.517857142857142,
"grad_norm": 0.7769372463226318,
"learning_rate": 3.207403940286358e-05,
"loss": 0.037280154228210446,
"step": 2970
},
{
"epoch": 26.607142857142858,
"grad_norm": 0.7605101466178894,
"learning_rate": 3.188744818246751e-05,
"loss": 0.03187412917613983,
"step": 2980
},
{
"epoch": 26.696428571428573,
"grad_norm": 1.993949294090271,
"learning_rate": 3.170078362690133e-05,
"loss": 0.030369496345520018,
"step": 2990
},
{
"epoch": 26.785714285714285,
"grad_norm": 0.6963241696357727,
"learning_rate": 3.1514052988855223e-05,
"loss": 0.030344370007514953,
"step": 3000
},
{
"epoch": 26.875,
"grad_norm": 0.4319656193256378,
"learning_rate": 3.1327263523586985e-05,
"loss": 0.029322752356529237,
"step": 3010
},
{
"epoch": 26.964285714285715,
"grad_norm": 0.48957666754722595,
"learning_rate": 3.114042248864007e-05,
"loss": 0.026906794309616087,
"step": 3020
},
{
"epoch": 27.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9915391984351606,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9915391984351606,
"eval_loss": 0.044823113828897476,
"eval_mean_accuracy": 0.9915391984351606,
"eval_mean_iou": 0.4957695992175803,
"eval_overall_accuracy": 0.9915391984351606,
"eval_runtime": 3.147,
"eval_samples_per_second": 50.207,
"eval_steps_per_second": 6.355,
"step": 3024
},
{
"epoch": 27.053571428571427,
"grad_norm": 0.8572945594787598,
"learning_rate": 3.0953537143561624e-05,
"loss": 0.0366124838590622,
"step": 3030
},
{
"epoch": 27.142857142857142,
"grad_norm": 0.6149380207061768,
"learning_rate": 3.076661474962045e-05,
"loss": 0.027939742803573607,
"step": 3040
},
{
"epoch": 27.232142857142858,
"grad_norm": 0.5692083239555359,
"learning_rate": 3.057966256952481e-05,
"loss": 0.03376020193099975,
"step": 3050
},
{
"epoch": 27.321428571428573,
"grad_norm": 0.32568567991256714,
"learning_rate": 3.0392687867140333e-05,
"loss": 0.031811395287513734,
"step": 3060
},
{
"epoch": 27.410714285714285,
"grad_norm": 0.8710930943489075,
"learning_rate": 3.0205697907207702e-05,
"loss": 0.032558149099349974,
"step": 3070
},
{
"epoch": 27.5,
"grad_norm": 0.41898801922798157,
"learning_rate": 3.0018699955060417e-05,
"loss": 0.02802801728248596,
"step": 3080
},
{
"epoch": 27.589285714285715,
"grad_norm": 0.3447811007499695,
"learning_rate": 2.9831701276342514e-05,
"loss": 0.02836693823337555,
"step": 3090
},
{
"epoch": 27.678571428571427,
"grad_norm": 0.3702087104320526,
"learning_rate": 2.9644709136726268e-05,
"loss": 0.03142592906951904,
"step": 3100
},
{
"epoch": 27.767857142857142,
"grad_norm": 0.4320816099643707,
"learning_rate": 2.9457730801629877e-05,
"loss": 0.02944057583808899,
"step": 3110
},
{
"epoch": 27.857142857142858,
"grad_norm": 0.6954593658447266,
"learning_rate": 2.927077353593516e-05,
"loss": 0.030368226766586303,
"step": 3120
},
{
"epoch": 27.946428571428573,
"grad_norm": 0.6075822710990906,
"learning_rate": 2.9083844603705326e-05,
"loss": 0.03189859688282013,
"step": 3130
},
{
"epoch": 28.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9898321951755401,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9898321951755401,
"eval_loss": 0.04428162798285484,
"eval_mean_accuracy": 0.9898321951755401,
"eval_mean_iou": 0.49491609758777005,
"eval_overall_accuracy": 0.9898321951755401,
"eval_runtime": 3.1745,
"eval_samples_per_second": 49.772,
"eval_steps_per_second": 6.3,
"step": 3136
},
{
"epoch": 28.035714285714285,
"grad_norm": 0.972698450088501,
"learning_rate": 2.8896951267902705e-05,
"loss": 0.030377256870269775,
"step": 3140
},
{
"epoch": 28.125,
"grad_norm": 0.5971301198005676,
"learning_rate": 2.8710100790106555e-05,
"loss": 0.029175907373428345,
"step": 3150
},
{
"epoch": 28.214285714285715,
"grad_norm": 0.3869675397872925,
"learning_rate": 2.8523300430230912e-05,
"loss": 0.030972689390182495,
"step": 3160
},
{
"epoch": 28.303571428571427,
"grad_norm": 0.4772997796535492,
"learning_rate": 2.833655744624256e-05,
"loss": 0.02870742082595825,
"step": 3170
},
{
"epoch": 28.392857142857142,
"grad_norm": 0.49730241298675537,
"learning_rate": 2.8149879093878954e-05,
"loss": 0.0323731005191803,
"step": 3180
},
{
"epoch": 28.482142857142858,
"grad_norm": 0.48639583587646484,
"learning_rate": 2.7963272626366367e-05,
"loss": 0.02942431569099426,
"step": 3190
},
{
"epoch": 28.571428571428573,
"grad_norm": 0.38169947266578674,
"learning_rate": 2.7776745294138023e-05,
"loss": 0.03691979944705963,
"step": 3200
},
{
"epoch": 28.660714285714285,
"grad_norm": 0.4951934516429901,
"learning_rate": 2.759030434455244e-05,
"loss": 0.031536877155303955,
"step": 3210
},
{
"epoch": 28.75,
"grad_norm": 0.39789584279060364,
"learning_rate": 2.7403957021611794e-05,
"loss": 0.029964196681976318,
"step": 3220
},
{
"epoch": 28.839285714285715,
"grad_norm": 0.6697349548339844,
"learning_rate": 2.7217710565680494e-05,
"loss": 0.02921389937400818,
"step": 3230
},
{
"epoch": 28.928571428571427,
"grad_norm": 0.6118156909942627,
"learning_rate": 2.7031572213203838e-05,
"loss": 0.029344850778579713,
"step": 3240
},
{
"epoch": 29.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9923891744626748,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9923891744626748,
"eval_loss": 0.045042846351861954,
"eval_mean_accuracy": 0.9923891744626748,
"eval_mean_iou": 0.4961945872313374,
"eval_overall_accuracy": 0.9923891744626748,
"eval_runtime": 3.0338,
"eval_samples_per_second": 52.08,
"eval_steps_per_second": 6.592,
"step": 3248
},
{
"epoch": 29.017857142857142,
"grad_norm": 0.3650244474411011,
"learning_rate": 2.6845549196426856e-05,
"loss": 0.025525736808776855,
"step": 3250
},
{
"epoch": 29.107142857142858,
"grad_norm": 0.46227961778640747,
"learning_rate": 2.665964874311331e-05,
"loss": 0.03523986339569092,
"step": 3260
},
{
"epoch": 29.196428571428573,
"grad_norm": 0.449188232421875,
"learning_rate": 2.6473878076264875e-05,
"loss": 0.030411550402641298,
"step": 3270
},
{
"epoch": 29.285714285714285,
"grad_norm": 0.4849155843257904,
"learning_rate": 2.6288244413840478e-05,
"loss": 0.02755580246448517,
"step": 3280
},
{
"epoch": 29.375,
"grad_norm": 0.5743690729141235,
"learning_rate": 2.6102754968475846e-05,
"loss": 0.029297468066215516,
"step": 3290
},
{
"epoch": 29.464285714285715,
"grad_norm": 0.7058063745498657,
"learning_rate": 2.5917416947203298e-05,
"loss": 0.032971051335334775,
"step": 3300
},
{
"epoch": 29.553571428571427,
"grad_norm": 0.6479628086090088,
"learning_rate": 2.5732237551171683e-05,
"loss": 0.029575762152671815,
"step": 3310
},
{
"epoch": 29.642857142857142,
"grad_norm": 0.9846095442771912,
"learning_rate": 2.5547223975366605e-05,
"loss": 0.030085331201553343,
"step": 3320
},
{
"epoch": 29.732142857142858,
"grad_norm": 0.4668130576610565,
"learning_rate": 2.5362383408330884e-05,
"loss": 0.031483760476112364,
"step": 3330
},
{
"epoch": 29.821428571428573,
"grad_norm": 1.0946239233016968,
"learning_rate": 2.5177723031885214e-05,
"loss": 0.026578304171562196,
"step": 3340
},
{
"epoch": 29.910714285714285,
"grad_norm": 0.601983368396759,
"learning_rate": 2.499325002084915e-05,
"loss": 0.02976991832256317,
"step": 3350
},
{
"epoch": 30.0,
"grad_norm": 0.40559685230255127,
"learning_rate": 2.480897154276232e-05,
"loss": 0.03062085509300232,
"step": 3360
},
{
"epoch": 30.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9923291265331581,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9923291265331581,
"eval_loss": 0.04375786706805229,
"eval_mean_accuracy": 0.9923291265331581,
"eval_mean_iou": 0.49616456326657904,
"eval_overall_accuracy": 0.9923291265331581,
"eval_runtime": 3.0864,
"eval_samples_per_second": 51.193,
"eval_steps_per_second": 6.48,
"step": 3360
},
{
"epoch": 30.089285714285715,
"grad_norm": 2.2518370151519775,
"learning_rate": 2.4624894757605942e-05,
"loss": 0.028901228308677675,
"step": 3370
},
{
"epoch": 30.178571428571427,
"grad_norm": 0.48904410004615784,
"learning_rate": 2.4441026817524623e-05,
"loss": 0.03043428063392639,
"step": 3380
},
{
"epoch": 30.267857142857142,
"grad_norm": 0.4779645502567291,
"learning_rate": 2.4257374866548496e-05,
"loss": 0.031688454747200015,
"step": 3390
},
{
"epoch": 30.357142857142858,
"grad_norm": 0.5410107374191284,
"learning_rate": 2.40739460403156e-05,
"loss": 0.029933920502662657,
"step": 3400
},
{
"epoch": 30.446428571428573,
"grad_norm": 0.5752859711647034,
"learning_rate": 2.389074746579468e-05,
"loss": 0.029010221362113953,
"step": 3410
},
{
"epoch": 30.535714285714285,
"grad_norm": 0.7090629935264587,
"learning_rate": 2.3707786261008217e-05,
"loss": 0.029284483194351195,
"step": 3420
},
{
"epoch": 30.625,
"grad_norm": 0.9575799107551575,
"learning_rate": 2.3525069534755923e-05,
"loss": 0.028822487592697142,
"step": 3430
},
{
"epoch": 30.714285714285715,
"grad_norm": 0.27941980957984924,
"learning_rate": 2.3342604386338497e-05,
"loss": 0.029538267850875856,
"step": 3440
},
{
"epoch": 30.803571428571427,
"grad_norm": 0.7441650032997131,
"learning_rate": 2.31603979052818e-05,
"loss": 0.025286585092544556,
"step": 3450
},
{
"epoch": 30.892857142857142,
"grad_norm": 0.5763952136039734,
"learning_rate": 2.2978457171061393e-05,
"loss": 0.031220585107803345,
"step": 3460
},
{
"epoch": 30.982142857142858,
"grad_norm": 0.5611822009086609,
"learning_rate": 2.2796789252827475e-05,
"loss": 0.02782772183418274,
"step": 3470
},
{
"epoch": 31.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.992043246873008,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.992043246873008,
"eval_loss": 0.04470207169651985,
"eval_mean_accuracy": 0.992043246873008,
"eval_mean_iou": 0.496021623436504,
"eval_overall_accuracy": 0.992043246873008,
"eval_runtime": 3.1674,
"eval_samples_per_second": 49.883,
"eval_steps_per_second": 6.314,
"step": 3472
},
{
"epoch": 31.071428571428573,
"grad_norm": 0.9794915914535522,
"learning_rate": 2.261540120913021e-05,
"loss": 0.031087765097618104,
"step": 3480
},
{
"epoch": 31.160714285714285,
"grad_norm": 0.625676691532135,
"learning_rate": 2.2434300087645497e-05,
"loss": 0.027998083829879762,
"step": 3490
},
{
"epoch": 31.25,
"grad_norm": 0.3041325509548187,
"learning_rate": 2.22534929249011e-05,
"loss": 0.025890350341796875,
"step": 3500
},
{
"epoch": 31.339285714285715,
"grad_norm": 0.8442551493644714,
"learning_rate": 2.207298674600328e-05,
"loss": 0.0253944993019104,
"step": 3510
},
{
"epoch": 31.428571428571427,
"grad_norm": 1.6644678115844727,
"learning_rate": 2.1892788564363828e-05,
"loss": 0.03048495650291443,
"step": 3520
},
{
"epoch": 31.517857142857142,
"grad_norm": 0.4767031967639923,
"learning_rate": 2.171290538142757e-05,
"loss": 0.02629549503326416,
"step": 3530
},
{
"epoch": 31.607142857142858,
"grad_norm": 0.5214105248451233,
"learning_rate": 2.1533344186400313e-05,
"loss": 0.027956664562225342,
"step": 3540
},
{
"epoch": 31.696428571428573,
"grad_norm": 0.43287837505340576,
"learning_rate": 2.135411195597732e-05,
"loss": 0.02858385443687439,
"step": 3550
},
{
"epoch": 31.785714285714285,
"grad_norm": 0.6804491877555847,
"learning_rate": 2.117521565407222e-05,
"loss": 0.024375714361667633,
"step": 3560
},
{
"epoch": 31.875,
"grad_norm": Infinity,
"learning_rate": 2.0996662231546415e-05,
"loss": 0.03603389859199524,
"step": 3570
},
{
"epoch": 31.964285714285715,
"grad_norm": 0.4699368476867676,
"learning_rate": 2.0818458625939044e-05,
"loss": 0.026799708604812622,
"step": 3580
},
{
"epoch": 32.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9924100061036386,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9924100061036386,
"eval_loss": 0.045893941074609756,
"eval_mean_accuracy": 0.9924100061036386,
"eval_mean_iou": 0.4962050030518193,
"eval_overall_accuracy": 0.9924100061036386,
"eval_runtime": 3.1947,
"eval_samples_per_second": 49.457,
"eval_steps_per_second": 6.26,
"step": 3584
},
{
"epoch": 32.05357142857143,
"grad_norm": 0.5421997308731079,
"learning_rate": 2.0640611761197383e-05,
"loss": 0.03136940598487854,
"step": 3590
},
{
"epoch": 32.142857142857146,
"grad_norm": 0.5340573191642761,
"learning_rate": 2.046312854740787e-05,
"loss": 0.024993625283241273,
"step": 3600
},
{
"epoch": 32.232142857142854,
"grad_norm": 0.854223370552063,
"learning_rate": 2.0286015880527604e-05,
"loss": 0.032940977811813356,
"step": 3610
},
{
"epoch": 32.32142857142857,
"grad_norm": 0.4844415485858917,
"learning_rate": 2.010928064211639e-05,
"loss": 0.027138784527778625,
"step": 3620
},
{
"epoch": 32.410714285714285,
"grad_norm": 0.8010973930358887,
"learning_rate": 1.993292969906938e-05,
"loss": 0.029732125997543334,
"step": 3630
},
{
"epoch": 32.5,
"grad_norm": 0.5439932942390442,
"learning_rate": 1.9756969903350243e-05,
"loss": 0.02823580801486969,
"step": 3640
},
{
"epoch": 32.589285714285715,
"grad_norm": 0.5155593156814575,
"learning_rate": 1.9581408091725015e-05,
"loss": 0.02901386618614197,
"step": 3650
},
{
"epoch": 32.67857142857143,
"grad_norm": 0.7744992971420288,
"learning_rate": 1.9406251085496335e-05,
"loss": 0.028212952613830566,
"step": 3660
},
{
"epoch": 32.767857142857146,
"grad_norm": 0.5233684182167053,
"learning_rate": 1.9231505690238513e-05,
"loss": 0.029126328229904175,
"step": 3670
},
{
"epoch": 32.857142857142854,
"grad_norm": 0.5012129545211792,
"learning_rate": 1.9057178695533066e-05,
"loss": 0.02480347752571106,
"step": 3680
},
{
"epoch": 32.94642857142857,
"grad_norm": 0.3605862259864807,
"learning_rate": 1.888327687470491e-05,
"loss": 0.026929333806037903,
"step": 3690
},
{
"epoch": 33.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9899491678982931,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9899491678982931,
"eval_loss": 0.04337907209992409,
"eval_mean_accuracy": 0.9899491678982931,
"eval_mean_iou": 0.49497458394914656,
"eval_overall_accuracy": 0.9899491678982931,
"eval_runtime": 3.1897,
"eval_samples_per_second": 49.535,
"eval_steps_per_second": 6.27,
"step": 3696
},
{
"epoch": 33.035714285714285,
"grad_norm": 0.7721555233001709,
"learning_rate": 1.8709806984559214e-05,
"loss": 0.027222782373428345,
"step": 3700
},
{
"epoch": 33.125,
"grad_norm": 0.400393009185791,
"learning_rate": 1.8536775765118827e-05,
"loss": 0.02593788206577301,
"step": 3710
},
{
"epoch": 33.214285714285715,
"grad_norm": 0.5267050266265869,
"learning_rate": 1.8364189939362448e-05,
"loss": 0.031792303919792174,
"step": 3720
},
{
"epoch": 33.30357142857143,
"grad_norm": 0.4609811007976532,
"learning_rate": 1.819205621296338e-05,
"loss": 0.025541388988494874,
"step": 3730
},
{
"epoch": 33.392857142857146,
"grad_norm": 0.47067102789878845,
"learning_rate": 1.8020381274029008e-05,
"loss": 0.025906682014465332,
"step": 3740
},
{
"epoch": 33.482142857142854,
"grad_norm": 0.5264711976051331,
"learning_rate": 1.78491717928409e-05,
"loss": 0.02825929820537567,
"step": 3750
},
{
"epoch": 33.57142857142857,
"grad_norm": 0.7650744915008545,
"learning_rate": 1.7678434421595687e-05,
"loss": 0.02745148241519928,
"step": 3760
},
{
"epoch": 33.660714285714285,
"grad_norm": 0.7770243883132935,
"learning_rate": 1.7508175794146576e-05,
"loss": 0.03023013174533844,
"step": 3770
},
{
"epoch": 33.75,
"grad_norm": 0.5987495183944702,
"learning_rate": 1.7338402525745577e-05,
"loss": 0.02483441084623337,
"step": 3780
},
{
"epoch": 33.839285714285715,
"grad_norm": 0.35336533188819885,
"learning_rate": 1.716912121278651e-05,
"loss": 0.02692849636077881,
"step": 3790
},
{
"epoch": 33.92857142857143,
"grad_norm": 0.39276322722435,
"learning_rate": 1.7000338432548702e-05,
"loss": 0.026848804950714112,
"step": 3800
},
{
"epoch": 34.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9906004867005427,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9906004867005427,
"eval_loss": 0.04445888474583626,
"eval_mean_accuracy": 0.9906004867005427,
"eval_mean_iou": 0.49530024335027134,
"eval_overall_accuracy": 0.9906004867005427,
"eval_runtime": 3.0691,
"eval_samples_per_second": 51.48,
"eval_steps_per_second": 6.516,
"step": 3808
},
{
"epoch": 34.017857142857146,
"grad_norm": 0.4166980981826782,
"learning_rate": 1.683206074294139e-05,
"loss": 0.025022292137145997,
"step": 3810
},
{
"epoch": 34.107142857142854,
"grad_norm": 0.5631642937660217,
"learning_rate": 1.666429468224898e-05,
"loss": 0.025662198662757874,
"step": 3820
},
{
"epoch": 34.19642857142857,
"grad_norm": 0.9187061786651611,
"learning_rate": 1.6497046768876947e-05,
"loss": 0.02872176170349121,
"step": 3830
},
{
"epoch": 34.285714285714285,
"grad_norm": 0.5928124785423279,
"learning_rate": 1.633032350109864e-05,
"loss": 0.028657811880111694,
"step": 3840
},
{
"epoch": 34.375,
"grad_norm": 0.41895392537117004,
"learning_rate": 1.616413135680272e-05,
"loss": 0.02543511092662811,
"step": 3850
},
{
"epoch": 34.464285714285715,
"grad_norm": 0.5905092358589172,
"learning_rate": 1.599847679324151e-05,
"loss": 0.026353082060813902,
"step": 3860
},
{
"epoch": 34.55357142857143,
"grad_norm": 0.5018086433410645,
"learning_rate": 1.5833366246780132e-05,
"loss": 0.029970470070838928,
"step": 3870
},
{
"epoch": 34.642857142857146,
"grad_norm": 0.7949761152267456,
"learning_rate": 1.566880613264633e-05,
"loss": 0.025467506051063536,
"step": 3880
},
{
"epoch": 34.732142857142854,
"grad_norm": 0.5539437532424927,
"learning_rate": 1.550480284468134e-05,
"loss": 0.027051180601119995,
"step": 3890
},
{
"epoch": 34.82142857142857,
"grad_norm": 0.740074098110199,
"learning_rate": 1.534136275509136e-05,
"loss": 0.028169989585876465,
"step": 3900
},
{
"epoch": 34.910714285714285,
"grad_norm": 0.5646836161613464,
"learning_rate": 1.5178492214199992e-05,
"loss": 0.028034254908561707,
"step": 3910
},
{
"epoch": 35.0,
"grad_norm": 0.6476469039916992,
"learning_rate": 1.5016197550201563e-05,
"loss": 0.03015502095222473,
"step": 3920
},
{
"epoch": 35.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9891122961642446,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9891122961642446,
"eval_loss": 0.04427924379706383,
"eval_mean_accuracy": 0.9891122961642446,
"eval_mean_iou": 0.4945561480821223,
"eval_overall_accuracy": 0.9891122961642446,
"eval_runtime": 2.9945,
"eval_samples_per_second": 52.763,
"eval_steps_per_second": 6.679,
"step": 3920
},
{
"epoch": 35.089285714285715,
"grad_norm": 1.9664608240127563,
"learning_rate": 1.4854485068915138e-05,
"loss": 0.0286253958940506,
"step": 3930
},
{
"epoch": 35.17857142857143,
"grad_norm": 0.35685494542121887,
"learning_rate": 1.469336105353964e-05,
"loss": 0.02511138916015625,
"step": 3940
},
{
"epoch": 35.267857142857146,
"grad_norm": 0.6063141822814941,
"learning_rate": 1.4532831764409593e-05,
"loss": 0.027212321758270264,
"step": 3950
},
{
"epoch": 35.357142857142854,
"grad_norm": 0.6104390621185303,
"learning_rate": 1.4372903438752002e-05,
"loss": 0.025636497139930724,
"step": 3960
},
{
"epoch": 35.44642857142857,
"grad_norm": 0.616294264793396,
"learning_rate": 1.4213582290443913e-05,
"loss": 0.02637772560119629,
"step": 3970
},
{
"epoch": 35.535714285714285,
"grad_norm": 0.7684455513954163,
"learning_rate": 1.405487450977105e-05,
"loss": 0.02701924443244934,
"step": 3980
},
{
"epoch": 35.625,
"grad_norm": 0.3559069037437439,
"learning_rate": 1.389678626318724e-05,
"loss": 0.030377697944641114,
"step": 3990
},
{
"epoch": 35.714285714285715,
"grad_norm": 0.4215583801269531,
"learning_rate": 1.373932369307488e-05,
"loss": 0.022440439462661742,
"step": 4000
},
{
"epoch": 35.80357142857143,
"grad_norm": 0.3485909104347229,
"learning_rate": 1.3582492917506218e-05,
"loss": 0.024866998195648193,
"step": 4010
},
{
"epoch": 35.892857142857146,
"grad_norm": 0.7256842851638794,
"learning_rate": 1.3426300030005673e-05,
"loss": 0.024919840693473815,
"step": 4020
},
{
"epoch": 35.982142857142854,
"grad_norm": 0.3357905447483063,
"learning_rate": 1.3270751099313106e-05,
"loss": 0.02386535108089447,
"step": 4030
},
{
"epoch": 36.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.991872182717768,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.991872182717768,
"eval_loss": 0.04389407858252525,
"eval_mean_accuracy": 0.991872182717768,
"eval_mean_iou": 0.495936091358884,
"eval_overall_accuracy": 0.991872182717768,
"eval_runtime": 3.1411,
"eval_samples_per_second": 50.301,
"eval_steps_per_second": 6.367,
"step": 4032
},
{
"epoch": 36.07142857142857,
"grad_norm": 1.1024103164672852,
"learning_rate": 1.3115852169147942e-05,
"loss": 0.02843126356601715,
"step": 4040
},
{
"epoch": 36.160714285714285,
"grad_norm": 0.5255261659622192,
"learning_rate": 1.2961609257974446e-05,
"loss": 0.028734481334686278,
"step": 4050
},
{
"epoch": 36.25,
"grad_norm": 1.559330940246582,
"learning_rate": 1.28080283587678e-05,
"loss": 0.02784898579120636,
"step": 4060
},
{
"epoch": 36.339285714285715,
"grad_norm": 1.8099925518035889,
"learning_rate": 1.2655115438781276e-05,
"loss": 0.02688506543636322,
"step": 4070
},
{
"epoch": 36.42857142857143,
"grad_norm": 1.2787431478500366,
"learning_rate": 1.2502876439314429e-05,
"loss": 0.027660322189331055,
"step": 4080
},
{
"epoch": 36.517857142857146,
"grad_norm": 0.6661645770072937,
"learning_rate": 1.2351317275482168e-05,
"loss": 0.028162682056427003,
"step": 4090
},
{
"epoch": 36.607142857142854,
"grad_norm": 0.659756600856781,
"learning_rate": 1.2200443835985017e-05,
"loss": 0.02568315863609314,
"step": 4100
},
{
"epoch": 36.69642857142857,
"grad_norm": 0.32298824191093445,
"learning_rate": 1.2050261982880229e-05,
"loss": 0.025612333416938783,
"step": 4110
},
{
"epoch": 36.785714285714285,
"grad_norm": 0.5366314053535461,
"learning_rate": 1.1900777551354101e-05,
"loss": 0.02462407052516937,
"step": 4120
},
{
"epoch": 36.875,
"grad_norm": 0.3352350890636444,
"learning_rate": 1.1751996349495216e-05,
"loss": 0.023358260095119477,
"step": 4130
},
{
"epoch": 36.964285714285715,
"grad_norm": 0.45832622051239014,
"learning_rate": 1.1603924158068747e-05,
"loss": 0.026781818270683287,
"step": 4140
},
{
"epoch": 37.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.991538457897692,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.991538457897692,
"eval_loss": 0.044210035353899,
"eval_mean_accuracy": 0.991538457897692,
"eval_mean_iou": 0.495769228948846,
"eval_overall_accuracy": 0.991538457897692,
"eval_runtime": 3.158,
"eval_samples_per_second": 50.031,
"eval_steps_per_second": 6.333,
"step": 4144
},
{
"epoch": 37.05357142857143,
"grad_norm": 0.33479002118110657,
"learning_rate": 1.1456566730291887e-05,
"loss": 0.024782487750053407,
"step": 4150
},
{
"epoch": 37.142857142857146,
"grad_norm": 0.4473731815814972,
"learning_rate": 1.1309929791610332e-05,
"loss": 0.02461591362953186,
"step": 4160
},
{
"epoch": 37.232142857142854,
"grad_norm": 0.5323212146759033,
"learning_rate": 1.1164019039475756e-05,
"loss": 0.029087895154953004,
"step": 4170
},
{
"epoch": 37.32142857142857,
"grad_norm": 0.34507501125335693,
"learning_rate": 1.1018840143124519e-05,
"loss": 0.023842757940292357,
"step": 4180
},
{
"epoch": 37.410714285714285,
"grad_norm": 0.6882377862930298,
"learning_rate": 1.087439874335733e-05,
"loss": 0.026730936765670777,
"step": 4190
},
{
"epoch": 37.5,
"grad_norm": 0.7014771699905396,
"learning_rate": 1.0730700452320104e-05,
"loss": 0.02618339955806732,
"step": 4200
},
{
"epoch": 37.589285714285715,
"grad_norm": 0.5191277861595154,
"learning_rate": 1.0587750853285933e-05,
"loss": 0.02311095893383026,
"step": 4210
},
{
"epoch": 37.67857142857143,
"grad_norm": 0.32207751274108887,
"learning_rate": 1.0445555500438094e-05,
"loss": 0.024721568822860716,
"step": 4220
},
{
"epoch": 37.767857142857146,
"grad_norm": 0.4454548954963684,
"learning_rate": 1.0304119918654315e-05,
"loss": 0.026396998763084413,
"step": 4230
},
{
"epoch": 37.857142857142854,
"grad_norm": 0.4234572947025299,
"learning_rate": 1.0163449603292046e-05,
"loss": 0.025258558988571166,
"step": 4240
},
{
"epoch": 37.94642857142857,
"grad_norm": 0.36918315291404724,
"learning_rate": 1.0023550019974975e-05,
"loss": 0.031771954894065854,
"step": 4250
},
{
"epoch": 38.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9915934830513351,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9915934830513351,
"eval_loss": 0.04508010670542717,
"eval_mean_accuracy": 0.9915934830513351,
"eval_mean_iou": 0.49579674152566755,
"eval_overall_accuracy": 0.9915934830513351,
"eval_runtime": 3.1481,
"eval_samples_per_second": 50.188,
"eval_steps_per_second": 6.353,
"step": 4256
},
{
"epoch": 38.035714285714285,
"grad_norm": 0.3639099597930908,
"learning_rate": 9.884426604380682e-06,
"loss": 0.03158144354820251,
"step": 4260
},
{
"epoch": 38.125,
"grad_norm": 0.3746374249458313,
"learning_rate": 9.746084762029392e-06,
"loss": 0.027127474546432495,
"step": 4270
},
{
"epoch": 38.214285714285715,
"grad_norm": 0.7463239431381226,
"learning_rate": 9.608529868073992e-06,
"loss": 0.02929815649986267,
"step": 4280
},
{
"epoch": 38.30357142857143,
"grad_norm": 0.2743181586265564,
"learning_rate": 9.471767267091185e-06,
"loss": 0.024283508956432342,
"step": 4290
},
{
"epoch": 38.392857142857146,
"grad_norm": 0.4589490294456482,
"learning_rate": 9.335802272873778e-06,
"loss": 0.0359749972820282,
"step": 4300
},
{
"epoch": 38.482142857142854,
"grad_norm": 0.6548665761947632,
"learning_rate": 9.200640168224273e-06,
"loss": 0.02526823282241821,
"step": 4310
},
{
"epoch": 38.57142857142857,
"grad_norm": 0.8196024894714355,
"learning_rate": 9.066286204749602e-06,
"loss": 0.029026347398757934,
"step": 4320
},
{
"epoch": 38.660714285714285,
"grad_norm": 0.954537034034729,
"learning_rate": 8.932745602657037e-06,
"loss": 0.028312593698501587,
"step": 4330
},
{
"epoch": 38.75,
"grad_norm": 0.23943273723125458,
"learning_rate": 8.800023550551443e-06,
"loss": 0.021906113624572753,
"step": 4340
},
{
"epoch": 38.839285714285715,
"grad_norm": 0.4769308567047119,
"learning_rate": 8.668125205233592e-06,
"loss": 0.024248187243938447,
"step": 4350
},
{
"epoch": 38.92857142857143,
"grad_norm": 0.8277206420898438,
"learning_rate": 8.537055691499845e-06,
"loss": 0.027632582187652587,
"step": 4360
},
{
"epoch": 39.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9912071800709905,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9912071800709905,
"eval_loss": 0.044417619705200195,
"eval_mean_accuracy": 0.9912071800709905,
"eval_mean_iou": 0.49560359003549526,
"eval_overall_accuracy": 0.9912071800709905,
"eval_runtime": 3.0475,
"eval_samples_per_second": 51.846,
"eval_steps_per_second": 6.563,
"step": 4368
},
{
"epoch": 39.017857142857146,
"grad_norm": 0.5799295902252197,
"learning_rate": 8.406820101943053e-06,
"loss": 0.029939955472946166,
"step": 4370
},
{
"epoch": 39.107142857142854,
"grad_norm": 0.4670115113258362,
"learning_rate": 8.277423496754626e-06,
"loss": 0.02502877414226532,
"step": 4380
},
{
"epoch": 39.19642857142857,
"grad_norm": 0.3573046922683716,
"learning_rate": 8.148870903527995e-06,
"loss": 0.027808144688606262,
"step": 4390
},
{
"epoch": 39.285714285714285,
"grad_norm": 0.48127973079681396,
"learning_rate": 8.021167317063218e-06,
"loss": 0.024090613424777984,
"step": 4400
},
{
"epoch": 39.375,
"grad_norm": 0.5244694352149963,
"learning_rate": 7.894317699172912e-06,
"loss": 0.027278715372085573,
"step": 4410
},
{
"epoch": 39.464285714285715,
"grad_norm": 0.5811761021614075,
"learning_rate": 7.768326978489516e-06,
"loss": 0.027140852808952332,
"step": 4420
},
{
"epoch": 39.55357142857143,
"grad_norm": 0.7176029086112976,
"learning_rate": 7.643200050273741e-06,
"loss": 0.026023095846176146,
"step": 4430
},
{
"epoch": 39.642857142857146,
"grad_norm": 0.28565794229507446,
"learning_rate": 7.518941776224381e-06,
"loss": 0.024949049949645995,
"step": 4440
},
{
"epoch": 39.732142857142854,
"grad_norm": 0.42266854643821716,
"learning_rate": 7.395556984289442e-06,
"loss": 0.02561112344264984,
"step": 4450
},
{
"epoch": 39.82142857142857,
"grad_norm": 0.9398337602615356,
"learning_rate": 7.273050468478509e-06,
"loss": 0.024365237355232237,
"step": 4460
},
{
"epoch": 39.910714285714285,
"grad_norm": 0.370419979095459,
"learning_rate": 7.151426988676538e-06,
"loss": 0.025940805673599243,
"step": 4470
},
{
"epoch": 40.0,
"grad_norm": 0.46006032824516296,
"learning_rate": 7.0306912704588566e-06,
"loss": 0.02482418715953827,
"step": 4480
},
{
"epoch": 40.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9920959538224017,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9920959538224017,
"eval_loss": 0.045616794377565384,
"eval_mean_accuracy": 0.9920959538224017,
"eval_mean_iou": 0.49604797691120084,
"eval_overall_accuracy": 0.9920959538224017,
"eval_runtime": 2.8701,
"eval_samples_per_second": 55.05,
"eval_steps_per_second": 6.968,
"step": 4480
},
{
"epoch": 40.089285714285715,
"grad_norm": 0.3945085406303406,
"learning_rate": 6.910848004907583e-06,
"loss": 0.026185140013694763,
"step": 4490
},
{
"epoch": 40.17857142857143,
"grad_norm": 0.6535700559616089,
"learning_rate": 6.791901848429387e-06,
"loss": 0.02537115216255188,
"step": 4500
},
{
"epoch": 40.267857142857146,
"grad_norm": 0.5408845543861389,
"learning_rate": 6.673857422574499e-06,
"loss": 0.025524777173995972,
"step": 4510
},
{
"epoch": 40.357142857142854,
"grad_norm": 0.6645027995109558,
"learning_rate": 6.556719313857219e-06,
"loss": 0.0288840651512146,
"step": 4520
},
{
"epoch": 40.44642857142857,
"grad_norm": 0.2951991856098175,
"learning_rate": 6.440492073577659e-06,
"loss": 0.02452797442674637,
"step": 4530
},
{
"epoch": 40.535714285714285,
"grad_norm": 0.4799725413322449,
"learning_rate": 6.325180217644914e-06,
"loss": 0.024873518943786622,
"step": 4540
},
{
"epoch": 40.625,
"grad_norm": 0.3771775960922241,
"learning_rate": 6.2107882264016446e-06,
"loss": 0.025704348087310792,
"step": 4550
},
{
"epoch": 40.714285714285715,
"grad_norm": 0.36452680826187134,
"learning_rate": 6.097320544449921e-06,
"loss": 0.02450278103351593,
"step": 4560
},
{
"epoch": 40.80357142857143,
"grad_norm": 0.7826708555221558,
"learning_rate": 5.984781580478611e-06,
"loss": 0.02239405959844589,
"step": 4570
},
{
"epoch": 40.892857142857146,
"grad_norm": 0.4126140773296356,
"learning_rate": 5.873175707092019e-06,
"loss": 0.029208868741989136,
"step": 4580
},
{
"epoch": 40.982142857142854,
"grad_norm": 0.4714967906475067,
"learning_rate": 5.7625072606400375e-06,
"loss": 0.02443849891424179,
"step": 4590
},
{
"epoch": 41.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9904924004274125,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9904924004274125,
"eval_loss": 0.04487628862261772,
"eval_mean_accuracy": 0.9904924004274125,
"eval_mean_iou": 0.49524620021370624,
"eval_overall_accuracy": 0.9904924004274125,
"eval_runtime": 3.1369,
"eval_samples_per_second": 50.367,
"eval_steps_per_second": 6.376,
"step": 4592
},
{
"epoch": 41.07142857142857,
"grad_norm": 0.8939480781555176,
"learning_rate": 5.652780541049631e-06,
"loss": 0.024046406149864197,
"step": 4600
},
{
"epoch": 41.160714285714285,
"grad_norm": 0.9223622679710388,
"learning_rate": 5.543999811657797e-06,
"loss": 0.026213526725769043,
"step": 4610
},
{
"epoch": 41.25,
"grad_norm": 0.2867562770843506,
"learning_rate": 5.436169299045876e-06,
"loss": 0.028421574831008913,
"step": 4620
},
{
"epoch": 41.339285714285715,
"grad_norm": 0.5164304375648499,
"learning_rate": 5.329293192875387e-06,
"loss": 0.02325395345687866,
"step": 4630
},
{
"epoch": 41.42857142857143,
"grad_norm": 0.34760358929634094,
"learning_rate": 5.223375645725183e-06,
"loss": 0.02278565615415573,
"step": 4640
},
{
"epoch": 41.517857142857146,
"grad_norm": 0.3044535219669342,
"learning_rate": 5.118420772930138e-06,
"loss": 0.025249192118644716,
"step": 4650
},
{
"epoch": 41.607142857142854,
"grad_norm": 0.7161318063735962,
"learning_rate": 5.01443265242126e-06,
"loss": 0.025399017333984374,
"step": 4660
},
{
"epoch": 41.69642857142857,
"grad_norm": 0.48156532645225525,
"learning_rate": 4.911415324567213e-06,
"loss": 0.02383261322975159,
"step": 4670
},
{
"epoch": 41.785714285714285,
"grad_norm": 0.5352237224578857,
"learning_rate": 4.809372792017372e-06,
"loss": 0.02105867862701416,
"step": 4680
},
{
"epoch": 41.875,
"grad_norm": 0.5803747773170471,
"learning_rate": 4.708309019546263e-06,
"loss": 0.02634103000164032,
"step": 4690
},
{
"epoch": 41.964285714285715,
"grad_norm": 0.47478434443473816,
"learning_rate": 4.608227933899527e-06,
"loss": 0.023492810130119324,
"step": 4700
},
{
"epoch": 42.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9922144076200919,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9922144076200919,
"eval_loss": 0.044545359909534454,
"eval_mean_accuracy": 0.9922144076200919,
"eval_mean_iou": 0.49610720381004597,
"eval_overall_accuracy": 0.9922144076200919,
"eval_runtime": 3.0802,
"eval_samples_per_second": 51.295,
"eval_steps_per_second": 6.493,
"step": 4704
},
{
"epoch": 42.05357142857143,
"grad_norm": 0.4991433918476105,
"learning_rate": 4.509133423641388e-06,
"loss": 0.028053835034370422,
"step": 4710
},
{
"epoch": 42.142857142857146,
"grad_norm": 0.5921125411987305,
"learning_rate": 4.4110293390035e-06,
"loss": 0.024588567018508912,
"step": 4720
},
{
"epoch": 42.232142857142854,
"grad_norm": 0.4289485216140747,
"learning_rate": 4.313919491735413e-06,
"loss": 0.026377671957015993,
"step": 4730
},
{
"epoch": 42.32142857142857,
"grad_norm": 0.2543030381202698,
"learning_rate": 4.217807654956419e-06,
"loss": 0.02101795971393585,
"step": 4740
},
{
"epoch": 42.410714285714285,
"grad_norm": 0.46004971861839294,
"learning_rate": 4.122697563008991e-06,
"loss": 0.023616319894790648,
"step": 4750
},
{
"epoch": 42.5,
"grad_norm": 0.4452957808971405,
"learning_rate": 4.028592911313669e-06,
"loss": 0.02816382348537445,
"step": 4760
},
{
"epoch": 42.589285714285715,
"grad_norm": 1.8105047941207886,
"learning_rate": 3.935497356225467e-06,
"loss": 0.03450767695903778,
"step": 4770
},
{
"epoch": 42.67857142857143,
"grad_norm": 0.3400633633136749,
"learning_rate": 3.843414514891828e-06,
"loss": 0.02481631338596344,
"step": 4780
},
{
"epoch": 42.767857142857146,
"grad_norm": 0.3335254490375519,
"learning_rate": 3.752347965112084e-06,
"loss": 0.02071080356836319,
"step": 4790
},
{
"epoch": 42.857142857142854,
"grad_norm": 0.36557644605636597,
"learning_rate": 3.6623012451984194e-06,
"loss": 0.024737077951431274,
"step": 4800
},
{
"epoch": 42.94642857142857,
"grad_norm": 0.5764870047569275,
"learning_rate": 3.5732778538384336e-06,
"loss": 0.024080076813697816,
"step": 4810
},
{
"epoch": 43.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9919902823453646,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9919902823453646,
"eval_loss": 0.04448164626955986,
"eval_mean_accuracy": 0.9919902823453646,
"eval_mean_iou": 0.4959951411726823,
"eval_overall_accuracy": 0.9919902823453646,
"eval_runtime": 3.171,
"eval_samples_per_second": 49.827,
"eval_steps_per_second": 6.307,
"step": 4816
},
{
"epoch": 43.035714285714285,
"grad_norm": 0.4781723916530609,
"learning_rate": 3.485281249959158e-06,
"loss": 0.026803573966026305,
"step": 4820
},
{
"epoch": 43.125,
"grad_norm": 0.3812042772769928,
"learning_rate": 3.3983148525926798e-06,
"loss": 0.024715760350227357,
"step": 4830
},
{
"epoch": 43.214285714285715,
"grad_norm": 0.4324609041213989,
"learning_rate": 3.312382040743319e-06,
"loss": 0.027126455307006837,
"step": 4840
},
{
"epoch": 43.30357142857143,
"grad_norm": 0.8323965668678284,
"learning_rate": 3.2274861532563093e-06,
"loss": 0.02302350103855133,
"step": 4850
},
{
"epoch": 43.392857142857146,
"grad_norm": 0.40330275893211365,
"learning_rate": 3.143630488688095e-06,
"loss": 0.024910798668861388,
"step": 4860
},
{
"epoch": 43.482142857142854,
"grad_norm": 0.7080916166305542,
"learning_rate": 3.060818305178145e-06,
"loss": 0.024807298183441163,
"step": 4870
},
{
"epoch": 43.57142857142857,
"grad_norm": 2.711069107055664,
"learning_rate": 2.979052820322364e-06,
"loss": 0.024544814229011537,
"step": 4880
},
{
"epoch": 43.660714285714285,
"grad_norm": 7.1795220375061035,
"learning_rate": 2.898337211048119e-06,
"loss": 0.0320773184299469,
"step": 4890
},
{
"epoch": 43.75,
"grad_norm": 0.5481147766113281,
"learning_rate": 2.8186746134907225e-06,
"loss": 0.02236861139535904,
"step": 4900
},
{
"epoch": 43.839285714285715,
"grad_norm": 0.5208039879798889,
"learning_rate": 2.7400681228716583e-06,
"loss": 0.025225913524627684,
"step": 4910
},
{
"epoch": 43.92857142857143,
"grad_norm": 0.8581423163414001,
"learning_rate": 2.6625207933782827e-06,
"loss": 0.029476696252822877,
"step": 4920
},
{
"epoch": 44.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9918761107860795,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9918761107860795,
"eval_loss": 0.044531892985105515,
"eval_mean_accuracy": 0.9918761107860795,
"eval_mean_iou": 0.49593805539303976,
"eval_overall_accuracy": 0.9918761107860795,
"eval_runtime": 2.9802,
"eval_samples_per_second": 53.017,
"eval_steps_per_second": 6.711,
"step": 4928
},
{
"epoch": 44.017857142857146,
"grad_norm": 0.33332762122154236,
"learning_rate": 2.5860356380451466e-06,
"loss": 0.021295398473739624,
"step": 4930
},
{
"epoch": 44.107142857142854,
"grad_norm": 0.9368950128555298,
"learning_rate": 2.5106156286369418e-06,
"loss": 0.024914734065532684,
"step": 4940
},
{
"epoch": 44.19642857142857,
"grad_norm": 0.4496859610080719,
"learning_rate": 2.4362636955330543e-06,
"loss": 0.02527157962322235,
"step": 4950
},
{
"epoch": 44.285714285714285,
"grad_norm": 0.6395953893661499,
"learning_rate": 2.362982727613658e-06,
"loss": 0.023759710788726806,
"step": 4960
},
{
"epoch": 44.375,
"grad_norm": 0.7984117269515991,
"learning_rate": 2.2907755721475286e-06,
"loss": 0.022670991718769073,
"step": 4970
},
{
"epoch": 44.464285714285715,
"grad_norm": 0.4340791404247284,
"learning_rate": 2.219645034681367e-06,
"loss": 0.024120573699474335,
"step": 4980
},
{
"epoch": 44.55357142857143,
"grad_norm": 0.5286053419113159,
"learning_rate": 2.1495938789308055e-06,
"loss": 0.02684595584869385,
"step": 4990
},
{
"epoch": 44.642857142857146,
"grad_norm": 0.5050071477890015,
"learning_rate": 2.0806248266730554e-06,
"loss": 0.026467105746269225,
"step": 5000
},
{
"epoch": 44.732142857142854,
"grad_norm": 0.2880910038948059,
"learning_rate": 2.012740557641105e-06,
"loss": 0.021798455715179445,
"step": 5010
},
{
"epoch": 44.82142857142857,
"grad_norm": 0.3844790458679199,
"learning_rate": 1.945943709419652e-06,
"loss": 0.02199341207742691,
"step": 5020
},
{
"epoch": 44.910714285714285,
"grad_norm": 0.5376768112182617,
"learning_rate": 1.8802368773425739e-06,
"loss": 0.025217828154563905,
"step": 5030
},
{
"epoch": 45.0,
"grad_norm": 0.8637105822563171,
"learning_rate": 1.8156226143921162e-06,
"loss": 0.025202780961990356,
"step": 5040
},
{
"epoch": 45.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9919142645643516,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9919142645643516,
"eval_loss": 0.04428554326295853,
"eval_mean_accuracy": 0.9919142645643516,
"eval_mean_iou": 0.4959571322821758,
"eval_overall_accuracy": 0.9919142645643516,
"eval_runtime": 3.2068,
"eval_samples_per_second": 49.271,
"eval_steps_per_second": 6.237,
"step": 5040
},
{
"epoch": 45.089285714285715,
"grad_norm": 0.36045849323272705,
"learning_rate": 1.7521034310997053e-06,
"loss": 0.023151762783527374,
"step": 5050
},
{
"epoch": 45.17857142857143,
"grad_norm": 0.5583776831626892,
"learning_rate": 1.689681795448389e-06,
"loss": 0.027086129784584044,
"step": 5060
},
{
"epoch": 45.267857142857146,
"grad_norm": 0.28848934173583984,
"learning_rate": 1.6283601327769371e-06,
"loss": 0.024879464507102968,
"step": 5070
},
{
"epoch": 45.357142857142854,
"grad_norm": 0.5597347021102905,
"learning_rate": 1.56814082568564e-06,
"loss": 0.025781130790710448,
"step": 5080
},
{
"epoch": 45.44642857142857,
"grad_norm": 0.42186370491981506,
"learning_rate": 1.5090262139436896e-06,
"loss": 0.026576164364814758,
"step": 5090
},
{
"epoch": 45.535714285714285,
"grad_norm": 0.6118794083595276,
"learning_rate": 1.4510185943983112e-06,
"loss": 0.026358428597450256,
"step": 5100
},
{
"epoch": 45.625,
"grad_norm": 0.46963897347450256,
"learning_rate": 1.3941202208854965e-06,
"loss": 0.025634509325027467,
"step": 5110
},
{
"epoch": 45.714285714285715,
"grad_norm": 0.8034435510635376,
"learning_rate": 1.338333304142435e-06,
"loss": 0.02395763248205185,
"step": 5120
},
{
"epoch": 45.80357142857143,
"grad_norm": 0.6469313502311707,
"learning_rate": 1.2836600117216346e-06,
"loss": 0.024726195633411406,
"step": 5130
},
{
"epoch": 45.892857142857146,
"grad_norm": 0.4325697124004364,
"learning_rate": 1.2301024679066808e-06,
"loss": 0.02584630250930786,
"step": 5140
},
{
"epoch": 45.982142857142854,
"grad_norm": 0.39687296748161316,
"learning_rate": 1.177662753629717e-06,
"loss": 0.021341803669929504,
"step": 5150
},
{
"epoch": 46.0,
"eval_accuracy_background": NaN,
"eval_accuracy_crop": 0.9921635681130104,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9921635681130104,
"eval_loss": 0.044276703149080276,
"eval_mean_accuracy": 0.9921635681130104,
"eval_mean_iou": 0.4960817840565052,
"eval_overall_accuracy": 0.9921635681130104,
"eval_runtime": 3.1403,
"eval_samples_per_second": 50.313,
"eval_steps_per_second": 6.369,
"step": 5152
},
{
"epoch": 46.07142857142857,
"grad_norm": 0.5137065649032593,
"learning_rate": 1.126342906390585e-06,
"loss": 0.02478640079498291,
"step": 5160
},
{
"epoch": 46.160714285714285,
"grad_norm": 0.5068938136100769,
"learning_rate": 1.0761449201776464e-06,
"loss": 0.022511668503284454,
"step": 5170
},
{
"epoch": 46.25,
"grad_norm": 0.49176064133644104,
"learning_rate": 1.0270707453903428e-06,
"loss": 0.025940099358558656,
"step": 5180
},
{
"epoch": 46.339285714285715,
"grad_norm": 0.4621039927005768,
"learning_rate": 9.791222887633711e-07,
"loss": 0.02201744318008423,
"step": 5190
},
{
"epoch": 46.42857142857143,
"grad_norm": 3.4700331687927246,
"learning_rate": 9.323014132926355e-07,
"loss": 0.03096678853034973,
"step": 5200
},
{
"epoch": 46.517857142857146,
"grad_norm": 0.49781036376953125,
"learning_rate": 8.86609938162839e-07,
"loss": 0.02691877484321594,
"step": 5210
},
{
"epoch": 46.607142857142854,
"grad_norm": 0.5014402866363525,
"learning_rate": 8.420496386768195e-07,
"loss": 0.02660224735736847,
"step": 5220
},
{
"epoch": 46.69642857142857,
"grad_norm": 0.5916736125946045,
"learning_rate": 7.986222461865455e-07,
"loss": 0.021325075626373292,
"step": 5230
},
{
"epoch": 46.785714285714285,
"grad_norm": 0.4295494258403778,
"learning_rate": 7.563294480258798e-07,
"loss": 0.019958339631557465,
"step": 5240
},
{
"epoch": 46.875,
"grad_norm": 0.30950236320495605,
"learning_rate": 7.151728874449848e-07,
"loss": 0.026697978377342224,
"step": 5250
},
{
"epoch": 46.964285714285715,
"grad_norm": 0.481393426656723,
"learning_rate": 6.751541635465075e-07,
"loss": 0.023805753886699678,
"step": 5260
},
{
"epoch": 47.0,
"eval_accuracy_background": null,
"eval_accuracy_crop": 0.9916805123025328,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9916805123025328,
"eval_loss": 0.04457485303282738,
"eval_mean_accuracy": 0.9916805123025328,
"eval_mean_iou": 0.4958402561512664,
"eval_overall_accuracy": 0.9916805123025328,
"eval_runtime": 3.1185,
"eval_samples_per_second": 50.666,
"eval_steps_per_second": 6.413,
"step": 5264
},
{
"epoch": 47.05357142857143,
"grad_norm": 0.4641105830669403,
"learning_rate": 6.362748312234223e-07,
"loss": 0.02568671405315399,
"step": 5270
},
{
"epoch": 47.142857142857146,
"grad_norm": 0.5612961649894714,
"learning_rate": 5.985364010986261e-07,
"loss": 0.02504618465900421,
"step": 5280
},
{
"epoch": 47.232142857142854,
"grad_norm": 0.7722740173339844,
"learning_rate": 5.619403394662614e-07,
"loss": 0.028320273756980895,
"step": 5290
},
{
"epoch": 47.32142857142857,
"grad_norm": 0.5712404251098633,
"learning_rate": 5.264880682347095e-07,
"loss": 0.025172898173332216,
"step": 5300
},
{
"epoch": 47.410714285714285,
"grad_norm": 0.448178231716156,
"learning_rate": 4.921809648713737e-07,
"loss": 0.025293144583702087,
"step": 5310
},
{
"epoch": 47.5,
"grad_norm": 0.8815834522247314,
"learning_rate": 4.590203623491429e-07,
"loss": 0.025543418526649476,
"step": 5320
},
{
"epoch": 47.589285714285715,
"grad_norm": 0.6897329688072205,
"learning_rate": 4.270075490946124e-07,
"loss": 0.023450803756713868,
"step": 5330
},
{
"epoch": 47.67857142857143,
"grad_norm": 0.2958068549633026,
"learning_rate": 3.9614376893800763e-07,
"loss": 0.021414244174957277,
"step": 5340
},
{
"epoch": 47.767857142857146,
"grad_norm": 0.438213586807251,
"learning_rate": 3.664302210648729e-07,
"loss": 0.02141619473695755,
"step": 5350
},
{
"epoch": 47.857142857142854,
"grad_norm": 0.6407127976417542,
"learning_rate": 3.378680599694617e-07,
"loss": 0.02390940934419632,
"step": 5360
},
{
"epoch": 47.94642857142857,
"grad_norm": 0.6588020324707031,
"learning_rate": 3.1045839540989273e-07,
"loss": 0.023431585729122163,
"step": 5370
},
{
"epoch": 48.0,
"eval_accuracy_background": null,
"eval_accuracy_crop": 0.9918207636596241,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9918207636596241,
"eval_loss": 0.04451696202158928,
"eval_mean_accuracy": 0.9918207636596241,
"eval_mean_iou": 0.49591038182981206,
"eval_overall_accuracy": 0.9918207636596241,
"eval_runtime": 3.1745,
"eval_samples_per_second": 49.771,
"eval_steps_per_second": 6.3,
"step": 5376
},
{
"epoch": 48.035714285714285,
"grad_norm": 0.23221944272518158,
"learning_rate": 2.842022923650278e-07,
"loss": 0.026059791445732117,
"step": 5380
},
{
"epoch": 48.125,
"grad_norm": 0.4213135540485382,
"learning_rate": 2.5910077099309147e-07,
"loss": 0.023841065168380738,
"step": 5390
},
{
"epoch": 48.214285714285715,
"grad_norm": 0.47122108936309814,
"learning_rate": 2.3515480659202616e-07,
"loss": 0.025115084648132325,
"step": 5400
},
{
"epoch": 48.30357142857143,
"grad_norm": 0.7628607749938965,
"learning_rate": 2.123653295616157e-07,
"loss": 0.02465710639953613,
"step": 5410
},
{
"epoch": 48.392857142857146,
"grad_norm": 0.4654390513896942,
"learning_rate": 1.9073322536732107e-07,
"loss": 0.023554743826389314,
"step": 5420
},
{
"epoch": 48.482142857142854,
"grad_norm": 0.433553546667099,
"learning_rate": 1.7025933450587784e-07,
"loss": 0.025577667355537414,
"step": 5430
},
{
"epoch": 48.57142857142857,
"grad_norm": 0.8381280303001404,
"learning_rate": 1.509444524726489e-07,
"loss": 0.023599877953529358,
"step": 5440
},
{
"epoch": 48.660714285714285,
"grad_norm": 0.5404291749000549,
"learning_rate": 1.3278932973070257e-07,
"loss": 0.02920941114425659,
"step": 5450
},
{
"epoch": 48.75,
"grad_norm": 0.5444062352180481,
"learning_rate": 1.1579467168166269e-07,
"loss": 0.025456267595291137,
"step": 5460
},
{
"epoch": 48.839285714285715,
"grad_norm": 0.489740252494812,
"learning_rate": 9.996113863830369e-08,
"loss": 0.023142220079898836,
"step": 5470
},
{
"epoch": 48.92857142857143,
"grad_norm": 0.40527722239494324,
"learning_rate": 8.528934579888459e-08,
"loss": 0.02229561060667038,
"step": 5480
},
{
"epoch": 49.0,
"eval_accuracy_background": null,
"eval_accuracy_crop": 0.9914031971191933,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.9914031971191933,
"eval_loss": 0.04447474330663681,
"eval_mean_accuracy": 0.9914031971191933,
"eval_mean_iou": 0.49570159855959667,
"eval_overall_accuracy": 0.9914031971191933,
"eval_runtime": 3.066,
"eval_samples_per_second": 51.533,
"eval_steps_per_second": 6.523,
"step": 5488
},
{
"epoch": 49.017857142857146,
"grad_norm": 1.488918662071228,
"learning_rate": 7.177986322325137e-08,
"loss": 0.026862525939941408,
"step": 5490
},
{
"epoch": 49.107142857142854,
"grad_norm": 0.9656788110733032,
"learning_rate": 5.943321581069139e-08,
"loss": 0.027856603264808655,
"step": 5500
},
{
"epoch": 49.19642857142857,
"grad_norm": 1.4815126657485962,
"learning_rate": 4.824988327953639e-08,
"loss": 0.027299723029136656,
"step": 5510
},
{
"epoch": 49.285714285714285,
"grad_norm": 0.2918512225151062,
"learning_rate": 3.823030014851403e-08,
"loss": 0.021877503395080565,
"step": 5520
},
{
"epoch": 49.375,
"grad_norm": 0.4252746105194092,
"learning_rate": 2.9374855719884742e-08,
"loss": 0.026218003034591673,
"step": 5530
},
{
"epoch": 49.464285714285715,
"grad_norm": 0.2831713557243347,
"learning_rate": 2.168389406429716e-08,
"loss": 0.025749343633651733,
"step": 5540
},
{
"epoch": 49.55357142857143,
"grad_norm": 0.4766254127025604,
"learning_rate": 1.5157714007425495e-08,
"loss": 0.023514069616794586,
"step": 5550
},
{
"epoch": 49.642857142857146,
"grad_norm": 0.9032825827598572,
"learning_rate": 9.796569118368793e-09,
"loss": 0.027806323766708375,
"step": 5560
},
{
"epoch": 49.732142857142854,
"grad_norm": 0.3083033263683319,
"learning_rate": 5.60066769977885e-09,
"loss": 0.022344766557216643,
"step": 5570
},
{
"epoch": 49.82142857142857,
"grad_norm": 0.4118826985359192,
"learning_rate": 2.570172779789992e-09,
"loss": 0.02296028733253479,
"step": 5580
},
{
"epoch": 49.910714285714285,
"grad_norm": 0.44650617241859436,
"learning_rate": 7.052021056608293e-10,
"loss": 0.02406269907951355,
"step": 5590
},
{
"epoch": 50.0,
"grad_norm": 0.5170707106590271,
"learning_rate": 5.8281392212311545e-12,
"loss": 0.02451837360858917,
"step": 5600
},
{
"epoch": 50.0,
"eval_accuracy_background": null,
"eval_accuracy_crop": 0.991746323545392,
"eval_iou_background": 0.0,
"eval_iou_crop": 0.991746323545392,
"eval_loss": 0.04466014727950096,
"eval_mean_accuracy": 0.991746323545392,
"eval_mean_iou": 0.495873161772696,
"eval_overall_accuracy": 0.991746323545392,
"eval_runtime": 2.9949,
"eval_samples_per_second": 52.756,
"eval_steps_per_second": 6.678,
"step": 5600
},
{
"epoch": 50.0,
"step": 5600,
"total_flos": 7.834996118126592e+17,
"train_loss": 0.05321301036647388,
"train_runtime": 744.0706,
"train_samples_per_second": 60.075,
"train_steps_per_second": 7.526
}
],
"logging_steps": 10,
"max_steps": 5600,
"num_input_tokens_seen": 0,
"num_train_epochs": 50,
"save_steps": 500,
"stateful_callbacks": {
"TrainerControl": {
"args": {
"should_epoch_stop": false,
"should_evaluate": false,
"should_log": false,
"should_save": true,
"should_training_stop": true
},
"attributes": {}
}
},
"total_flos": 7.834996118126592e+17,
"train_batch_size": 8,
"trial_name": null,
"trial_params": null
}